From 9de2b3789a11c8cf9a1d37e145e93203f5475300 Mon Sep 17 00:00:00 2001
From: ActivePeter <1020401660@qq.com>
Date: Sat, 20 Jun 2026 13:45:44 +0800
Subject: [PATCH 01/13] fix: doc page url in readme

---
 README.md    | 25 +++++++++++++------------
 README_CN.md | 25 +++++++++++++------------
 2 files changed, 26 insertions(+), 24 deletions(-)
diff --git a/README.md b/README.md
index 53a2110..3f4cd2f 100644
--- a/README.md
+++ b/README.md
@@ -10,7 +10,7 @@
 [![Latest](https://img.shields.io/badge/Latest-v0.2.1-f28500)](./fluxon_release)
 [![Interfaces](https://img.shields.io/badge/Interfaces-KV%2FRPC%20%7C%20MQ%20%7C%20FS-1f6feb)](#interface-capabilities)
 
-[English](./README.md) | [中文](./README_CN.md) | [Docs](https://tele-ai.github.io/fluxon/) | [中文文档](https://tele-ai.github.io/fluxon/cn/) | <a href="https://github.com/Tele-AI/fluxon" title="GitHub Repository"><img src="https://github.githubassets.com/images/modules/logos_page/GitHub-Mark.png" width="18" height="18" alt="GitHub repository" /></a>
+[English](./README.md) | [中文](./README_CN.md) | [Docs](https://tele-ai.github.io/Fluxon/) | [中文文档](https://tele-ai.github.io/Fluxon/cn/) | <a href="https://github.com/Tele-AI/Fluxon" title="GitHub Repository"><img src="https://github.githubassets.com/images/modules/logos_page/GitHub-Mark.png" width="18" height="18" alt="GitHub repository" /></a>
 
 </div>
 
@@ -145,7 +145,7 @@ The benchmark results show that small-file reads and large-file writes are alrea
 
 ## 🚀 Quick Start
 
-Quick Start is the shortest path to try Fluxon. For formal installation, deployment, and operations, see [User Docs](https://tele-ai.github.io/fluxon/user_doc/).
+Quick Start is the shortest path to try Fluxon. For formal installation, deployment, and operations, see [User Docs](https://tele-ai.github.io/Fluxon/user_doc/).
 
 ### KV Quick Start
 
@@ -178,7 +178,7 @@ Open the printed link to view the KV Web UI:
 
 Related interface docs:
 
-- [KV and RPC Interface](https://tele-ai.github.io/fluxon/user_doc/User---3---KV-and-RPC-Interface/)
+- [KV and RPC Interface](https://tele-ai.github.io/Fluxon/user_doc/User---3---KV-and-RPC-Interface/)
 
 ### MQ Quick Start
 
@@ -209,7 +209,7 @@ Runtime view:
 
 Related interface docs:
 
-- [MQ Interface](https://tele-ai.github.io/fluxon/user_doc/User---4---MQ-Interface/)
+- [MQ Interface](https://tele-ai.github.io/Fluxon/user_doc/User---4---MQ-Interface/)
 
 ### FS Quick Start
 
@@ -247,7 +247,7 @@ Open the printed link to view the FS Web UI:
 
 Related interface docs:
 
-- [FS Interface](https://tele-ai.github.io/fluxon/user_doc/User---5---FS-Interface/)
+- [FS Interface](https://tele-ai.github.io/Fluxon/user_doc/User---5---FS-Interface/)
 
 <a id="repository-structure"></a>
 
@@ -267,17 +267,18 @@ Related interface docs:
 
 Contributions are welcome. Before you start, please read the developer docs on GitHub Pages:
 
-- [Developer Docs](https://tele-ai.github.io/fluxon/dev_doc/)
-- [Developer - 1 - Package core install artifacts](https://tele-ai.github.io/fluxon/dev_doc/Developer---1---Package-Core-Install-Artifacts/)
-- [Developer - 2 - Package middleware and images](https://tele-ai.github.io/fluxon/dev_doc/Developer---2---Package-Middleware-and-Images/)
-- [Developer - 4 - Publish a release](https://tele-ai.github.io/fluxon/dev_doc/Developer---4---Publish-a-Release/)
+- [Developer Docs](https://tele-ai.github.io/Fluxon/dev_doc/)
+- [Developer - 1 - Package core install artifacts](https://tele-ai.github.io/Fluxon/dev_doc/Developer---1---Package-Core-Install-Artifacts/)
+- [Developer - 2 - Package middleware and images](https://tele-ai.github.io/Fluxon/dev_doc/Developer---2---Package-Middleware-and-Images/)
+- [Developer - 3 - Documentation writing rules](https://tele-ai.github.io/Fluxon/dev_doc/Developer---3---Documentation-Writing-Rules/)
+- [Developer - 4 - Publish a release](https://tele-ai.github.io/Fluxon/dev_doc/Developer---4---Publish-a-Release/)
 
 <a id="contributors"></a>
 
 ## 👥 Contributors
 
-<a href="https://github.com/Tele-AI/fluxon/graphs/contributors">
-  <img src="https://contrib.rocks/image?repo=Tele-AI/fluxon" />
+<a href="https://github.com/Tele-AI/Fluxon/graphs/contributors">
+  <img src="https://contrib.rocks/image?repo=Tele-AI/Fluxon" />
 </a>
 
 Some earlier contribution records are no longer fully reflected in the current commit history. Historical highlights:
@@ -312,4 +313,4 @@ Fluxon is open-sourced under Apache License 2.0, see [LICENSE](./LICENSE).
 
 ## ⭐ Stargazers over time
 
-[![Star History Chart](https://api.star-history.com/chart?repos=Tele-AI/fluxon&type=date&legend=top-left)](https://www.star-history.com/?repos=Tele-AI%2Ffluxon&type=date&legend=top-left)
+[![Star History Chart](https://api.star-history.com/chart?repos=Tele-AI/Fluxon&type=date&legend=top-left)](https://www.star-history.com/?repos=Tele-AI%2FFluxon&type=date&legend=top-left)
diff --git a/README_CN.md b/README_CN.md
index 715511b..da2cdb4 100644
--- a/README_CN.md
+++ b/README_CN.md
@@ -20,7 +20,7 @@
 [![Latest](https://img.shields.io/badge/Latest-v0.2.1-f28500)](./fluxon_release)
 [![Interfaces](https://img.shields.io/badge/Interfaces-KV%2FRPC%20%7C%20MQ%20%7C%20FS-1f6feb)](#接口能力)
 
-[中文](./README_CN.md) | [English](./README.md) | [用户文档](https://tele-ai.github.io/fluxon/cn/) | [English Docs](https://tele-ai.github.io/fluxon/) | <a href="https://github.com/Tele-AI/fluxon" title="GitHub 仓库"><img src="https://github.githubassets.com/images/modules/logos_page/GitHub-Mark.png" width="18" height="18" alt="GitHub repository" /></a>
+[中文](./README_CN.md) | [English](./README.md) | [用户文档](https://tele-ai.github.io/Fluxon/cn/) | [English Docs](https://tele-ai.github.io/Fluxon/) | <a href="https://github.com/Tele-AI/Fluxon" title="GitHub 仓库"><img src="https://github.githubassets.com/images/modules/logos_page/GitHub-Mark.png" width="18" height="18" alt="GitHub repository" /></a>
 
 </div>
 
@@ -147,7 +147,7 @@ benchmark 显示，小文件读和大文件写已显著领先 `Alluxio`，大文
 
 ## 🚀 快速开始
 
-Quick Start 用于最短路径体验；正式安装、部署和运维入口见 [用户文档](https://tele-ai.github.io/fluxon/cn/user_doc/)。
+Quick Start 用于最短路径体验；正式安装、部署和运维入口见 [用户文档](https://tele-ai.github.io/Fluxon/cn/user_doc/)。
 
 ### KV 快速开始
 
@@ -180,7 +180,7 @@ del demo:hello
 
 对应接口文档：
 
-- [KV 和 RPC 接口](https://tele-ai.github.io/fluxon/cn/user_doc/%E7%94%A8%E6%88%B7---3---KV-RPC%E6%8E%A5%E5%8F%A3/)
+- [KV 和 RPC 接口](https://tele-ai.github.io/Fluxon/cn/user_doc/%E7%94%A8%E6%88%B7---3---KV-RPC%E6%8E%A5%E5%8F%A3/)
 
 ### MQ 快速开始
 
@@ -211,7 +211,7 @@ exit
 
 对应接口文档：
 
-- [MQ 接口](https://tele-ai.github.io/fluxon/cn/user_doc/%E7%94%A8%E6%88%B7---4---MQ%E6%8E%A5%E5%8F%A3/)
+- [MQ 接口](https://tele-ai.github.io/Fluxon/cn/user_doc/%E7%94%A8%E6%88%B7---4---MQ%E6%8E%A5%E5%8F%A3/)
 
 ### FS 快速开始
 
@@ -249,7 +249,7 @@ FS Quick Start 会额外打印：
 
 对应接口文档：
 
-- [FS 接口](https://tele-ai.github.io/fluxon/cn/user_doc/%E7%94%A8%E6%88%B7---5---FS%E6%8E%A5%E5%8F%A3/)
+- [FS 接口](https://tele-ai.github.io/Fluxon/cn/user_doc/%E7%94%A8%E6%88%B7---5---FS%E6%8E%A5%E5%8F%A3/)
 
 <a id="项目结构"></a>
 
@@ -269,17 +269,18 @@ FS Quick Start 会额外打印：
 
 欢迎参与贡献。开始之前，建议先阅读 GitHub Pages 上的开发者文档：
 
-- [开发者文档总入口](https://tele-ai.github.io/fluxon/cn/dev_doc/)
-- [开发者 - 1 - 打包核心安装包](https://tele-ai.github.io/fluxon/cn/dev_doc/%E5%BC%80%E5%8F%91%E8%80%85---1---%E6%89%93%E5%8C%85%E6%A0%B8%E5%BF%83%E5%AE%89%E8%A3%85%E5%8C%85/)
-- [开发者 - 2 - 打包中间件和镜像](https://tele-ai.github.io/fluxon/cn/dev_doc/%E5%BC%80%E5%8F%91%E8%80%85---2---%E6%89%93%E5%8C%85%E4%B8%AD%E9%97%B4%E4%BB%B6%E5%92%8C%E9%95%9C%E5%83%8F/)
-- [开发者 - 4 - 发布 Release](https://tele-ai.github.io/fluxon/cn/dev_doc/%E5%BC%80%E5%8F%91%E8%80%85---4---%E5%8F%91%E5%B8%83-Release/)
+- [开发者文档总入口](https://tele-ai.github.io/Fluxon/cn/dev_doc/)
+- [开发者 - 1 - 打包核心安装包](https://tele-ai.github.io/Fluxon/cn/dev_doc/%E5%BC%80%E5%8F%91%E8%80%85---1---%E6%89%93%E5%8C%85%E6%A0%B8%E5%BF%83%E5%AE%89%E8%A3%85%E5%8C%85/)
+- [开发者 - 2 - 打包中间件和镜像](https://tele-ai.github.io/Fluxon/cn/dev_doc/%E5%BC%80%E5%8F%91%E8%80%85---2---%E6%89%93%E5%8C%85%E4%B8%AD%E9%97%B4%E4%BB%B6%E5%92%8C%E9%95%9C%E5%83%8F/)
+- [开发者 - 3 - 文档写作规约](https://tele-ai.github.io/Fluxon/cn/dev_doc/%E5%BC%80%E5%8F%91%E8%80%85---3---%E6%96%87%E6%A1%A3%E5%86%99%E4%BD%9C%E8%A7%84%E7%BA%A6/)
+- [开发者 - 4 - 发布 Release](https://tele-ai.github.io/Fluxon/cn/dev_doc/%E5%BC%80%E5%8F%91%E8%80%85---4---%E5%8F%91%E5%B8%83-Release/)
 
 <a id="contributors"></a>
 
 ## 👥 Contributors
 
-<a href="https://github.com/Tele-AI/fluxon/graphs/contributors">
-  <img src="https://contrib.rocks/image?repo=Tele-AI/fluxon" />
+<a href="https://github.com/Tele-AI/Fluxon/graphs/contributors">
+  <img src="https://contrib.rocks/image?repo=Tele-AI/Fluxon" />
 </a>
 
 部分更早期的贡献记录已经无法从当前 commit 历史里完整反映，这里补充说明：
@@ -314,4 +315,4 @@ Fluxon 基于 Apache License 2.0 开源，见 [LICENSE](./LICENSE)。
 
 ## ⭐ Star 增长趋势
 
-[![Star History Chart](https://api.star-history.com/chart?repos=Tele-AI/fluxon&type=date&legend=top-left)](https://www.star-history.com/?repos=Tele-AI%2Ffluxon&type=date&legend=top-left)
+[![Star History Chart](https://api.star-history.com/chart?repos=Tele-AI/Fluxon&type=date&legend=top-left)](https://www.star-history.com/?repos=Tele-AI%2FFluxon&type=date&legend=top-left)

From cf6c5c09a306bc354f5deeb85b302ebc2afd34c8 Mon Sep 17 00:00:00 2001
From: ActivePeter <1020401660@qq.com>
Date: Mon, 22 Jun 2026 18:02:48 +0800
Subject: [PATCH 02/13] feat: template-based bare deploy codegen, log sharding, and log_mgmt CI scene

---
 .github/workflows/all_test.yml                |   9 +-
 deployment/gen_bare_deploy_bash.py            | 588 ++++-------
 .../atomic_group_node_resolution_tail.sh.tmpl |  14 +
 .../atomic_group_service_block.sh.tmpl        |  24 +
 .../atomic_group_start.sh.tmpl                |   7 +
 .../atomic_group_stop.sh.tmpl                 |   6 +
 .../bare_entrypoint.sh.tmpl                   |   5 +
 .../common_node_resolution_tail.sh.tmpl       |  15 +
 .../etcd_health_wait_block.sh.tmpl            |   4 +
 .../gen_bare_deploy_bash/host_prelude.sh.tmpl |  57 +
 .../selection_present_probe_fn.sh.tmpl        |  19 +
 ...ction_supervisor_launch_wait_block.sh.tmpl |   9 +
 ...on_supervisor_path_from_script_dir.sh.tmpl |   7 +
 .../standalone_start.sh.tmpl                  |   6 +
 .../standalone_start_body.sh.tmpl             |  27 +
 .../standalone_stop.sh.tmpl                   |  15 +
 .../start_lock_block.sh.tmpl                  |  14 +
 .../tcp_ready_helpers.sh.tmpl                 | 120 +++
 .../tcp_ready_wait_block.sh.tmpl              |   6 +
 deployment/tests/test_gen_bare_deploy_bash.py | 153 ++-
 deployment/tests/test_gen_k8s_daemonset.py    |   2 +-
 deployment/tests/test_log_shard.py            | 117 ++
 .../test_selection_supervisor_codegen.py      | 191 +++-
 .../test_start_test_bed_bootstrap_log.py      |  33 +-
 deployment/utils/log_shard.py                 | 196 ++++
 deployment/utils/proc_lifecycle_codegen.py    |  41 +-
 .../utils/selection_supervisor_codegen.py     |  90 +-
 ...15\347\275\256\346\200\273\350\247\210.md" | 217 ++++
 ...74\345\207\272\351\223\276\350\267\257.md" | 414 ++++++++
 fluxon_py/config.py                           |  15 +
 fluxon_py/tests/test_config.py                |  49 +
 fluxon_rs/Cargo.lock                          |   2 +
 fluxon_rs/fluxon_fs/src/agent.rs              |   8 +-
 .../fluxon_kv/src/client_seg_pool/mod.rs      |  23 +
 fluxon_rs/fluxon_kv/src/config.rs             | 150 ++-
 .../external_client_test.rs                   |  12 +-
 .../fluxon_kv/src/external_client_api/mod.rs  |   7 +
 fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs    |   4 +
 fluxon_rs/fluxon_kv/src/lib.rs                | 653 +++++++-----
 .../fluxon_kv/src/memholder/memholder_test.rs |   8 +
 fluxon_rs/fluxon_ops/Cargo.toml               |   4 +
 fluxon_rs/fluxon_ops/build.rs                 |  13 +
 fluxon_rs/fluxon_ops/src/lib.rs               | 250 ++++-
 fluxon_rs/fluxon_util/build.rs                |  19 +-
 fluxon_rs/fluxon_util/src/lib.rs              |   7 +-
 fluxon_rs/fluxon_util/src/log.rs              | 380 +++++--
 fluxon_rs/fluxon_util/tests/log_mgmt.rs       | 120 +++
 fluxon_test_stack/ci_2_virt_node.py           |   2 +
 fluxon_test_stack/ci_test_list.yaml           |  16 +
 fluxon_test_stack/deployconf_testbed.yml      |   5 +-
 fluxon_test_stack/pack_test_stack_rsc.py      | 261 +----
 fluxon_test_stack/start_test_bed.py           |  32 +-
 fluxon_test_stack/test_runner.py              | 284 +++--
 ...fluxon_fs_s3_download_and_exec.sh.template | 108 ++
 fluxon_test_stack/test_runner_ui.py           |   4 +
 .../tests/test_ci_2_virt_node_contract.py     |  97 +-
 .../tests/test_pack_test_stack_rsc_cli.py     | 125 ++-
 .../tests/test_runner_contract.py             |  50 +
 .../test_test_runner_testbed_contract.py      |  99 ++
 .../tests/test_test_runner_ui_contract.py     |  37 +-
 .../test_top_attention_log_mgmt_contract.py   | 112 ++
 .../top_attention_test_index/README.md        |   1 +
 .../top_attention_test_index/_log_mgmt.py     |  54 +
 scripts/git_source_selection.py               | 163 +++
 scripts/source_selection_profiles.py          | 134 +++
 setup_and_pack/nix/lib_layout.py              |  35 +-
 setup_and_pack/nix/pack_fluxonkv_pylib.py     | 232 +---
 setup_and_pack/public_workspace_contract.py   |  56 +-
 .../tests/test_git_source_selection_utils.py  | 182 ++++
 setup_and_pack/tests/test_lib_layout.py       |   7 +
 ...est_pack_fluxonkv_pylib_bridge_prebuilt.py |  33 +
 setup_and_pack/utils/__init__.py              |   2 +
 .../utils/artifact_cache_digest_utils.py      |  29 +-
 skills/browser-helm/SKILL.md                  | 232 ++++
 skills/browser-helm/agents/openai.yaml        |   6 +
 skills/browser-helm/references/commands.md    | 131 +++
 skills/canvas-dag_organizer-v1/SKILL.md       |  10 +
 .../agents/openai.yaml                        |   6 +
 skills/canvas-ops-v1/SKILL.md                 |  10 +
 skills/canvas-ops-v1/agents/openai.yaml       |   6 +
 skills/canvas-tidy_selection-v1/SKILL.md      |  10 +
 .../agents/openai.yaml                        |   6 +
 skills/find-skills/SKILL.md                   | 133 +++
 skills/imagegen/LICENSE.txt                   | 201 ++++
 skills/imagegen/SKILL.md                      | 356 +++++++
 skills/imagegen/agents/openai.yaml            |   6 +
 skills/imagegen/assets/imagegen-small.svg     |   5 +
 skills/imagegen/assets/imagegen.png           | Bin 0 -> 1711 bytes
 skills/imagegen/references/cli.md             | 242 +++++
 skills/imagegen/references/codex-network.md   |  33 +
 skills/imagegen/references/image-api.md       |  90 ++
 skills/imagegen/references/prompting.md       | 118 +++
 skills/imagegen/references/sample-prompts.md  | 433 ++++++++
 skills/imagegen/scripts/image_gen.py          | 995 ++++++++++++++++++
 skills/imagegen/scripts/remove_chroma_key.py  | 440 ++++++++
 skills/openai-docs/LICENSE.txt                | 201 ++++
 skills/openai-docs/SKILL.md                   | 167 +++
 skills/openai-docs/agents/openai.yaml         |  14 +
 skills/openai-docs/assets/openai-small.svg    |   3 +
 skills/openai-docs/assets/openai.png          | Bin 0 -> 1429 bytes
 skills/openai-docs/references/latest-model.md |  37 +
 .../openai-docs/references/prompting-guide.md | 244 +++++
 .../openai-docs/references/upgrade-guide.md   | 181 ++++
 .../scripts/fetch-codex-manual.mjs            | 598 +++++++++++
 .../scripts/resolve-latest-model-info.js      | 147 +++
 skills/plugin-creator/SKILL.md                | 243 +++++
 skills/plugin-creator/agents/openai.yaml      |   6 +
 .../assets/plugin-creator-small.svg           |   3 +
 .../plugin-creator/assets/plugin-creator.png  | Bin 0 -> 1563 bytes
 .../references/installing-and-updating.md     | 143 +++
 .../references/plugin-json-spec.md            | 194 ++++
 .../scripts/create_basic_plugin.py            | 324 ++++++
 .../scripts/read_marketplace_name.py          |  48 +
 .../scripts/update_plugin_cachebuster.py      |  78 ++
 .../plugin-creator/scripts/validate_plugin.py | 593 +++++++++++
 .../SKILL.md                                  |  11 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  10 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  10 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  10 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  10 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  16 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  27 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  10 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  10 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  10 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  10 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  10 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  10 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  10 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  10 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  10 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  15 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  10 +
 .../agents/openai.yaml                        |   6 +
 .../SKILL.md                                  |  10 +
 .../agents/openai.yaml                        |   6 +
 skills/rs-skill-smoke-09e1daf7/SKILL.md       |   8 +
 skills/rs-skill-smoke-529efbc9/SKILL.md       |   8 +
 skills/rs-skill-smoke-cde1029f/SKILL.md       |   8 +
 skills/skill-creator/SKILL.md                 | 416 ++++++++
 skills/skill-creator/agents/openai.yaml       |   5 +
 .../assets/skill-creator-small.svg            |   3 +
 skills/skill-creator/assets/skill-creator.png | Bin 0 -> 1563 bytes
 skills/skill-creator/license.txt              | 202 ++++
 .../skill-creator/references/openai_yaml.md   |  49 +
 .../scripts/generate_openai_yaml.py           | 226 ++++
 skills/skill-creator/scripts/init_skill.py    | 400 +++++++
 .../skill-creator/scripts/quick_validate.py   | 101 ++
 skills/skill-installer/LICENSE.txt            | 202 ++++
 skills/skill-installer/SKILL.md               |  58 +
 skills/skill-installer/agents/openai.yaml     |   5 +
 .../assets/skill-installer-small.svg          |   3 +
 .../assets/skill-installer.png                | Bin 0 -> 1086 bytes
 .../skill-installer/scripts/github_utils.py   |  21 +
 .../scripts/install-skill-from-github.py      | 308 ++++++
 skills/skill-installer/scripts/list-skills.py | 107 ++
 173 files changed, 13984 insertions(+), 1462 deletions(-)
 create mode 100644 deployment/templates/gen_bare_deploy_bash/atomic_group_node_resolution_tail.sh.tmpl
 create mode 100644 deployment/templates/gen_bare_deploy_bash/atomic_group_service_block.sh.tmpl
 create mode 100644 deployment/templates/gen_bare_deploy_bash/atomic_group_start.sh.tmpl
 create mode 100644 deployment/templates/gen_bare_deploy_bash/atomic_group_stop.sh.tmpl
 create mode 100644 deployment/templates/gen_bare_deploy_bash/bare_entrypoint.sh.tmpl
 create mode 100644 deployment/templates/gen_bare_deploy_bash/common_node_resolution_tail.sh.tmpl
 create mode 100644 deployment/templates/gen_bare_deploy_bash/etcd_health_wait_block.sh.tmpl
 create mode 100644 deployment/templates/gen_bare_deploy_bash/host_prelude.sh.tmpl
 create mode 100644 deployment/templates/gen_bare_deploy_bash/selection_present_probe_fn.sh.tmpl
 create mode 100644 deployment/templates/gen_bare_deploy_bash/selection_supervisor_launch_wait_block.sh.tmpl
 create mode 100644 deployment/templates/gen_bare_deploy_bash/selection_supervisor_path_from_script_dir.sh.tmpl
 create mode 100644 deployment/templates/gen_bare_deploy_bash/standalone_start.sh.tmpl
 create mode 100644 deployment/templates/gen_bare_deploy_bash/standalone_start_body.sh.tmpl
 create mode 100644 deployment/templates/gen_bare_deploy_bash/standalone_stop.sh.tmpl
 create mode 100644 deployment/templates/gen_bare_deploy_bash/start_lock_block.sh.tmpl
 create mode 100644 deployment/templates/gen_bare_deploy_bash/tcp_ready_helpers.sh.tmpl
 create mode 100644 deployment/templates/gen_bare_deploy_bash/tcp_ready_wait_block.sh.tmpl
 create mode 100644 deployment/tests/test_log_shard.py
 create mode 100644 deployment/utils/log_shard.py
 create mode 100644 "fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
 create mode 100644 "fluxon_doc_cn/design/log_1_\346\234\254\345\234\260\346\226\207\344\273\266\346\227\245\345\277\227\344\270\216Greptime_OTLP\345\257\274\345\207\272\351\223\276\350\267\257.md"
 create mode 100644 fluxon_rs/fluxon_util/tests/log_mgmt.rs
 create mode 100644 fluxon_test_stack/test_runner_templates/payload_fluxon_fs_s3_download_and_exec.sh.template
 create mode 100644 fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py
 create mode 100644 fluxon_test_stack/top_attention_test_index/_log_mgmt.py
 create mode 100644 scripts/git_source_selection.py
 create mode 100644 scripts/source_selection_profiles.py
 create mode 100644 setup_and_pack/tests/test_git_source_selection_utils.py
 create mode 100644 skills/browser-helm/SKILL.md
 create mode 100644 skills/browser-helm/agents/openai.yaml
 create mode 100644 skills/browser-helm/references/commands.md
 create mode 100644 skills/canvas-dag_organizer-v1/SKILL.md
 create mode 100644 skills/canvas-dag_organizer-v1/agents/openai.yaml
 create mode 100644 skills/canvas-ops-v1/SKILL.md
 create mode 100644 skills/canvas-ops-v1/agents/openai.yaml
 create mode 100644 skills/canvas-tidy_selection-v1/SKILL.md
 create mode 100644 skills/canvas-tidy_selection-v1/agents/openai.yaml
 create mode 100644 skills/find-skills/SKILL.md
 create mode 100644 skills/imagegen/LICENSE.txt
 create mode 100644 skills/imagegen/SKILL.md
 create mode 100644 skills/imagegen/agents/openai.yaml
 create mode 100644 skills/imagegen/assets/imagegen-small.svg
 create mode 100644 skills/imagegen/assets/imagegen.png
 create mode 100644 skills/imagegen/references/cli.md
 create mode 100644 skills/imagegen/references/codex-network.md
 create mode 100644 skills/imagegen/references/image-api.md
 create mode 100644 skills/imagegen/references/prompting.md
 create mode 100644 skills/imagegen/references/sample-prompts.md
 create mode 100644 skills/imagegen/scripts/image_gen.py
 create mode 100644 skills/imagegen/scripts/remove_chroma_key.py
 create mode 100644 skills/openai-docs/LICENSE.txt
 create mode 100644 skills/openai-docs/SKILL.md
 create mode 100644 skills/openai-docs/agents/openai.yaml
 create mode 100644 skills/openai-docs/assets/openai-small.svg
 create mode 100644 skills/openai-docs/assets/openai.png
 create mode 100644 skills/openai-docs/references/latest-model.md
 create mode 100644 skills/openai-docs/references/prompting-guide.md
 create mode 100644 skills/openai-docs/references/upgrade-guide.md
 create mode 100644 skills/openai-docs/scripts/fetch-codex-manual.mjs
 create mode 100644 skills/openai-docs/scripts/resolve-latest-model-info.js
 create mode 100644 skills/plugin-creator/SKILL.md
 create mode 100644 skills/plugin-creator/agents/openai.yaml
 create mode 100644 skills/plugin-creator/assets/plugin-creator-small.svg
 create mode 100644 skills/plugin-creator/assets/plugin-creator.png
 create mode 100644 skills/plugin-creator/references/installing-and-updating.md
 create mode 100644 skills/plugin-creator/references/plugin-json-spec.md
 create mode 100644 skills/plugin-creator/scripts/create_basic_plugin.py
 create mode 100644 skills/plugin-creator/scripts/read_marketplace_name.py
 create mode 100644 skills/plugin-creator/scripts/update_plugin_cachebuster.py
 create mode 100644 skills/plugin-creator/scripts/validate_plugin.py
 create mode 100644 skills/prompt-0ca565e9-3d44-45f1-832d-caa438aceddb/SKILL.md
 create mode 100644 skills/prompt-0ca565e9-3d44-45f1-832d-caa438aceddb/agents/openai.yaml
 create mode 100644 skills/prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971/SKILL.md
 create mode 100644 skills/prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971/agents/openai.yaml
 create mode 100644 skills/prompt-1323c8c8-88a0-40d2-89df-14fc9533a122/SKILL.md
 create mode 100644 skills/prompt-1323c8c8-88a0-40d2-89df-14fc9533a122/agents/openai.yaml
 create mode 100644 skills/prompt-144929a0-ae69-404b-9f58-a8696378e4e3/SKILL.md
 create mode 100644 skills/prompt-144929a0-ae69-404b-9f58-a8696378e4e3/agents/openai.yaml
 create mode 100644 skills/prompt-15d9a907-a363-4ec7-81ad-806f9418ad72/SKILL.md
 create mode 100644 skills/prompt-15d9a907-a363-4ec7-81ad-806f9418ad72/agents/openai.yaml
 create mode 100644 skills/prompt-193dd3cd-2722-413b-b88c-12c2af645f80/SKILL.md
 create mode 100644 skills/prompt-193dd3cd-2722-413b-b88c-12c2af645f80/agents/openai.yaml
 create mode 100644 skills/prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7/SKILL.md
 create mode 100644 skills/prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7/agents/openai.yaml
 create mode 100644 skills/prompt-2d53cebd-afd4-4d35-94e9-74436da3148a/SKILL.md
 create mode 100644 skills/prompt-2d53cebd-afd4-4d35-94e9-74436da3148a/agents/openai.yaml
 create mode 100644 skills/prompt-2eaed145-d789-4b27-93b9-8ea990830b3a/SKILL.md
 create mode 100644 skills/prompt-2eaed145-d789-4b27-93b9-8ea990830b3a/agents/openai.yaml
 create mode 100644 skills/prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb/SKILL.md
 create mode 100644 skills/prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb/agents/openai.yaml
 create mode 100644 skills/prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca/SKILL.md
 create mode 100644 skills/prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca/agents/openai.yaml
 create mode 100644 skills/prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8/SKILL.md
 create mode 100644 skills/prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8/agents/openai.yaml
 create mode 100644 skills/prompt-615e1231-fe33-47f8-bf35-29fdf3766d98/SKILL.md
 create mode 100644 skills/prompt-615e1231-fe33-47f8-bf35-29fdf3766d98/agents/openai.yaml
 create mode 100644 skills/prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2/SKILL.md
 create mode 100644 skills/prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2/agents/openai.yaml
 create mode 100644 skills/prompt-8c5cc431-635c-4c94-9deb-a502e77160eb/SKILL.md
 create mode 100644 skills/prompt-8c5cc431-635c-4c94-9deb-a502e77160eb/agents/openai.yaml
 create mode 100644 skills/prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c/SKILL.md
 create mode 100644 skills/prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c/agents/openai.yaml
 create mode 100644 skills/prompt-ac42abf9-6df8-4539-99c7-e402e905a03b/SKILL.md
 create mode 100644 skills/prompt-ac42abf9-6df8-4539-99c7-e402e905a03b/agents/openai.yaml
 create mode 100644 skills/prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315/SKILL.md
 create mode 100644 skills/prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315/agents/openai.yaml
 create mode 100644 skills/prompt-f118ab91-390b-48e2-a962-3abe4d54211e/SKILL.md
 create mode 100644 skills/prompt-f118ab91-390b-48e2-a962-3abe4d54211e/agents/openai.yaml
 create mode 100644 skills/rs-skill-smoke-09e1daf7/SKILL.md
 create mode 100644 skills/rs-skill-smoke-529efbc9/SKILL.md
 create mode 100644 skills/rs-skill-smoke-cde1029f/SKILL.md
 create mode 100644 skills/skill-creator/SKILL.md
 create mode 100644 skills/skill-creator/agents/openai.yaml
 create mode 100644 skills/skill-creator/assets/skill-creator-small.svg
 create mode 100644 skills/skill-creator/assets/skill-creator.png
 create mode 100644 skills/skill-creator/license.txt
 create mode 100644 skills/skill-creator/references/openai_yaml.md
 create mode 100644 skills/skill-creator/scripts/generate_openai_yaml.py
 create mode 100644 skills/skill-creator/scripts/init_skill.py
 create mode 100644 skills/skill-creator/scripts/quick_validate.py
 create mode 100644 skills/skill-installer/LICENSE.txt
 create mode 100644 skills/skill-installer/SKILL.md
 create mode 100644 skills/skill-installer/agents/openai.yaml
 create mode 100644 skills/skill-installer/assets/skill-installer-small.svg
 create mode 100644 skills/skill-installer/assets/skill-installer.png
 create mode 100644 skills/skill-installer/scripts/github_utils.py
 create mode 100644 skills/skill-installer/scripts/install-skill-from-github.py
 create mode 100644 skills/skill-installer/scripts/list-skills.py

diff --git a/.github/workflows/all_test.yml b/.github/workflows/all_test.yml
index 4300c60..33cdd5b 100644
--- a/.github/workflows/all_test.yml
+++ b/.github/workflows/all_test.yml
@@ -86,10 +86,15 @@ jobs:
           # Scene selection:
           # - ci_top_attention_doc_page_build keeps the doc-site build as a CI scene workload.
           # - ci_top_attention_bin_kvtest keeps the Rust kv_test entry under the same CI scene contract.
+          # - ci_top_attention_log_mgmt keeps log rolling/sharding coverage under the same CI scene contract.
           suite["scenes"] = {
               key: value
               for key, value in suite["scenes"].items()
-              if key in ("ci_top_attention_doc_page_build", "ci_top_attention_bin_kvtest")
+              if key in (
+                  "ci_top_attention_doc_page_build",
+                  "ci_top_attention_bin_kvtest",
+                  "ci_top_attention_log_mgmt",
+              )
           }
 
           # Profile selection:
@@ -107,11 +112,13 @@ jobs:
           suite["profiles"]["fluxon_tcp"]["runtime"]["ci"]["scene_configs"]["ci_top_attention_doc_page_build"]["doc_site_base_url"] = (
               "${{ github.repository_owner }}.github.io/${{ github.event.repository.name }}"
           )
+          suite["profiles"]["fluxon_tcp"]["runtime"]["ci"]["scene_configs"]["ci_top_attention_log_mgmt"]["enabled"] = True
 
           # Scale selection:
           # - Keep the original per-scene scales from ci_test_list.yaml.
           # - ci_top_attention_doc_page_build stays on n1_kvowner_dram_3gib.
           # - ci_top_attention_bin_kvtest stays on n1_kvowner_dram_20gib.
+          # - ci_top_attention_log_mgmt stays on n1_kvowner_dram_20gib.
 
           out_path.write_text(
               yaml.safe_dump(suite, sort_keys=False, allow_unicode=False),
diff --git a/deployment/gen_bare_deploy_bash.py b/deployment/gen_bare_deploy_bash.py
index ce51025..5503658 100644
--- a/deployment/gen_bare_deploy_bash.py
+++ b/deployment/gen_bare_deploy_bash.py
@@ -4,8 +4,10 @@
 import argparse
 import json
 import os
+import re
 import shlex
 import sys
+from functools import lru_cache
 from pathlib import Path
 from typing import Any, Dict, List
 
@@ -25,7 +27,9 @@
     StopTimeouts,
     render_bash_proc_lifecycle_funcs_pid_tree,
 )
+from log_shard import render_module_source as render_log_shard_module_source  # type: ignore
 from selection_supervisor_codegen import (  # type: ignore
+    LOG_SHARD_HELPER_FILENAME,
     PYTHON_SELECTION_SUPERVISOR_FILENAME,
     render_python_selection_supervisor_module,
 )
@@ -44,13 +48,36 @@
 ATOMIC_GROUP_CRASHLOOP_CONSECUTIVE_RESTARTS = 10
 ATOMIC_GROUP_CRASHLOOP_INTERVAL_LT_SECONDS = 30
 ATOMIC_GROUP_PROBABLE_READY_SECONDS = 10
-STANDALONE_PROBABLE_READY_SECONDS = 3
-STANDALONE_STARTUP_DEADLINE_SECONDS = 60
-ATOMIC_GROUP_STARTUP_DEADLINE_SECONDS = 10 * 60
+STANDALONE_PROBABLE_READY_SECONDS = 10
+STANDALONE_STARTUP_DEADLINE_SECONDS = 10
+ATOMIC_GROUP_STARTUP_DEADLINE_SECONDS = 10
 HOSTWORKDIR_RUNTIME_TOKEN = "${HOSTWORKDIR}"
 REPO_ROOT = SCRIPT_DIR.parent
-TCP_READY_STABLE_SECONDS = 2
-TCP_READY_POLL_INTERVAL_SECONDS = 0.2
+BARE_TEMPLATE_DIR = SCRIPT_DIR / "templates" / "gen_bare_deploy_bash"
+_TEMPLATE_TOKEN_RE = re.compile(r"\{\{([A-Z0-9_]+)\}\}")
+
+
+@lru_cache(maxsize=None)
+def _load_bare_template(*, template_name: str) -> str:
+    template_path = BARE_TEMPLATE_DIR / template_name
+    if not template_path.is_file():
+        raise RuntimeError(f"missing bare deploy template: {template_path}")
+    return template_path.read_text(encoding="utf-8")
+
+
+def _render_bare_template(*, template_name: str, values: Dict[str, str]) -> str:
+    template = _load_bare_template(template_name=template_name)
+
+    def _replace(match: re.Match[str]) -> str:
+        key = match.group(1)
+        if key not in values:
+            raise RuntimeError(f"missing bare deploy template value: template={template_name} key={key}")
+        value = values[key]
+        if not isinstance(value, str):
+            raise ValueError(f"bare deploy template value must be a string: template={template_name} key={key}")
+        return value
+
+    return _TEMPLATE_TOKEN_RE.sub(_replace, template)
 
 
 def _resolve_repo_root_cli_path(*, raw_path: Path, field_name: str) -> Path:
@@ -89,6 +116,10 @@ def main() -> None:
         outdir / PYTHON_SELECTION_SUPERVISOR_FILENAME,
         render_python_selection_supervisor_module(timeouts=STOP_TIMEOUTS),
     )
+    (outdir / LOG_SHARD_HELPER_FILENAME).write_text(
+        render_log_shard_module_source(),
+        encoding="utf-8",
+    )
 
     name_prefix = _require_str(cfg.get("name_prefix"), "name_prefix")
     cluster_nodes_raw = _require_list(cfg.get("cluster_nodes"), "cluster_nodes")
@@ -306,12 +337,12 @@ def _bare_entrypoint_script_name(*, workload_name: str) -> str:
 
 
 def _render_bare_entrypoint_script(*, service_name: str, entrypoint: str) -> str:
-    return (
-        "#!/usr/bin/env bash\n"
-        "set -euo pipefail\n\n"
-        f"export SERVICE={_sh_quote(service_name)}\n"
-        + entrypoint.strip()
-        + "\n"
+    return _render_bare_template(
+        template_name="bare_entrypoint.sh.tmpl",
+        values={
+            "SERVICE_EXPORT": _sh_quote(service_name),
+            "ENTRYPOINT": entrypoint.strip(),
+        },
     )
 
 
@@ -353,29 +384,25 @@ def _render_standalone_start_script(
     service_cfg: Dict[str, Any],
 ) -> str:
     allowed_nodes = _extract_nodes(service_cfg)
-    service_port = _extract_port(service_cfg)
-    port_export = ""
-    if service_port is not None:
-        port_export = f"export {service_name.upper()}__PORT={_sh_quote(str(service_port))}\n"
-    return (
-        "#!/usr/bin/env bash\n"
-        "set -euo pipefail\n\n"
-        f"SERVICE={_sh_quote(service_name)}\n"
-        f"NAME_PREFIX={_sh_quote(name_prefix)}\n"
-        + _render_nodes_bash(name="ALLOWED_NODES", nodes=allowed_nodes)
-        + _render_host_prelude(cluster_nodes=cluster_nodes)
-        + _render_common_node_resolution_tail(service_name=service_name)
-        + _render_selection_supervisor_path_from_script_dir()
-        + _render_proc_lifecycle_pid_tree_helpers()
-        + _render_tcp_ready_helpers()
-        + _render_selection_present_probe_fn()
-        + _render_start_lock_block()
-        + _render_global_env_exports(global_envs)
-        + port_export
-        + _render_standalone_start_body(
-            name_prefix=name_prefix,
-            service_name=service_name,
-        )
+    return _render_bare_template(
+        template_name="standalone_start.sh.tmpl",
+        values={
+            "SERVICE_ASSIGN": _sh_quote(service_name),
+            "NAME_PREFIX_ASSIGN": _sh_quote(name_prefix),
+            "ALLOWED_NODES_BLOCK": _render_nodes_bash(name="ALLOWED_NODES", nodes=allowed_nodes),
+            "HOST_PRELUDE": _render_host_prelude(cluster_nodes=cluster_nodes),
+            "COMMON_NODE_RESOLUTION_TAIL": _render_common_node_resolution_tail(service_name=service_name),
+            "SELECTION_SUPERVISOR_PATH_BLOCK": _render_selection_supervisor_path_from_script_dir(),
+            "PROC_LIFECYCLE_HELPERS": _render_proc_lifecycle_pid_tree_helpers(),
+            "SELECTION_PRESENT_PROBE_FN": _render_selection_present_probe_fn(),
+            "START_LOCK_BLOCK": _render_start_lock_block(),
+            "GLOBAL_ENV_EXPORTS": _render_global_env_exports(global_envs),
+            "PORT_EXPORT": _render_service_port_export(service_name=service_name, service_cfg=service_cfg),
+            "START_BODY": _render_standalone_start_body(
+                name_prefix=name_prefix,
+                service_name=service_name,
+            ),
+        },
     )
 
 
@@ -387,25 +414,19 @@ def _render_standalone_stop_script(
     service_cfg: Dict[str, Any],
 ) -> str:
     allowed_nodes = _extract_nodes(service_cfg)
-    return (
-        "#!/usr/bin/env bash\n"
-        "set -euo pipefail\n\n"
-        f"SERVICE={_sh_quote(service_name)}\n"
-        f"NAME_PREFIX={_sh_quote(name_prefix)}\n"
-        + _render_nodes_bash(name="ALLOWED_NODES", nodes=allowed_nodes)
-        + _render_host_prelude(cluster_nodes=cluster_nodes)
-        + _render_common_node_resolution_tail(service_name=service_name)
-        + _render_selection_supervisor_path_from_script_dir()
-        + f'SUPERVISOR_LABEL={_sh_quote(_bare_plain_selection_supervisor_label(name_prefix=name_prefix, service_name=service_name))}\n'
-        + "# English note:\n"
-        + "# - Generated bare stop is retained as a manual operator tool.\n"
-        + "# - Automation must not depend on this path for handover or rollout convergence.\n"
-        + "# - The command only asks the shared selection supervisor to retire the concrete selection\n"
-        + "#   identity identified by label on this node.\n"
-        + 'if ! python3 "$SELECTION_SUPERVISOR" stop --label "$SUPERVISOR_LABEL" --scope-key "$HOSTWORKDIR" --missing-ok >/dev/null; then\n'
-        + '  echo "[bare] stop failed svc=$SERVICE label=$SUPERVISOR_LABEL hostworkdir=$HOSTWORKDIR"\n'
-        + "  exit 1\n"
-        + "fi\n"
+    return _render_bare_template(
+        template_name="standalone_stop.sh.tmpl",
+        values={
+            "SERVICE_ASSIGN": _sh_quote(service_name),
+            "NAME_PREFIX_ASSIGN": _sh_quote(name_prefix),
+            "ALLOWED_NODES_BLOCK": _render_nodes_bash(name="ALLOWED_NODES", nodes=allowed_nodes),
+            "HOST_PRELUDE": _render_host_prelude(cluster_nodes=cluster_nodes),
+            "COMMON_NODE_RESOLUTION_TAIL": _render_common_node_resolution_tail(service_name=service_name),
+            "SELECTION_SUPERVISOR_PATH_BLOCK": _render_selection_supervisor_path_from_script_dir(),
+            "SUPERVISOR_LABEL_ASSIGN": _sh_quote(
+                _bare_plain_selection_supervisor_label(name_prefix=name_prefix, service_name=service_name)
+            ),
+        },
     )
 
 
@@ -429,20 +450,19 @@ def _render_atomic_group_start_script(
                 service_cfg=service_cfg,
             )
         )
-    return (
-        "#!/usr/bin/env bash\n"
-        "set -euo pipefail\n\n"
-        f"GROUP={_sh_quote(group_name)}\n"
-        f"NAME_PREFIX={_sh_quote(name_prefix)}\n"
-        + _render_host_prelude(cluster_nodes=cluster_nodes)
-        + _render_atomic_group_node_resolution_tail(group_cfg["nodes"])
-        + _render_selection_supervisor_path_from_script_dir()
-        + _render_proc_lifecycle_pid_tree_helpers()
-        + _render_tcp_ready_helpers()
-        + _render_global_env_exports(global_envs)
-        + f"GROUP_STARTUP_DEADLINE_TS=$(( $(date +%s) + {ATOMIC_GROUP_STARTUP_DEADLINE_SECONDS} ))\n"
-        + "".join(service_blocks)
-        + 'echo "[atomic-group] ready group=$GROUP node=$NODE_ID"\n'
+    return _render_bare_template(
+        template_name="atomic_group_start.sh.tmpl",
+        values={
+            "GROUP_ASSIGN": _sh_quote(group_name),
+            "NAME_PREFIX_ASSIGN": _sh_quote(name_prefix),
+            "HOST_PRELUDE": _render_host_prelude(cluster_nodes=cluster_nodes),
+            "ATOMIC_GROUP_NODE_RESOLUTION_TAIL": _render_atomic_group_node_resolution_tail(group_cfg["nodes"]),
+            "SELECTION_SUPERVISOR_PATH_BLOCK": _render_selection_supervisor_path_from_script_dir(),
+            "PROC_LIFECYCLE_HELPERS": _render_proc_lifecycle_pid_tree_helpers(),
+            "GLOBAL_ENV_EXPORTS": _render_global_env_exports(global_envs),
+            "GROUP_STARTUP_DEADLINE_ASSIGN": str(ATOMIC_GROUP_STARTUP_DEADLINE_SECONDS),
+            "SERVICE_BLOCKS": "".join(service_blocks),
+        },
     )
 
 
@@ -454,276 +474,105 @@ def _render_atomic_group_stop_script(
     group_cfg: Dict[str, Any],
 ) -> str:
     stop_services = list(reversed(group_cfg["services"]))
-    return (
-        "#!/usr/bin/env bash\n"
-        "set -u -o pipefail\n\n"
-        f"GROUP={_sh_quote(group_name)}\n"
-        f"NAME_PREFIX={_sh_quote(name_prefix)}\n"
-        + _render_host_prelude(cluster_nodes=cluster_nodes)
-        + _render_atomic_group_node_resolution_tail(group_cfg["nodes"])
-        + _render_selection_supervisor_path_from_script_dir()
-        + _render_atomic_group_stop_fn(
-            runtime_specs=[
-                {
-                    "service_name": service_name,
-                    "supervisor_label": _bare_atomic_group_member_selection_supervisor_label(
-                        name_prefix=name_prefix,
-                        group_name=group_name,
-                        service_name=service_name,
-                    ),
-                }
-                for service_name in stop_services
-            ],
-        )
-        + "stop_group\n"
+    return _render_bare_template(
+        template_name="atomic_group_stop.sh.tmpl",
+        values={
+            "GROUP_ASSIGN": _sh_quote(group_name),
+            "NAME_PREFIX_ASSIGN": _sh_quote(name_prefix),
+            "HOST_PRELUDE": _render_host_prelude(cluster_nodes=cluster_nodes),
+            "ATOMIC_GROUP_NODE_RESOLUTION_TAIL": _render_atomic_group_node_resolution_tail(group_cfg["nodes"]),
+            "SELECTION_SUPERVISOR_PATH_BLOCK": _render_selection_supervisor_path_from_script_dir(),
+            "ATOMIC_GROUP_STOP_FN": _render_atomic_group_stop_fn(
+                runtime_specs=[
+                    {
+                        "service_name": service_name,
+                        "supervisor_label": _bare_atomic_group_member_selection_supervisor_label(
+                            name_prefix=name_prefix,
+                            group_name=group_name,
+                            service_name=service_name,
+                        ),
+                    }
+                    for service_name in stop_services
+                ],
+            ),
+        },
     )
 
 
 def _render_host_prelude(*, cluster_nodes: List[Dict[str, Any]]) -> str:
     all_nodes = [_require_str(node.get("hostname"), "cluster_nodes[].hostname") for node in cluster_nodes]
-    out = _render_nodes_bash(name="ALL_NODES", nodes=all_nodes)
-    out += "\nLOCAL_HOSTNAME=$(hostname -s 2>/dev/null || hostname 2>/dev/null || echo unknown)\n"
-    out += 'LOCAL_FQDN=$(hostname -f 2>/dev/null || echo "$LOCAL_HOSTNAME")\n'
-    out += 'NODE_ID="${NODE_ID:-}"\n'
-    out += 'if [ -n "$NODE_ID" ]; then\n'
-    out += '  _node_id_known=false\n'
-    out += '  for n in "${ALL_NODES[@]}"; do\n'
-    out += '    if [ "$n" = "$NODE_ID" ]; then\n'
-    out += '      _node_id_known=true\n'
-    out += "      break\n"
-    out += "    fi\n"
-    out += "  done\n"
-    out += '  if [ "$_node_id_known" != true ]; then\n'
-    out += '    echo "Unknown preset NODE_ID: $NODE_ID"\n'
-    out += f'    echo "Known nodes: {" ".join(all_nodes)}"\n'
-    out += "    exit 1\n"
-    out += "  fi\n"
-    out += "fi\n"
-    out += 'if [ -z "$NODE_ID" ]; then\n'
-    out += 'for n in "${ALL_NODES[@]}"; do\n'
-    out += '  if [ "$n" = "$LOCAL_HOSTNAME" ] || [ "$n" = "$LOCAL_FQDN" ]; then\n'
-    out += '    NODE_ID="$n"\n'
-    out += "    break\n"
-    out += "  fi\n"
-    out += "done\n"
-    out += "fi\n"
-    out += 'if [ -z "$NODE_ID" ] && [ ${#ALL_NODES[@]} -eq 1 ]; then\n'
-    out += '  NODE_ID="${ALL_NODES[0]}"\n'
-    out += "fi\n"
-    out += 'if [ -z "$NODE_ID" ]; then\n'
-    out += '  for ip in $(hostname -I 2>/dev/null); do\n'
-    out += '    for n in "${ALL_NODES[@]}"; do\n'
-    out += '      _ip_n=""\n'
-    out += '      case "$n" in\n'
-    for node in cluster_nodes:
-        node_name = _require_str(node.get("hostname"), "cluster_nodes[].hostname")
-        node_ip = _require_str(node.get("ip"), f"cluster_nodes[{node_name}].ip")
-        out += f"        {_sh_quote(node_name)}) _ip_n={_sh_quote(node_ip)};;\n"
-    out += '        *) _ip_n="";;\n'
-    out += "      esac\n"
-    out += '      if [ "$_ip_n" = "$ip" ]; then\n'
-    out += '        NODE_ID="$n"\n'
-    out += "        break\n"
-    out += "      fi\n"
-    out += "    done\n"
-    out += '    [ -n "$NODE_ID" ] && break\n'
-    out += "  done\n"
-    out += "fi\n"
-    out += 'if [ -z "$NODE_ID" ]; then\n'
-    out += '  echo "Cannot map host to a configured node. Hostname=$LOCAL_HOSTNAME FQDN=$LOCAL_FQDN IPs=$(hostname -I 2>/dev/null)"\n'
-    out += f'  echo "Known nodes: {" ".join(all_nodes)}"\n'
-    out += "  exit 1\n"
-    out += "fi\n\n"
-    out += 'HOST_IP=""\nHOSTWORKDIR=""\ncase "$NODE_ID" in\n'
+    ip_case_lines: list[str] = []
+    host_case_lines: list[str] = []
     for node in cluster_nodes:
         node_name = _require_str(node.get("hostname"), "cluster_nodes[].hostname")
         node_ip = _require_str(node.get("ip"), f"cluster_nodes[{node_name}].ip")
         hostworkdir = _require_str(node.get("hostworkdir"), f"cluster_nodes[{node_name}].hostworkdir")
-        out += f"  {_sh_quote(node_name)}) HOST_IP={_sh_quote(node_ip)}; HOSTWORKDIR={_sh_quote(hostworkdir)};;\n"
-    out += '  *) echo "Unknown NODE_ID: $NODE_ID"; exit 1;;\n'
-    out += "esac\n"
-    return out
+        ip_case_lines.append(f"        {_sh_quote(node_name)}) _ip_n={_sh_quote(node_ip)};;")
+        host_case_lines.append(
+            f"  {_sh_quote(node_name)}) HOST_IP={_sh_quote(node_ip)}; HOSTWORKDIR={_sh_quote(hostworkdir)};;"
+        )
+    return _render_bare_template(
+        template_name="host_prelude.sh.tmpl",
+        values={
+            "ALL_NODES_BLOCK": _render_nodes_bash(name="ALL_NODES", nodes=all_nodes),
+            "KNOWN_NODES": " ".join(all_nodes),
+            "IP_CASE_LINES": "\n".join(ip_case_lines),
+            "HOST_CASE_LINES": "\n".join(host_case_lines),
+        },
+    )
 
 
 def _render_common_node_resolution_tail(*, service_name: str) -> str:
-    return (
-        'if [ ${#ALLOWED_NODES[@]} -gt 0 ]; then\n'
-        + '  _ok=false\n'
-        + '  for n in "${ALLOWED_NODES[@]}"; do\n'
-        + '    if [ "$n" = "$NODE_ID" ]; then _ok=true; fi\n'
-        + "  done\n"
-        + '  if [ "$_ok" != true ]; then\n'
-        + f'    echo "Service {service_name} not scheduled on this node ($NODE_ID). Allowed: ${{ALLOWED_NODES[*]}}"\n'
-        + "    exit 0\n"
-        + "  fi\n"
-        + "fi\n\n"
-        + 'export NODE_ID="$NODE_ID"\n'
-        + 'export HOST_IP="$HOST_IP"\n'
-        + 'export HOSTWORKDIR="$HOSTWORKDIR"\n\n'
+    return _render_bare_template(
+        template_name="common_node_resolution_tail.sh.tmpl",
+        values={"SERVICE_NAME": service_name},
     )
 
 
 def _render_atomic_group_node_resolution_tail(allowed_nodes: List[str]) -> str:
-    return (
-        _render_nodes_bash(name="GROUP_NODES", nodes=allowed_nodes)
-        + 'scheduled=false\n'
-        + 'for n in "${GROUP_NODES[@]}"; do\n'
-        + '  if [ "$n" = "$NODE_ID" ]; then scheduled=true; fi\n'
-        + "done\n"
-        + 'if [ "$scheduled" != true ]; then\n'
-        + '  echo "[atomic-group] skip group=$GROUP node=$NODE_ID allowed=${GROUP_NODES[*]}"\n'
-        + "  exit 0\n"
-        + "fi\n\n"
-        + 'export NODE_ID="$NODE_ID"\n'
-        + 'export HOST_IP="$HOST_IP"\n'
-        + 'export HOSTWORKDIR="$HOSTWORKDIR"\n'
-        + 'echo "[atomic-group] group=$GROUP node=$NODE_ID hostworkdir=$HOSTWORKDIR"\n\n'
+    return _render_bare_template(
+        template_name="atomic_group_node_resolution_tail.sh.tmpl",
+        values={"GROUP_NODES_BLOCK": _render_nodes_bash(name="GROUP_NODES", nodes=allowed_nodes)},
     )
 
 
 def _render_start_lock_block() -> str:
-    return (
-        'PID_DIR="$HOSTWORKDIR/run"\n'
-        + 'mkdir -p "$PID_DIR"\n'
-        + 'START_LOCKFILE="$PID_DIR/${SERVICE}.start.lock"\n'
-        + 'if ! command -v flock >/dev/null 2>&1; then\n'
-        + '  echo "Missing required command: flock"\n'
-        + "  exit 1\n"
-        + "fi\n"
-        + 'exec 9>"$START_LOCKFILE"\n'
-        + 'if ! flock -xn 9; then\n'
-        + '  echo "[bare] start skipped svc=$SERVICE reason=another start is already running lockfile=$START_LOCKFILE"\n'
-        + "  exit 0\n"
-        + "fi\n"
-        + 'exec 9>&-\n\n'
-    )
+    return _load_bare_template(template_name="start_lock_block.sh.tmpl")
 
 
 def _render_proc_lifecycle_pid_tree_helpers() -> str:
     return render_bash_proc_lifecycle_funcs_pid_tree(timeouts=STOP_TIMEOUTS) + "\n\n"
 
 
-def _render_tcp_ready_helpers() -> str:
-    return (
-        "wait_service_tcp_ready() {\n"
-        + '  svc="$1"\n'
-        + '  host="$2"\n'
-        + '  port="$3"\n'
-        + '  stable_seconds="$4"\n'
-        + '  deadline_ts="$5"\n'
-        + '  context="$6"\n'
-        + '  if [[ ! "$port" =~ ^[0-9]+$ ]]; then\n'
-        + '    echo "$context tcp-ready: invalid port svc=$svc port=$port"\n'
-        + "    return 1\n"
-        + "  fi\n"
-        + '  if [[ ! "$stable_seconds" =~ ^[0-9]+$ ]] || [ "$stable_seconds" -le 0 ]; then\n'
-        + '    echo "$context tcp-ready: invalid stable_seconds svc=$svc stable_seconds=$stable_seconds"\n'
-        + "    return 1\n"
-        + "  fi\n"
-        + f"  poll_interval_seconds={TCP_READY_POLL_INTERVAL_SECONDS}\n"
-        + '  stable_checks=$(python3 - "$stable_seconds" "$poll_interval_seconds" <<\'__FLUXON_TCP_READY_CHECKS__\'\n'
-        + "import math\n"
-        + "import sys\n"
-        + "stable_seconds = float(sys.argv[1])\n"
-        + "poll_interval_seconds = float(sys.argv[2])\n"
-        + "print(max(1, int(math.ceil(stable_seconds / poll_interval_seconds))))\n"
-        + "__FLUXON_TCP_READY_CHECKS__\n"
-        + ")\n"
-        + '  if [[ ! "$stable_checks" =~ ^[0-9]+$ ]] || [ "$stable_checks" -le 0 ]; then\n'
-        + '    echo "$context tcp-ready: failed to compute stable_checks svc=$svc"\n'
-        + "    return 1\n"
-        + "  fi\n"
-        + "  ok_checks=0\n"
-        + "  while true; do\n"
-        + '    now=$(date +%s)\n'
-        + '    if [ "$now" -ge "$deadline_ts" ]; then\n'
-        + '      echo "$context tcp-ready: deadline exceeded svc=$svc host=$host port=$port"\n'
-        + "      return 1\n"
-        + "    fi\n"
-        + '    if python3 - "$host" "$port" <<\'__FLUXON_TCP_READY_PROBE__\'\n'
-        + "import socket\n"
-        + "import sys\n"
-        + "host = sys.argv[1]\n"
-        + "port = int(sys.argv[2])\n"
-        + "with socket.create_connection((host, port), timeout=1.0):\n"
-        + "    pass\n"
-        + "__FLUXON_TCP_READY_PROBE__\n"
-        + "    then\n"
-        + "      ok_checks=$((ok_checks+1))\n"
-        + '      if [ "$ok_checks" -ge "$stable_checks" ]; then\n'
-        + '        echo "$context tcp-ready: ok svc=$svc host=$host port=$port stable_checks=$stable_checks"\n'
-        + "        return 0\n"
-        + "      fi\n"
-        + "    else\n"
-        + '      if [ "$ok_checks" -ne 0 ]; then\n'
-        + '        echo "$context tcp-ready: reset svc=$svc ok_checks=$ok_checks host=$host port=$port"\n'
-        + "      fi\n"
-        + "      ok_checks=0\n"
-        + "    fi\n"
-        + '    sleep "$poll_interval_seconds"\n'
-        + "  done\n"
-        + "}\n\n"
-    )
-
-
 def _render_selection_present_probe_fn() -> str:
-    return (
-        "selection_present() {\n"
-        + "  python3 - \"$SELECTION_SUPERVISOR\" \"$SUPERVISOR_LABEL\" \"$HOSTWORKDIR\" <<'__FLUXON_SELECTION_PRESENT__'\n"
-        + "import importlib.util\n"
-        + "import sys\n"
-        + "from pathlib import Path\n"
-        + "\n"
-        + "supervisor_path = Path(sys.argv[1])\n"
-        + "label = sys.argv[2]\n"
-        + "scope_key = sys.argv[3]\n"
-        + 'spec = importlib.util.spec_from_file_location("fluxon_selection_supervisor_probe", supervisor_path)\n'
-        + "if spec is None or spec.loader is None:\n"
-        + '    raise RuntimeError(f"failed to load selection supervisor module: {supervisor_path}")\n'
-        + "module = importlib.util.module_from_spec(spec)\n"
-        + "sys.modules[spec.name] = module\n"
-        + "spec.loader.exec_module(module)\n"
-        + "raise SystemExit(0 if module._selection_present(label, scope_key=scope_key) else 1)\n"
-        + "__FLUXON_SELECTION_PRESENT__\n"
-        + "}\n\n"
-    )
+    return _load_bare_template(template_name="selection_present_probe_fn.sh.tmpl")
 
 
 def _render_selection_supervisor_launch_wait_block(
     *,
     run_cmd: str,
-    logfile_expr: str,
     stable_seconds_expr: str,
     deadline_ts_expr: str,
     context: str,
 ) -> str:
-    return (
-        'SUPERVISOR_PID=$( '
-        + run_cmd
-        + f' >>{logfile_expr} 2>&1 < /dev/null & echo "$!" )\n'
-        + 'if [[ ! "$SUPERVISOR_PID" =~ ^[0-9]+$ ]]; then\n'
-        + f'  echo "{context} launch failed svc=$SERVICE label=$SUPERVISOR_LABEL supervisor_pid=$SUPERVISOR_PID"\n'
-        + "  exit 1\n"
-        + "fi\n"
-        + 'if ! wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" '
-        + stable_seconds_expr
-        + " "
-        + deadline_ts_expr
-        + f' "{context}"; then\n'
-        + f'  echo "{context} probable-ready failed svc=$SERVICE label=$SUPERVISOR_LABEL supervisor_pid=$SUPERVISOR_PID"\n'
-        + "  exit 1\n"
-        + "fi\n"
+    return _render_bare_template(
+        template_name="selection_supervisor_launch_wait_block.sh.tmpl",
+        values={
+            "RUN_CMD": run_cmd,
+            "STABLE_SECONDS_EXPR": stable_seconds_expr,
+            "DEADLINE_TS_EXPR": deadline_ts_expr,
+            "CONTEXT": context,
+        },
     )
 
 
-def _render_tcp_ready_wait_block(*, context: str) -> str:
+def _render_service_port_export(*, service_name: str, service_cfg: Dict[str, Any], indent: str = "") -> str:
+    service_port = _extract_port(service_cfg)
+    if service_port is None:
+        return indent + "unset SERVICE_PORT\n"
     return (
-        'if [[ "${SERVICE_PORT:-}" =~ ^[0-9]+$ ]]; then\n'
-        + f'  if ! wait_service_tcp_ready "$SERVICE" "$HOST_IP" "$SERVICE_PORT" {TCP_READY_STABLE_SECONDS} "$STARTUP_DEADLINE_TS" "{context}"; then\n'
-        + f'    echo "{context} tcp-ready failed svc=$SERVICE host=$HOST_IP port=$SERVICE_PORT"\n'
-        + "    exit 1\n"
-        + "  fi\n"
-        + "fi\n"
+        indent + f"export {service_name.upper()}__PORT={_sh_quote(str(service_port))}\n"
+        + indent + f"export SERVICE_PORT={_sh_quote(str(service_port))}\n"
     )
 
 
@@ -759,54 +608,28 @@ def _render_standalone_start_body(*, name_prefix: str, service_name: str) -> str
         crashloop_interval_lt_seconds=0,
         child_command=child_command,
     )
-    return (
-        f'SUPERVISOR_LABEL={_sh_quote(_bare_plain_selection_supervisor_label(name_prefix=name_prefix, service_name=service_name))}\n'
-        + f'RUNTIME_STATE_JSON={_sh_quote(runtime_state_json)}\n'
-        + 'OWNER_TS_MS=$(python3 -c \'import time; print(int(time.time() * 1000))\')\n'
-        + f"STARTUP_DEADLINE_TS=$(( $(date +%s) + {STANDALONE_STARTUP_DEADLINE_SECONDS} ))\n"
-        + 'LOG_DIR="$HOSTWORKDIR/log"\n'
-        + 'LOGFILE="$LOG_DIR/${SERVICE}.log"\n'
-        + 'mkdir -p "$LOG_DIR"\n'
-        + 'touch "$LOGFILE"\n'
-        + 'echo "Starting $SERVICE on $NODE_ID (IP: $HOST_IP, workdir: $HOSTWORKDIR)"\n'
-        + "# English note:\n"
-        + "# - bootstrap bare start must be idempotent when the shared selection supervisor already owns\n"
-        + "#   a live child for the same label.\n"
-        + "# - start_test_bed enables this path only for deployconf.bootstrap_bare_services.\n"
-        + 'if [ "${FLUXON_BARE_ALLOW_ALREADY_PRESENT:-false}" = "true" ]; then\n'
-        + "  if selection_present; then\n"
-        + '    echo "[bare] already present svc=$SERVICE label=$SUPERVISOR_LABEL"\n'
-        + '    echo "Started $SERVICE (label: $SUPERVISOR_LABEL)"\n'
-        + '    echo "Logs: $LOGFILE"\n'
-        + "    exit 0\n"
-        + "  fi\n"
-        + "fi\n"
-        + "# English note:\n"
-        + "# - Bare start must not depend on extra supervisor observation subcommands because the shared\n"
-        + "#   runtime surface is intentionally reduced to run/stop.\n"
-        + "# - We therefore launch the detached supervisor and wait until its pid subtree keeps a live child\n"
-        + "#   process for a short stable window.\n"
-        + _render_selection_supervisor_launch_wait_block(
-            run_cmd=run_cmd,
-            logfile_expr='"$LOGFILE"',
-            stable_seconds_expr=str(STANDALONE_PROBABLE_READY_SECONDS),
-            deadline_ts_expr='"$STARTUP_DEADLINE_TS"',
-            context="[bare]",
-        )
-        + _render_tcp_ready_wait_block(context="[bare]")
-        + 'echo "Started $SERVICE (label: $SUPERVISOR_LABEL)"\n'
-        + 'echo "Logs: $LOGFILE"\n'
+    return _render_bare_template(
+        template_name="standalone_start_body.sh.tmpl",
+        values={
+            "SUPERVISOR_LABEL_ASSIGN": _sh_quote(
+                _bare_plain_selection_supervisor_label(name_prefix=name_prefix, service_name=service_name)
+            ),
+            "RUNTIME_STATE_JSON_ASSIGN": _sh_quote(runtime_state_json),
+            "STARTUP_DEADLINE_SECONDS": str(STANDALONE_STARTUP_DEADLINE_SECONDS),
+            "SELECTION_SUPERVISOR_LAUNCH_WAIT_BLOCK": _render_selection_supervisor_launch_wait_block(
+                run_cmd=run_cmd,
+                stable_seconds_expr=str(STANDALONE_PROBABLE_READY_SECONDS),
+                deadline_ts_expr='"$STARTUP_DEADLINE_TS"',
+                context="[bare]",
+            ),
+        },
     )
 
 
 def _render_selection_supervisor_path_from_script_dir() -> str:
-    return (
-        'DIR=$(cd "$(dirname "$0")" && pwd)\n'
-        + f'SELECTION_SUPERVISOR="$DIR/{PYTHON_SELECTION_SUPERVISOR_FILENAME}"\n'
-        + 'if [ ! -f "$SELECTION_SUPERVISOR" ]; then\n'
-        + '  echo "Missing selection supervisor: $SELECTION_SUPERVISOR"\n'
-        + "  exit 1\n"
-        + "fi\n\n"
+    return _render_bare_template(
+        template_name="selection_supervisor_path_from_script_dir.sh.tmpl",
+        values={"SELECTION_SUPERVISOR_FILENAME": PYTHON_SELECTION_SUPERVISOR_FILENAME},
     )
 
 
@@ -833,10 +656,6 @@ def _render_atomic_group_service_block(
         log_path=f"${{HOSTWORKDIR}}/log/{service_name}.log",
     )
     allowed_nodes = _extract_nodes(service_cfg)
-    service_port = _extract_port(service_cfg)
-    port_export = ""
-    if service_port is not None:
-        port_export = f"  export {service_name.upper()}__PORT={_sh_quote(str(service_port))}\n"
     run_cmd = _render_selection_supervisor_run_shell(
         subcommand="run",
         supervisor_expr='"$SELECTION_SUPERVISOR"',
@@ -850,54 +669,37 @@ def _render_atomic_group_service_block(
         crashloop_interval_lt_seconds=ATOMIC_GROUP_CRASHLOOP_INTERVAL_LT_SECONDS,
         child_command=child_command,
     )
-    return (
-        f"\n# rollout: {service_name}\n"
-        + _render_nodes_bash(name="ALLOWED_NODES", nodes=allowed_nodes)
-        + "scheduled=false\n"
-        + 'for n in "${ALLOWED_NODES[@]}"; do\n'
-        + '  if [ "$n" = "$NODE_ID" ]; then scheduled=true; fi\n'
-        + "done\n"
-        + 'if [ "$scheduled" != true ]; then\n'
-        + f'  echo "[rollout] skip {service_name}: not scheduled on node $NODE_ID"\n'
-        + "else\n"
-        + f"  export SERVICE={_sh_quote(service_name)}\n"
-        + port_export
-        + '  LOG_DIR="$HOSTWORKDIR/log"\n'
-        + '  mkdir -p "$LOG_DIR"\n'
-        + f'  SUPERVISOR_LABEL={_sh_quote(_bare_atomic_group_member_selection_supervisor_label(name_prefix=name_prefix, group_name=group_name, service_name=service_name))}\n'
-        + f'  RUNTIME_STATE_JSON={_sh_quote(runtime_state_json)}\n'
-        + '  OWNER_TS_MS=$(python3 -c \'import time; print(int(time.time() * 1000))\')\n'
-        + f'  LOGFILE="$HOSTWORKDIR/log/{service_name}.log"\n'
-        + '  touch "$LOGFILE"\n'
-        + f'  echo "[rollout] start {service_name} node=$NODE_ID hostworkdir=$HOSTWORKDIR"\n'
-        + "  # English note:\n"
-        + "  # - Atomic-group order still depends on a readiness gate, but that gate now observes only the\n"
-        + "  #   detached supervisor process subtree on this host.\n"
-        + "  # - Ownership stays inside the shared selection supervisor big loop; the group runner only waits\n"
-        + "  #   until that loop has a stable live child before advancing to the next service.\n"
-        # English note:
-        # - The embedded `run_cmd` contains a nested `bash -lc` payload, and that payload may contain
-        #   heredocs used by real service entrypoints.
-        # - A blind newline replacement would shift heredoc terminators away from column 0 inside the
-        #   child shell and silently turn valid entrypoints into immediate no-op exits.
-        # - Indent only the outer block lines while preserving each inner line start exactly.
-        + _indent_script_block(
-            script=_render_selection_supervisor_launch_wait_block(
-                run_cmd=run_cmd,
-                logfile_expr='"$LOGFILE"',
-                stable_seconds_expr=str(ATOMIC_GROUP_PROBABLE_READY_SECONDS),
-                deadline_ts_expr='"$GROUP_STARTUP_DEADLINE_TS"',
-                context="[rollout]",
-            ).rstrip() + "\n",
-            prefix="  ",
-        ).rstrip()
-        + "\n"
-        + _indent_script_block(
-            script=_render_tcp_ready_wait_block(context="[rollout]"),
-            prefix="  ",
-        ).rstrip()
-        + "\n"
-        + "fi\n"
+    return _render_bare_template(
+        template_name="atomic_group_service_block.sh.tmpl",
+        values={
+            "SERVICE_NAME": service_name,
+            "ALLOWED_NODES_BLOCK": _render_nodes_bash(name="ALLOWED_NODES", nodes=allowed_nodes),
+            "SERVICE_EXPORT": _sh_quote(service_name),
+            "PORT_EXPORT": _render_service_port_export(
+                service_name=service_name,
+                service_cfg=service_cfg,
+                indent="  ",
+            ),
+            "SUPERVISOR_LABEL_ASSIGN": _sh_quote(
+                _bare_atomic_group_member_selection_supervisor_label(
+                    name_prefix=name_prefix,
+                    group_name=group_name,
+                    service_name=service_name,
+                )
+            ),
+            "RUNTIME_STATE_JSON_ASSIGN": _sh_quote(runtime_state_json),
+            "LOGFILE_PATH": f"$HOSTWORKDIR/log/{service_name}.log",
+            "INDENTED_SELECTION_SUPERVISOR_LAUNCH_WAIT_BLOCK": _indent_script_block(
+                script=_render_selection_supervisor_launch_wait_block(
+                    run_cmd=run_cmd,
+                    stable_seconds_expr=str(ATOMIC_GROUP_PROBABLE_READY_SECONDS),
+                    deadline_ts_expr='"$GROUP_STARTUP_DEADLINE_TS"',
+                    context="[rollout]",
+                ).rstrip()
+                + "\n",
+                prefix="  ",
+            ).rstrip(),
+        },
     )
 
 
diff --git a/deployment/templates/gen_bare_deploy_bash/atomic_group_node_resolution_tail.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/atomic_group_node_resolution_tail.sh.tmpl
new file mode 100644
index 0000000..d385995
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/atomic_group_node_resolution_tail.sh.tmpl
@@ -0,0 +1,14 @@
+{{GROUP_NODES_BLOCK}}scheduled=false  # flipped to true below only when NODE_ID appears in GROUP_NODES
+for n in "${GROUP_NODES[@]}"; do
+  if [ "$n" = "$NODE_ID" ]; then scheduled=true; fi
+done
+if [ "$scheduled" != true ]; then
+  echo "[atomic-group] skip group=$GROUP node=$NODE_ID allowed=${GROUP_NODES[*]}"
+  exit 0  # a node outside the group exits successfully instead of failing
+fi
+
+export NODE_ID="$NODE_ID"  # export the already-resolved values so child processes inherit them
+export HOST_IP="$HOST_IP"
+export HOSTWORKDIR="$HOSTWORKDIR"
+echo "[atomic-group] group=$GROUP node=$NODE_ID hostworkdir=$HOSTWORKDIR"
+
diff --git a/deployment/templates/gen_bare_deploy_bash/atomic_group_service_block.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/atomic_group_service_block.sh.tmpl
new file mode 100644
index 0000000..6ad9a1a
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/atomic_group_service_block.sh.tmpl
@@ -0,0 +1,24 @@
+
+# rollout: {{SERVICE_NAME}}
+{{ALLOWED_NODES_BLOCK}}scheduled=false  # flipped to true below only when NODE_ID appears in ALLOWED_NODES
+for n in "${ALLOWED_NODES[@]}"; do
+  if [ "$n" = "$NODE_ID" ]; then scheduled=true; fi
+done
+if [ "$scheduled" != true ]; then
+  echo "[rollout] skip {{SERVICE_NAME}}: not scheduled on node $NODE_ID"  # no exit here: the script continues past this block
+else
+  export SERVICE={{SERVICE_EXPORT}}
+{{PORT_EXPORT}}  LOG_DIR="$HOSTWORKDIR/log"
+  mkdir -p "$LOG_DIR"
+  SUPERVISOR_LABEL={{SUPERVISOR_LABEL_ASSIGN}}
+  RUNTIME_STATE_JSON={{RUNTIME_STATE_JSON_ASSIGN}}
+  OWNER_TS_MS=$(python3 -c 'import time; print(int(time.time() * 1000))')  # current epoch time in milliseconds
+  LOGFILE="{{LOGFILE_PATH}}"
+  echo "[rollout] start {{SERVICE_NAME}} node=$NODE_ID hostworkdir=$HOSTWORKDIR"
+  # English note:
+  # - Atomic-group order still depends on a readiness gate, but that gate now observes only the
+  #   detached supervisor process subtree on this host.
+  # - Ownership stays inside the shared selection supervisor big loop; the group runner only waits
+  #   through the fixed startup observation window before advancing to the next service.
+{{INDENTED_SELECTION_SUPERVISOR_LAUNCH_WAIT_BLOCK}}
+fi
diff --git a/deployment/templates/gen_bare_deploy_bash/atomic_group_start.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/atomic_group_start.sh.tmpl
new file mode 100644
index 0000000..d0c82ad
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/atomic_group_start.sh.tmpl
@@ -0,0 +1,7 @@
+#!/usr/bin/env bash
+set -euo pipefail  # exit on command failure, unset variable use, or a failing pipeline stage
+
+GROUP={{GROUP_ASSIGN}}
+NAME_PREFIX={{NAME_PREFIX_ASSIGN}}
+{{HOST_PRELUDE}}{{ATOMIC_GROUP_NODE_RESOLUTION_TAIL}}{{SELECTION_SUPERVISOR_PATH_BLOCK}}{{PROC_LIFECYCLE_HELPERS}}{{GLOBAL_ENV_EXPORTS}}GROUP_STARTUP_DEADLINE_TS=$(( $(date +%s) + {{GROUP_STARTUP_DEADLINE_ASSIGN}} ))  # absolute epoch-seconds deadline, computed once before the service blocks run
+{{SERVICE_BLOCKS}}echo "[atomic-group] ready group=$GROUP node=$NODE_ID"
diff --git a/deployment/templates/gen_bare_deploy_bash/atomic_group_stop.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/atomic_group_stop.sh.tmpl
new file mode 100644
index 0000000..5501b8f
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/atomic_group_stop.sh.tmpl
@@ -0,0 +1,6 @@
+#!/usr/bin/env bash
+set -u -o pipefail  # errexit (-e) is not enabled here, so a failing command does not abort the script by itself
+
+GROUP={{GROUP_ASSIGN}}
+NAME_PREFIX={{NAME_PREFIX_ASSIGN}}
+{{HOST_PRELUDE}}{{ATOMIC_GROUP_NODE_RESOLUTION_TAIL}}{{SELECTION_SUPERVISOR_PATH_BLOCK}}{{ATOMIC_GROUP_STOP_FN}}stop_group  # stop_group is presumably defined by the stop-function block substituted just before this call
diff --git a/deployment/templates/gen_bare_deploy_bash/bare_entrypoint.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/bare_entrypoint.sh.tmpl
new file mode 100644
index 0000000..39db682
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/bare_entrypoint.sh.tmpl
@@ -0,0 +1,5 @@
+#!/usr/bin/env bash
+set -euo pipefail  # exit on command failure, unset variable use, or a failing pipeline stage
+
+export SERVICE={{SERVICE_EXPORT}}  # exported before the substituted entrypoint body below runs
+{{ENTRYPOINT}}
diff --git a/deployment/templates/gen_bare_deploy_bash/common_node_resolution_tail.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/common_node_resolution_tail.sh.tmpl
new file mode 100644
index 0000000..e0cb433
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/common_node_resolution_tail.sh.tmpl
@@ -0,0 +1,15 @@
+if [ ${#ALLOWED_NODES[@]} -gt 0 ]; then  # an empty ALLOWED_NODES list skips the scheduling check entirely
+  _ok=false
+  for n in "${ALLOWED_NODES[@]}"; do
+    if [ "$n" = "$NODE_ID" ]; then _ok=true; fi
+  done
+  if [ "$_ok" != true ]; then
+    echo "Service {{SERVICE_NAME}} not scheduled on this node ($NODE_ID). Allowed: ${ALLOWED_NODES[*]}"
+    exit 0  # not scheduled on this node: exit successfully without doing anything
+  fi
+fi
+
+export NODE_ID="$NODE_ID"  # export the already-resolved values so child processes inherit them
+export HOST_IP="$HOST_IP"
+export HOSTWORKDIR="$HOSTWORKDIR"
+
diff --git a/deployment/templates/gen_bare_deploy_bash/etcd_health_wait_block.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/etcd_health_wait_block.sh.tmpl
new file mode 100644
index 0000000..b424bc3
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/etcd_health_wait_block.sh.tmpl
@@ -0,0 +1,4 @@
+if ! wait_service_etcd_endpoint_healthy "$SERVICE" "$HOSTWORKDIR/fluxon_release/ext_images/etcd/etcdctl" "http://$HOST_IP:$SERVICE_PORT" {{ETCD_HEALTH_STABLE_SECONDS}} {{ETCD_HEALTH_DEADLINE_TS}} "{{CONTEXT}}"; then  # probes the endpoint built from HOST_IP and SERVICE_PORT
+  echo "{{CONTEXT}} etcd-health failed svc=$SERVICE endpoint=http://$HOST_IP:$SERVICE_PORT"
+  exit 1  # a failed health wait aborts the calling script
+fi
diff --git a/deployment/templates/gen_bare_deploy_bash/host_prelude.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/host_prelude.sh.tmpl
new file mode 100644
index 0000000..6075106
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/host_prelude.sh.tmpl
@@ -0,0 +1,57 @@
+{{ALL_NODES_BLOCK}}
+LOCAL_HOSTNAME=$(hostname -s 2>/dev/null || hostname 2>/dev/null || echo unknown)  # short name, else plain hostname, else the literal "unknown"
+LOCAL_FQDN=$(hostname -f 2>/dev/null || echo "$LOCAL_HOSTNAME")  # falls back to the short name when the FQDN lookup fails
+NODE_ID="${NODE_ID:-}"  # keep a NODE_ID preset in the environment; default to empty so later tests work under set -u
+if [ -n "$NODE_ID" ]; then  # step 1: a preset NODE_ID must be one of ALL_NODES
+  _node_id_known=false
+  for n in "${ALL_NODES[@]}"; do
+    if [ "$n" = "$NODE_ID" ]; then
+      _node_id_known=true
+      break
+    fi
+  done
+  if [ "$_node_id_known" != true ]; then
+    echo "Unknown preset NODE_ID: $NODE_ID"
+    echo "Known nodes: {{KNOWN_NODES}}"
+    exit 1
+  fi
+fi
+if [ -z "$NODE_ID" ]; then  # step 2: match the local short hostname or FQDN against ALL_NODES
+for n in "${ALL_NODES[@]}"; do
+  if [ "$n" = "$LOCAL_HOSTNAME" ] || [ "$n" = "$LOCAL_FQDN" ]; then
+    NODE_ID="$n"
+    break
+  fi
+done
+fi
+if [ -z "$NODE_ID" ] && [ ${#ALL_NODES[@]} -eq 1 ]; then  # step 3: a single configured node is used without any matching
+  NODE_ID="${ALL_NODES[0]}"
+fi
+if [ -z "$NODE_ID" ]; then  # step 4: match each address printed by hostname -I against the per-node case table
+  for ip in $(hostname -I 2>/dev/null); do
+    for n in "${ALL_NODES[@]}"; do
+      _ip_n=""
+      case "$n" in
+{{IP_CASE_LINES}}
+        *) _ip_n="";;
+      esac
+      if [ "$_ip_n" = "$ip" ]; then
+        NODE_ID="$n"
+        break
+      fi
+    done
+    [ -n "$NODE_ID" ] && break  # leave the outer loop as well once a node matched
+  done
+fi
+if [ -z "$NODE_ID" ]; then  # every resolution step failed
+  echo "Cannot map host to a configured node. Hostname=$LOCAL_HOSTNAME FQDN=$LOCAL_FQDN IPs=$(hostname -I 2>/dev/null)"
+  echo "Known nodes: {{KNOWN_NODES}}"
+  exit 1
+fi
+
+HOST_IP=""
+HOSTWORKDIR=""
+case "$NODE_ID" in  # the substituted case arms presumably assign HOST_IP and HOSTWORKDIR per node
+{{HOST_CASE_LINES}}
+  *) echo "Unknown NODE_ID: $NODE_ID"; exit 1;;
+esac
diff --git a/deployment/templates/gen_bare_deploy_bash/selection_present_probe_fn.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/selection_present_probe_fn.sh.tmpl
new file mode 100644
index 0000000..0a7282b
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/selection_present_probe_fn.sh.tmpl
@@ -0,0 +1,19 @@
+selection_present() {  # exit status 0 when the supervisor module reports the selection present, non-zero otherwise
+  python3 - "$SELECTION_SUPERVISOR" "$SUPERVISOR_LABEL" "$HOSTWORKDIR" <<'__FLUXON_SELECTION_PRESENT__'
+import importlib.util
+import sys
+from pathlib import Path
+
+supervisor_path = Path(sys.argv[1])
+label = sys.argv[2]
+scope_key = sys.argv[3]  # the caller passes HOSTWORKDIR as the scope key
+spec = importlib.util.spec_from_file_location("fluxon_selection_supervisor_probe", supervisor_path)
+if spec is None or spec.loader is None:
+    raise RuntimeError(f"failed to load selection supervisor module: {supervisor_path}")
+module = importlib.util.module_from_spec(spec)
+sys.modules[spec.name] = module  # registered before the module body is executed
+spec.loader.exec_module(module)
+raise SystemExit(0 if module._selection_present(label, scope_key=scope_key) else 1)  # map the boolean result to the exit status
+__FLUXON_SELECTION_PRESENT__
+}
+
diff --git a/deployment/templates/gen_bare_deploy_bash/selection_supervisor_launch_wait_block.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/selection_supervisor_launch_wait_block.sh.tmpl
new file mode 100644
index 0000000..f466cbc
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/selection_supervisor_launch_wait_block.sh.tmpl
@@ -0,0 +1,9 @@
+SUPERVISOR_PID=$( {{RUN_CMD}} < /dev/null & echo "$!" )  # background the launch with stdin detached and capture its PID
+if [[ ! "$SUPERVISOR_PID" =~ ^[0-9]+$ ]]; then  # anything other than a decimal PID counts as a failed launch
+  echo "{{CONTEXT}} launch failed svc=$SERVICE label=$SUPERVISOR_LABEL supervisor_pid=$SUPERVISOR_PID"
+  exit 1
+fi
+if ! wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" {{STABLE_SECONDS_EXPR}} {{DEADLINE_TS_EXPR}} "{{CONTEXT}}"; then  # helper is defined outside this template
+  echo "{{CONTEXT}} probable-ready failed svc=$SERVICE label=$SUPERVISOR_LABEL supervisor_pid=$SUPERVISOR_PID"
+  exit 1
+fi
diff --git a/deployment/templates/gen_bare_deploy_bash/selection_supervisor_path_from_script_dir.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/selection_supervisor_path_from_script_dir.sh.tmpl
new file mode 100644
index 0000000..dac7dff
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/selection_supervisor_path_from_script_dir.sh.tmpl
@@ -0,0 +1,7 @@
+DIR=$(cd "$(dirname "$0")" && pwd)  # absolute path of the directory containing the running script
+SELECTION_SUPERVISOR="$DIR/{{SELECTION_SUPERVISOR_FILENAME}}"  # the supervisor file is expected next to this script
+if [ ! -f "$SELECTION_SUPERVISOR" ]; then
+  echo "Missing selection supervisor: $SELECTION_SUPERVISOR"
+  exit 1
+fi
+
diff --git a/deployment/templates/gen_bare_deploy_bash/standalone_start.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/standalone_start.sh.tmpl
new file mode 100644
index 0000000..5a565f1
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/standalone_start.sh.tmpl
@@ -0,0 +1,6 @@
+#!/usr/bin/env bash
+set -euo pipefail  # exit on command failure, unset variable use, or a failing pipeline stage
+
+SERVICE={{SERVICE_ASSIGN}}  # assigned first because the substituted blocks below read SERVICE
+NAME_PREFIX={{NAME_PREFIX_ASSIGN}}
+{{ALLOWED_NODES_BLOCK}}{{HOST_PRELUDE}}{{COMMON_NODE_RESOLUTION_TAIL}}{{SELECTION_SUPERVISOR_PATH_BLOCK}}{{PROC_LIFECYCLE_HELPERS}}{{SELECTION_PRESENT_PROBE_FN}}{{START_LOCK_BLOCK}}{{GLOBAL_ENV_EXPORTS}}{{PORT_EXPORT}}{{START_BODY}}
diff --git a/deployment/templates/gen_bare_deploy_bash/standalone_start_body.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/standalone_start_body.sh.tmpl
new file mode 100644
index 0000000..bc2fc40
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/standalone_start_body.sh.tmpl
@@ -0,0 +1,27 @@
+SUPERVISOR_LABEL={{SUPERVISOR_LABEL_ASSIGN}}
+RUNTIME_STATE_JSON={{RUNTIME_STATE_JSON_ASSIGN}}
+OWNER_TS_MS=$(python3 -c 'import time; print(int(time.time() * 1000))')  # current epoch time in milliseconds
+STARTUP_DEADLINE_TS=$(( $(date +%s) + {{STARTUP_DEADLINE_SECONDS}} ))  # absolute epoch-seconds deadline: now plus the configured window
+LOG_DIR="$HOSTWORKDIR/log"
+LOGFILE="$LOG_DIR/${SERVICE}.log"
+mkdir -p "$LOG_DIR"
+echo "Starting $SERVICE on $NODE_ID (IP: $HOST_IP, workdir: $HOSTWORKDIR)"
+# English note:
+# - bootstrap bare start must be idempotent when the shared selection supervisor already owns
+#   a live child for the same label.
+# - start_test_bed enables this path only for deployconf.bootstrap_bare_services.
+if [ "${FLUXON_BARE_ALLOW_ALREADY_PRESENT:-false}" = "true" ]; then  # opt-in; treated as false when the variable is unset
+  if selection_present; then
+    echo "[bare] already present svc=$SERVICE label=$SUPERVISOR_LABEL"
+    echo "Started $SERVICE (label: $SUPERVISOR_LABEL)"
+    echo "Logs: $LOGFILE"
+    exit 0  # exit successfully before the launch block below runs
+  fi
+fi
+# English note:
+# - Bare start must not depend on extra supervisor observation subcommands because the shared
+#   runtime surface is intentionally reduced to run/stop.
+# - We therefore launch the detached supervisor and wait until its pid subtree keeps a live child
+#   process alive across the fixed startup observation window.
+{{SELECTION_SUPERVISOR_LAUNCH_WAIT_BLOCK}}echo "Started $SERVICE (label: $SUPERVISOR_LABEL)"
+echo "Logs: $LOGFILE"
diff --git a/deployment/templates/gen_bare_deploy_bash/standalone_stop.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/standalone_stop.sh.tmpl
new file mode 100644
index 0000000..4f7dc37
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/standalone_stop.sh.tmpl
@@ -0,0 +1,15 @@
+#!/usr/bin/env bash
+set -euo pipefail  # exit on command failure, unset variable use, or a failing pipeline stage
+
+SERVICE={{SERVICE_ASSIGN}}
+NAME_PREFIX={{NAME_PREFIX_ASSIGN}}
+{{ALLOWED_NODES_BLOCK}}{{HOST_PRELUDE}}{{COMMON_NODE_RESOLUTION_TAIL}}{{SELECTION_SUPERVISOR_PATH_BLOCK}}SUPERVISOR_LABEL={{SUPERVISOR_LABEL_ASSIGN}}
+# English note:
+# - Generated bare stop is retained as a manual operator tool.
+# - Automation must not depend on this path for handover or rollout convergence.
+# - The command only asks the shared selection supervisor to retire the concrete selection
+#   identity identified by label on this node.
+if ! python3 "$SELECTION_SUPERVISOR" stop --label "$SUPERVISOR_LABEL" --scope-key "$HOSTWORKDIR" --missing-ok >/dev/null; then  # stdout is discarded; only the exit status is used
+  echo "[bare] stop failed svc=$SERVICE label=$SUPERVISOR_LABEL hostworkdir=$HOSTWORKDIR"
+  exit 1
+fi
diff --git a/deployment/templates/gen_bare_deploy_bash/start_lock_block.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/start_lock_block.sh.tmpl
new file mode 100644
index 0000000..47ec770
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/start_lock_block.sh.tmpl
@@ -0,0 +1,14 @@
+PID_DIR="$HOSTWORKDIR/run"
+mkdir -p "$PID_DIR"
+START_LOCKFILE="$PID_DIR/${SERVICE}.start.lock"  # one lock file per service name
+if ! command -v flock >/dev/null 2>&1; then
+  echo "Missing required command: flock"
+  exit 1
+fi
+exec 9>"$START_LOCKFILE"  # open (creating or truncating) the lock file on file descriptor 9
+if ! flock -xn 9; then  # exclusive and non-blocking: fails at once when another process holds the lock
+  echo "[bare] start skipped svc=$SERVICE reason=another start is already running lockfile=$START_LOCKFILE"
+  exit 0  # a concurrent start is reported as success, not as an error
+fi
+exec 9>&-  # NOTE(review): closing fd 9 here presumably releases the lock before the service is launched - confirm this is intended
+
diff --git a/deployment/templates/gen_bare_deploy_bash/tcp_ready_helpers.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/tcp_ready_helpers.sh.tmpl
new file mode 100644
index 0000000..0c0cc3b
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/tcp_ready_helpers.sh.tmpl
@@ -0,0 +1,120 @@
+wait_service_tcp_ready() {  # poll host:port until enough consecutive TCP connects succeed; return 1 on bad input or deadline
+  local svc="$1"  # service name, used only in log lines
+  local host="$2"
+  local port="$3"  # must be a plain decimal number
+  local stable_seconds="$4"  # positive integer; converted into a required count of consecutive successful probes
+  local deadline_ts="$5"  # absolute epoch seconds after which the wait fails
+  local context="$6"  # prefix for every log line
+  if [[ ! "$port" =~ ^[0-9]+$ ]]; then
+    echo "$context tcp-ready: invalid port svc=$svc port=$port"
+    return 1
+  fi
+  if [[ ! "$stable_seconds" =~ ^[0-9]+$ ]] || [ "$stable_seconds" -le 0 ]; then
+    echo "$context tcp-ready: invalid stable_seconds svc=$svc stable_seconds=$stable_seconds"
+    return 1
+  fi
+  local poll_interval_seconds={{TCP_READY_POLL_INTERVAL_SECONDS}} stable_checks now  # all working variables are function-local so callers are not clobbered
+  stable_checks=$(python3 - "$stable_seconds" "$poll_interval_seconds" <<'__FLUXON_TCP_READY_CHECKS__'
+import math
+import sys
+stable_seconds = float(sys.argv[1])
+poll_interval_seconds = float(sys.argv[2])
+print(max(1, int(math.ceil(stable_seconds / poll_interval_seconds))))
+__FLUXON_TCP_READY_CHECKS__
+)
+  if [[ ! "$stable_checks" =~ ^[0-9]+$ ]] || [ "$stable_checks" -le 0 ]; then
+    echo "$context tcp-ready: failed to compute stable_checks svc=$svc"
+    return 1
+  fi
+  local ok_checks=0  # consecutive successful probes so far; reset to 0 on any failed probe
+  while true; do
+    now=$(date +%s)
+    if [ "$now" -ge "$deadline_ts" ]; then
+      echo "$context tcp-ready: deadline exceeded svc=$svc host=$host port=$port"
+      return 1
+    fi
+    if python3 - "$host" "$port" <<'__FLUXON_TCP_READY_PROBE__'
+import socket
+import sys
+host = sys.argv[1]
+port = int(sys.argv[2])
+with socket.create_connection((host, port), timeout=1.0):
+    pass
+__FLUXON_TCP_READY_PROBE__
+    then
+      ok_checks=$((ok_checks+1))
+      if [ "$ok_checks" -ge "$stable_checks" ]; then
+        echo "$context tcp-ready: ok svc=$svc host=$host port=$port stable_checks=$stable_checks"
+        return 0
+      fi
+    else
+      if [ "$ok_checks" -ne 0 ]; then
+        echo "$context tcp-ready: reset svc=$svc ok_checks=$ok_checks host=$host port=$port"
+      fi
+      ok_checks=0
+    fi
+    sleep "$poll_interval_seconds"
+  done
+}
+
+wait_service_etcd_endpoint_healthy() {  # poll etcdctl endpoint health until enough consecutive probes succeed; return 1 on bad input or deadline
+  local svc="$1"  # service name, used only in log lines
+  local etcdctl_bin="$2"  # must be an executable file
+  local endpoint="$3"  # must be non-empty
+  local stable_seconds="$4"  # positive integer; converted into a required count of consecutive successful probes
+  local deadline_ts="$5"  # absolute epoch seconds after which the wait fails
+  local context="$6"  # prefix for every log line
+  if [ ! -x "$etcdctl_bin" ]; then
+    echo "$context etcd-health: missing etcdctl svc=$svc path=$etcdctl_bin"
+    return 1
+  fi
+  if [ -z "$endpoint" ]; then
+    echo "$context etcd-health: missing endpoint svc=$svc"
+    return 1
+  fi
+  if [[ ! "$stable_seconds" =~ ^[0-9]+$ ]] || [ "$stable_seconds" -le 0 ]; then
+    echo "$context etcd-health: invalid stable_seconds svc=$svc stable_seconds=$stable_seconds"
+    return 1
+  fi
+  local poll_interval_seconds={{ETCD_HEALTH_POLL_INTERVAL_SECONDS}} stable_checks now probe_output  # all working variables are function-local so callers are not clobbered
+  stable_checks=$(python3 - "$stable_seconds" "$poll_interval_seconds" <<'__FLUXON_ETCD_HEALTH_CHECKS__'
+import math
+import sys
+stable_seconds = float(sys.argv[1])
+poll_interval_seconds = float(sys.argv[2])
+print(max(1, int(math.ceil(stable_seconds / poll_interval_seconds))))
+__FLUXON_ETCD_HEALTH_CHECKS__
+)
+  if [[ ! "$stable_checks" =~ ^[0-9]+$ ]] || [ "$stable_checks" -le 0 ]; then
+    echo "$context etcd-health: failed to compute stable_checks svc=$svc"
+    return 1
+  fi
+  local ok_checks=0  # consecutive successful probes so far; reset to 0 on any failed probe
+  local last_output=""  # output of the most recent failed probe, reported when the deadline passes
+  while true; do
+    now=$(date +%s)
+    if [ "$now" -ge "$deadline_ts" ]; then
+      if [ -n "$last_output" ]; then
+        last_output="${last_output//$'\n'/ }"
+        echo "$context etcd-health: deadline exceeded svc=$svc endpoint=$endpoint last_output=$last_output"
+      else
+        echo "$context etcd-health: deadline exceeded svc=$svc endpoint=$endpoint"
+      fi
+      return 1
+    fi
+    if probe_output=$(ETCDCTL_API=3 "$etcdctl_bin" --endpoints "$endpoint" --dial-timeout "{{ETCD_HEALTH_PROBE_TIMEOUT_MS}}ms" --command-timeout "{{ETCD_HEALTH_PROBE_TIMEOUT_MS}}ms" endpoint health 2>&1); then
+      ok_checks=$((ok_checks+1))
+      if [ "$ok_checks" -ge "$stable_checks" ]; then
+        echo "$context etcd-health: ok svc=$svc endpoint=$endpoint stable_checks=$stable_checks"
+        return 0
+      fi
+    else
+      last_output="$probe_output"
+      if [ "$ok_checks" -ne 0 ]; then
+        echo "$context etcd-health: reset svc=$svc ok_checks=$ok_checks endpoint=$endpoint"
+      fi
+      ok_checks=0
+    fi
+    sleep "$poll_interval_seconds"
+  done
+}
diff --git a/deployment/templates/gen_bare_deploy_bash/tcp_ready_wait_block.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/tcp_ready_wait_block.sh.tmpl
new file mode 100644
index 0000000..bbf021b
--- /dev/null
+++ b/deployment/templates/gen_bare_deploy_bash/tcp_ready_wait_block.sh.tmpl
@@ -0,0 +1,6 @@
+if [[ "${SERVICE_PORT:-}" =~ ^[0-9]+$ ]]; then  # the wait is skipped entirely unless SERVICE_PORT is a plain decimal number
+  if ! wait_service_tcp_ready "$SERVICE" "$HOST_IP" "$SERVICE_PORT" {{TCP_READY_STABLE_SECONDS}} {{TCP_READY_DEADLINE_TS}} "{{CONTEXT}}"; then
+    echo "{{CONTEXT}} tcp-ready failed svc=$SERVICE host=$HOST_IP port=$SERVICE_PORT"
+    exit 1  # a failed readiness wait aborts the calling script
+  fi
+fi
diff --git a/deployment/tests/test_gen_bare_deploy_bash.py b/deployment/tests/test_gen_bare_deploy_bash.py
index f51a923..f1645a3 100644
--- a/deployment/tests/test_gen_bare_deploy_bash.py
+++ b/deployment/tests/test_gen_bare_deploy_bash.py
@@ -13,6 +13,8 @@
 from pathlib import Path
 from typing import Callable, List, Optional, Tuple
 
+import yaml
+
 
 SCRIPT_DIR = Path(__file__).resolve().parent
 DEPLOYMENT_DIR = SCRIPT_DIR.parent
@@ -50,6 +52,12 @@ def _build_checks(selected_test_id: Optional[str]) -> List[Tuple[str, Callable[[
         ("preserves_hostworkdir_runtime_token", test_preserves_hostworkdir_runtime_token),
         ("generated_scripts_do_not_embed_pidfile_authority", test_generated_scripts_do_not_embed_pidfile_authority),
         ("ops_entrypoints_use_direct_scripts", test_ops_entrypoints_use_direct_scripts),
+        ("bare_start_uses_no_exit_startup_gate", test_bare_start_uses_no_exit_startup_gate),
+        (
+            "normalized_testbed_master_exports_service_port_for_atomic_group",
+            test_normalized_testbed_master_exports_service_port_for_atomic_group,
+        ),
+        ("normalized_testbed_owner_emits_large_file_paths", test_normalized_testbed_owner_emits_large_file_paths),
         ("bare_child_command_preserves_runtime_hostworkdir_expansion", test_bare_child_command_preserves_runtime_hostworkdir_expansion),
         ("supervisor_label_uses_stable_selection_suffix", test_supervisor_label_uses_stable_selection_suffix),
         ("bootstrap_start_reuses_already_present_selection", test_bootstrap_start_reuses_already_present_selection),
@@ -93,6 +101,7 @@ def test_preserves_hostworkdir_runtime_token() -> None:
                   FLUXON_SHARED_MEM: "${HOSTWORKDIR}/shm1"
                 service:
                   svc_plain:
+                    port: 12345
                     entrypoint: |
                       WORKDIR="${HOSTWORKDIR}/svc_${NODE_ID}"
                       EXPORT_TABLE=$(cat <<EOF
@@ -127,8 +136,14 @@ def test_preserves_hostworkdir_runtime_token() -> None:
         assert "wait-present" not in script, script
         assert "launch_only_start_gate" not in script, script
         assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID"' in script, script
-        assert 'wait_service_tcp_ready "$SERVICE" "$HOST_IP" "$SERVICE_PORT"' in script, script
+        assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_TS" "[bare]"' in script, script
+        assert "export SERVICE_PORT=12345" in script, script
+        assert 'STARTUP_DEADLINE_TS=$(( $(date +%s) + 10 ))' in script, script
+        assert "wait_service_tcp_ready" not in script, script
+        assert "wait_service_etcd_endpoint_healthy" not in script, script
         assert 'SUPERVISOR_PID=$( setsid ' not in script, script
+        assert '>>"$LOGFILE" 2>&1' not in script, script
+        assert 'touch "$LOGFILE"' not in script, script
         assert 'python3 "$SELECTION_SUPERVISOR" stop --label "$SUPERVISOR_LABEL" --scope-key "$HOSTWORKDIR" --missing-ok' in stop_script, stop_script
         assert "retire-runtime" not in stop_script, stop_script
         print("PASS: test_preserves_hostworkdir_runtime_token")
@@ -149,6 +164,7 @@ def test_atomic_group_start_does_not_auto_stop_on_failure() -> None:
                     hostworkdir: /tmp/hostworkdir
                 service:
                   svc_a:
+                    port: 23456
                     entrypoint: |
                       echo svc_a
                     node_bind:
@@ -179,7 +195,12 @@ def test_atomic_group_start_does_not_auto_stop_on_failure() -> None:
         assert 'SUPERVISOR_PID=$( setsid ' not in script, script
         assert 'echo "[rollout] probable-ready failed svc=$SERVICE label=$SUPERVISOR_LABEL supervisor_pid=$SUPERVISOR_PID"' in script, script
         assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID"' in script, script
-        assert 'wait_service_tcp_ready "$SERVICE" "$HOST_IP" "$SERVICE_PORT"' in script, script
+        assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$GROUP_STARTUP_DEADLINE_TS" "[rollout]"' in script, script
+        assert 'GROUP_STARTUP_DEADLINE_TS=$(( $(date +%s) + 10 ))' in script, script
+        assert "export SERVICE_PORT=23456" in script, script
+        assert "unset SERVICE_PORT" in script, script
+        assert "wait_service_tcp_ready" not in script, script
+        assert "wait_service_etcd_endpoint_healthy" not in script, script
         print("PASS: test_atomic_group_start_does_not_auto_stop_on_failure")
 
 
@@ -251,11 +272,129 @@ def test_ops_entrypoints_use_direct_scripts() -> None:
 
         assert "-m fluxon_py.runtime.start_ops_controller" in controller_entrypoint, controller_entrypoint
         assert "examples/fluxon_ops/start_controller.py" not in controller_entrypoint, controller_entrypoint
+        assert 'http_listen_addr: "0.0.0.0:19080"' in controller_entrypoint, controller_entrypoint
+        assert 'http_listen_addr: "0.0.0.0:${MASTER__PORT}"' not in controller_entrypoint, controller_entrypoint
         assert "-m fluxon_py.runtime.start_ops_agent" in agent_entrypoint, agent_entrypoint
         assert "examples/fluxon_ops/start_agent.py" not in agent_entrypoint, agent_entrypoint
         print("PASS: test_ops_entrypoints_use_direct_scripts")
 
 
+def test_bare_start_uses_no_exit_startup_gate() -> None:  # standalone start scripts must use the pid-tree gate, never the tcp/etcd waits
+    with tempfile.TemporaryDirectory(prefix="test_gen_bare_deploy_bash_no_exit_gate_") as td:
+        tmpdir = Path(td)
+        config_path = tmpdir / "deployconf.yaml"
+        outdir = tmpdir / "out"
+        config_path.write_text(
+            textwrap.dedent(
+                """
+                name_prefix: fluxon-testbed
+                cluster_nodes:
+                  - hostname: node-a
+                    ip: 127.0.0.1
+                    hostworkdir: /tmp/hostworkdir
+                service:
+                  etcd:
+                    port: 2379
+                    entrypoint: |
+                      echo etcd
+                    node_bind:
+                      node: ["node-a"]
+                  tikv:
+                    port: 20160
+                    entrypoint: |
+                      echo tikv
+                    node_bind:
+                      node: ["node-a"]
+                  svc_plain:
+                    port: 12345
+                    entrypoint: |
+                      echo plain
+                    node_bind:
+                      node: ["node-a"]
+                """
+            ).strip()
+            + "\n",
+            encoding="utf-8",
+        )
+
+        result = _run_generator(config_path=config_path, outdir=outdir)
+        assert result.returncode == 0, f"generator failed: stdout={result.stdout} stderr={result.stderr}"
+
+        etcd_script = (outdir / "start_etcd.sh").read_text(encoding="utf-8")
+        tikv_script = (outdir / "start_tikv.sh").read_text(encoding="utf-8")
+        plain_script = (outdir / "start_svc_plain.sh").read_text(encoding="utf-8")
+
+        for script in (etcd_script, tikv_script, plain_script):  # the same gate is expected for etcd, tikv, and a plain service alike
+            assert 'STARTUP_DEADLINE_TS=$(( $(date +%s) + 10 ))' in script, script
+            assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_TS" "[bare]"' in script, script
+            assert "wait_service_tcp_ready" not in script, script
+            assert "wait_service_etcd_endpoint_healthy" not in script, script
+        print("PASS: test_bare_start_uses_no_exit_startup_gate")
+
+
+def test_normalized_testbed_master_exports_service_port_for_atomic_group() -> None:  # checks the master block of the generated group start script
+    with tempfile.TemporaryDirectory(prefix="test_gen_bare_deploy_bash_normalized_testbed_") as td:
+        tmpdir = Path(td)
+        config_path = tmpdir / "deployconf.normalized.yaml"
+        outdir = tmpdir / "out"
+
+        start_test_bed = _load_python_module(
+            module_name="start_test_bed_for_gen_bare_tests",
+            path=DEPLOYMENT_DIR.parent / "fluxon_test_stack" / "start_test_bed.py",
+        )
+        base_cfg = yaml.safe_load(
+            (DEPLOYMENT_DIR.parent / "fluxon_test_stack" / "deployconf_testbed.yml").read_text(encoding="utf-8")
+        )
+        normalized, _ = start_test_bed._normalize_bootstrap_deployconf(deployconf=base_cfg)  # second return value is not used here
+        config_path.write_text(
+            yaml.safe_dump(normalized, sort_keys=False, allow_unicode=False),
+            encoding="utf-8",
+        )
+
+        result = _run_generator(config_path=config_path, outdir=outdir)
+        assert result.returncode == 0, f"generator failed: stdout={result.stdout} stderr={result.stderr}"
+
+        script = (outdir / "start_fluxon_core_controller.sh").read_text(encoding="utf-8")
+        master_block_start = script.index("export SERVICE=master")  # str.index raises ValueError if the marker is missing
+        owner_block_start = script.index("export SERVICE=owner")
+        master_block = script[master_block_start:owner_block_start]  # text from the master export up to the owner export
+        assert "export MASTER__PORT=51051" in master_block, master_block
+        assert "export SERVICE_PORT=51051" in master_block, master_block
+        assert "unset SERVICE_PORT" not in master_block, master_block
+        assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$GROUP_STARTUP_DEADLINE_TS" "[rollout]"' in master_block, master_block
+        assert "wait_service_tcp_ready" not in master_block, master_block
+        print("PASS: test_normalized_testbed_master_exports_service_port_for_atomic_group")
+
+
+def test_normalized_testbed_owner_emits_large_file_paths() -> None:  # checks the generated owner entrypoint for the large_file_paths settings
+    with tempfile.TemporaryDirectory(prefix="test_gen_bare_deploy_bash_testbed_owner_large_paths_") as td:
+        tmpdir = Path(td)
+        config_path = tmpdir / "deployconf.normalized.yaml"
+        outdir = tmpdir / "out"
+
+        start_test_bed = _load_python_module(
+            module_name="start_test_bed_for_owner_large_paths_tests",
+            path=DEPLOYMENT_DIR.parent / "fluxon_test_stack" / "start_test_bed.py",
+        )
+        base_cfg = yaml.safe_load(
+            (DEPLOYMENT_DIR.parent / "fluxon_test_stack" / "deployconf_testbed.yml").read_text(encoding="utf-8")
+        )
+        normalized, _ = start_test_bed._normalize_bootstrap_deployconf(deployconf=base_cfg)  # second return value is not used here
+        config_path.write_text(
+            yaml.safe_dump(normalized, sort_keys=False, allow_unicode=False),
+            encoding="utf-8",
+        )
+
+        result = _run_generator(config_path=config_path, outdir=outdir)
+        assert result.returncode == 0, f"generator failed: stdout={result.stdout} stderr={result.stderr}"
+
+        script = (outdir / "entrypoint__fluxon-self-host2-fluxon_core_controller__owner.sh").read_text(encoding="utf-8")
+        assert 'large_file_paths:' in script, script
+        assert 'log_root_path: "${HOSTWORKDIR}/large/log/owner_${NODE_ID}"' in script, script  # runtime tokens must appear unexpanded
+        assert 'cache_root_path: "${HOSTWORKDIR}/large/cache/owner_${NODE_ID}"' in script, script
+        print("PASS: test_normalized_testbed_owner_emits_large_file_paths")
+
+
 def test_bare_child_command_preserves_runtime_hostworkdir_expansion() -> None:
     with tempfile.TemporaryDirectory(prefix="test_gen_bare_deploy_bash_runtime_expand_") as td:
         tmpdir = Path(td)
@@ -600,6 +739,16 @@ def _load_generated_supervisor_module(supervisor_path: Path):
     return module
 
 
+def _load_python_module(*, module_name: str, path: Path):
+    """Import the file at path as module_name, register it in sys.modules, and return it."""
+    module_spec = importlib.util.spec_from_file_location(module_name, path)
+    if module_spec is None or module_spec.loader is None:
+        raise RuntimeError(f"failed to load module: {path}")
+    loaded = sys.modules[module_name] = importlib.util.module_from_spec(module_spec)
+    module_spec.loader.exec_module(loaded)
+    return loaded
+
+
 def _wait_until_selection_present(module, *, label: str, timeout_seconds: int = 15) -> None:
     deadline = time.time() + timeout_seconds
     while time.time() < deadline:
diff --git a/deployment/tests/test_gen_k8s_daemonset.py b/deployment/tests/test_gen_k8s_daemonset.py
index eff0aad..2cd769e 100644
--- a/deployment/tests/test_gen_k8s_daemonset.py
+++ b/deployment/tests/test_gen_k8s_daemonset.py
@@ -248,7 +248,7 @@ def test_ops_entrypoints_use_direct_scripts() -> None:
                         cluster_name: "${FLUXON_CLUSTER_NAME}"
                         member_kind: kv
                         output: web
-                        http_listen_addr: "0.0.0.0:${MASTER__PORT}"
+                        http_listen_addr: "0.0.0.0:${OPS_CONTROLLER__PORT}"
                       YAML
                       ${HOSTWORKDIR}/venv/bin/python -m fluxon_py.runtime.start_ops_controller -c "${WORKDIR}/ops_controller.yaml" -w "${WORKDIR}"
                     node_bind:
diff --git a/deployment/tests/test_log_shard.py b/deployment/tests/test_log_shard.py
new file mode 100644
index 0000000..642e718
--- /dev/null
+++ b/deployment/tests/test_log_shard.py
@@ -0,0 +1,117 @@
+#!/usr/bin/env python3
+
+from __future__ import annotations
+
+import argparse
+import datetime
+import os
+import sys
+import tempfile
+import time
+from pathlib import Path
+from typing import Callable, List, Optional, Tuple
+
+SCRIPT_DIR = Path(__file__).resolve().parent
+DEPLOYMENT_DIR = SCRIPT_DIR.parent
+sys.path.insert(0, str(DEPLOYMENT_DIR))
+
+from utils import log_shard
+
+
+def main() -> int:
+    """Run the selected log_shard checks; return 0 when all pass, otherwise 1."""
+    cli = argparse.ArgumentParser(description="log_shard util test runner")
+    cli.add_argument("--test-id", help="Run only the named test id")
+    selected_test_id = cli.parse_args().test_id
+    failed = 0
+    for _check_id, check_fn in _build_checks(selected_test_id):
+        check_name = check_fn.__name__
+        try:
+            check_fn()
+            print(f"PASS: {check_name}")
+        except Exception as exc:
+            print(f"FAIL: {check_name}: {exc}")
+            failed += 1
+    return 1 if failed else 0
+
+
+def _build_checks(selected_test_id: Optional[str]) -> List[Tuple[str, Callable[[], None]]]:
+    """Return every (test id, callable) pair, or only the pair matching ``selected_test_id``."""
+    checks: List[Tuple[str, Callable[[], None]]] = [
+        ("daily_path_uses_utc_date_suffix", test_daily_path_uses_utc_date_suffix),
+        ("daily_path_uses_test_window_suffix_when_configured", test_daily_path_uses_test_window_suffix_when_configured),
+        ("resolve_readable_prefers_latest_existing_shard", test_resolve_readable_prefers_latest_existing_shard),
+        ("cleanup_keeps_only_retention_window", test_cleanup_keeps_only_retention_window),
+    ]
+    if selected_test_id is None:
+        return checks
+    matching = [entry for entry in checks if entry[0] == selected_test_id]
+    if not matching:
+        raise ValueError(f"unknown --test-id: {selected_test_id}. Available: " + ", ".join(cid for cid, _ in checks))
+    return matching[:1]
+
+
+def test_daily_path_uses_utc_date_suffix() -> None:
+    """The shard file name carries the UTC calendar date of the supplied ``now``."""
+    utc = datetime.timezone.utc
+    shard = log_shard.daily_sharded_log_path(Path("/tmp/test_runner.log"), now=datetime.datetime(2026, 6, 21, 4, tzinfo=utc))
+    assert shard.name == "test_runner.2026-06-21.log", shard
+
+
+def test_resolve_readable_prefers_latest_existing_shard() -> None:
+    """With two dated shards on disk, the readable path resolves to the newer one."""
+    with tempfile.TemporaryDirectory(prefix="test_log_shard_resolve_") as td:
+        older, newer = Path(td) / "service.2026-06-19.log", Path(td) / "service.2026-06-20.log"
+        older.write_text("old\n", encoding="utf-8")
+        newer.write_text("new\n", encoding="utf-8")
+        found = log_shard.resolve_readable_log_path(Path(td) / "service.log")
+        assert found == newer.resolve(), found
+
+
+def test_daily_path_uses_test_window_suffix_when_configured() -> None:
+    """With a 10 s test window, consecutive windows map to consecutive synthetic dates."""
+    utc = datetime.timezone.utc
+    window_env = log_shard.TEST_LOG_SHARD_WINDOW_SECONDS_ENV
+    anchor_env = log_shard.TEST_LOG_SHARD_ANCHOR_UNIX_SECONDS_ENV
+    # Snapshot both overrides so the process environment can be put back afterwards.
+    saved = {key: os.environ.get(key) for key in (window_env, anchor_env)}
+    anchor = datetime.datetime(2026, 6, 21, 0, 0, 0, tzinfo=utc)
+    base = Path("/tmp/test_runner.log")
+    try:
+        os.environ[window_env] = "10"
+        os.environ[anchor_env] = str(int(anchor.timestamp()))
+        # 5 s after the anchor falls in window 0; 15 s after falls in window 1.
+        in_window_0 = log_shard.daily_sharded_log_path(base, now=anchor + datetime.timedelta(seconds=5))
+        in_window_1 = log_shard.daily_sharded_log_path(base, now=anchor + datetime.timedelta(seconds=15))
+        assert in_window_0.name == "test_runner.2026-01-01.log", in_window_0
+        assert in_window_1.name == "test_runner.2026-01-02.log", in_window_1
+    finally:
+        # Restore each variable to its previous value, or remove it if it was unset.
+        for key, previous in saved.items():
+            if previous is None:
+                os.environ.pop(key, None)
+            else:
+                os.environ[key] = previous
+
+
+def test_cleanup_keeps_only_retention_window() -> None:
+    """A 31-day retention removes the shard dated 31 days back and keeps the newer ones."""
+    with tempfile.TemporaryDirectory(prefix="test_log_shard_cleanup_") as td:
+        root = Path(td)
+        today = datetime.datetime.now(datetime.timezone.utc).date()
+
+        def write_shard(days_back: int, body: str) -> Path:
+            shard_date = today - datetime.timedelta(days=days_back)
+            shard = root / f"service.{shard_date.isoformat()}.log"
+            shard.write_text(body, encoding="utf-8")
+            return shard
+
+        stale_path, recent_path, today_path = write_shard(31, "stale\n"), write_shard(30, "recent\n"), write_shard(0, "today\n")
+        log_shard.cleanup_old_daily_sharded_logs(root / "service.log", retention_days=31)
+        assert not stale_path.exists(), stale_path
+        assert recent_path.exists(), recent_path
+        assert today_path.exists(), today_path
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/deployment/tests/test_selection_supervisor_codegen.py b/deployment/tests/test_selection_supervisor_codegen.py
index 02ffa3b..a00caa9 100644
--- a/deployment/tests/test_selection_supervisor_codegen.py
+++ b/deployment/tests/test_selection_supervisor_codegen.py
@@ -19,6 +19,7 @@
 UTILS_DIR = SCRIPT_DIR.parent / "utils"
 sys.path.insert(0, str(UTILS_DIR))
 
+from log_shard import render_module_source as render_log_shard_module_source  # type: ignore
 from selection_supervisor_codegen import render_python_selection_supervisor_module  # type: ignore
 
 
@@ -41,6 +42,9 @@ def _build_checks(selected_test_id: Optional[str]) -> List[Tuple[str, Callable[[
         ("install_subreaper_uses_prctl", test_install_subreaper_uses_prctl),
         ("spawn_child_sanitizes_rdma_driver_env", test_spawn_child_sanitizes_rdma_driver_env),
         ("selection_present_requires_live_child_process", test_selection_present_requires_live_child_process),
+        ("runtime_log_path_uses_daily_shard_files", test_runtime_log_path_uses_daily_shard_files),
+        ("runtime_log_path_expands_hostworkdir_env", test_runtime_log_path_expands_hostworkdir_env),
+        ("runtime_log_shards_roll_and_preserve_content_boundaries", test_runtime_log_shards_roll_and_preserve_content_boundaries),
         ("selection_present_checks_all_live_supervisors", test_selection_present_checks_all_live_supervisors),
         ("zombie_supervisor_is_treated_as_stopped", test_zombie_supervisor_is_treated_as_stopped),
         ("legacy_replace_process_is_observed_as_live_owner", test_legacy_replace_process_is_observed_as_live_owner),
@@ -99,6 +103,10 @@ def _write_runtime_script(root: Path, *, term_seconds: int = 5, kill_seconds: in
         ),
         encoding="utf-8",
     )
+    (root / "log_shard.py").write_text(
+        render_log_shard_module_source(),
+        encoding="utf-8",
+    )
     return supervisor_path
 
 
@@ -561,6 +569,181 @@ def test_selection_present_requires_live_child_process() -> None:
             _terminate_process(supervisor)
 
 
+def test_runtime_log_path_uses_daily_shard_files() -> None:  # child output must land in a dated shard, not in the base log path
+    module = _load_runtime_module()
+    with tempfile.TemporaryDirectory(prefix="test_selection_supervisor_log_shard_") as td:
+        root = Path(td)
+        supervisor_path = _write_runtime_script(root)
+        child_path = root / "child.py"
+        child_path.write_text(
+            "import sys, time\n"
+            "print('hello-log-shard', flush=True)\n"
+            "time.sleep(30)\n",  # presumably keeps the child alive while the log is inspected
+            encoding="utf-8",
+        )
+        label = "DaemonSet/test-log-shard"
+        child_argv = [sys.executable, str(child_path)]
+        base_log_path = root / "test-log-shard.log"  # unsharded base path handed to the supervisor
+        supervisor = _run_supervisor_command(
+            supervisor_path=supervisor_path,
+            label=label,
+            owner_ts_ms=1,
+            state_json=json.dumps(
+                {
+                    "kind": "DaemonSet",
+                    "name": "test-log-shard",
+                    "service_name": "test-log-shard",
+                    "argv": child_argv,
+                    "cwd": str(root),
+                    "log_path": str(base_log_path),
+                },
+                sort_keys=True,
+            ),
+            child_argv=child_argv,
+            cwd=root,
+        )
+        try:
+            _wait_until_present(module, label)
+            deadline = time.time() + 5.0  # poll for at most five seconds
+            shard_path = root / f"test-log-shard.{time.strftime('%Y-%m-%d', time.gmtime())}.log"  # base stem + current UTC date
+            while time.time() < deadline and not shard_path.exists():
+                time.sleep(0.1)
+            assert shard_path.exists(), shard_path
+            assert not base_log_path.exists(), base_log_path  # nothing may be written to the unsharded path
+            assert "hello-log-shard" in shard_path.read_text(encoding="utf-8", errors="replace")
+        finally:
+            _terminate_process(supervisor)  # always stop the spawned supervisor
+
+
+def test_runtime_log_path_expands_hostworkdir_env() -> None:
+    """A ``${HOSTWORKDIR}`` placeholder in ``log_path`` must place the shard under the exported HOSTWORKDIR."""
+    module = _load_runtime_module()
+    with tempfile.TemporaryDirectory(prefix="test_selection_supervisor_expand_hostworkdir_") as td:
+        root = Path(td)
+        hostworkdir = root / "hostworkdir"
+        hostworkdir.mkdir(parents=True, exist_ok=True)
+        supervisor_path = _write_runtime_script(root)
+        child_path = root / "child.py"
+        child_path.write_text(
+            "import time\nprint('expanded-hostworkdir-log', flush=True)\ntime.sleep(30)\n",
+            encoding="utf-8",
+        )
+        label = "DaemonSet/test-expand-hostworkdir"
+        child_argv = [sys.executable, str(child_path)]
+        saved_hostworkdir = os.environ.get("HOSTWORKDIR")
+        supervisor = None
+        try:  # the environment is mutated inside the try so a failed spawn cannot leak HOSTWORKDIR
+            os.environ["HOSTWORKDIR"] = str(hostworkdir)
+            supervisor = _run_supervisor_command(
+                supervisor_path=supervisor_path,
+                label=label,
+                owner_ts_ms=1,
+                state_json=json.dumps(
+                    {
+                        "kind": "DaemonSet",
+                        "name": "test-expand-hostworkdir",
+                        "service_name": "test-expand-hostworkdir",
+                        "argv": child_argv,
+                        "cwd": str(root),
+                        "log_path": "${HOSTWORKDIR}/log/test-expand-hostworkdir.log",
+                    },
+                    sort_keys=True,
+                ),
+                child_argv=child_argv,
+                cwd=root,
+            )
+            _wait_until_present(module, label)
+            deadline = time.time() + 5.0
+            shard_path = hostworkdir / "log" / f"test-expand-hostworkdir.{time.strftime('%Y-%m-%d', time.gmtime())}.log"
+            while time.time() < deadline and not shard_path.exists():
+                time.sleep(0.1)
+            assert shard_path.exists(), shard_path
+            assert "expanded-hostworkdir-log" in shard_path.read_text(encoding="utf-8", errors="replace")
+        finally:
+            if supervisor is not None:  # the spawn itself may have failed
+                _terminate_process(supervisor)
+            os.environ.pop("HOSTWORKDIR", None)
+            if saved_hostworkdir is not None:
+                os.environ["HOSTWORKDIR"] = saved_hostworkdir
+
+
+def test_runtime_log_shards_roll_and_preserve_content_boundaries() -> None:
+    """With a 10 s test window, output printed before and after the roll lands in separate shards."""
+    module = _load_runtime_module()
+    window_env = "FLUXON_TEST_LOG_SHARD_WINDOW_SECONDS"
+    anchor_env = "FLUXON_TEST_LOG_SHARD_ANCHOR_UNIX_SECONDS"
+    saved_env = {key: os.environ.get(key) for key in (window_env, anchor_env)}
+    with tempfile.TemporaryDirectory(prefix="test_selection_supervisor_log_roll_") as td:
+        root = Path(td)
+        supervisor_path = _write_runtime_script(root)
+        child_path = root / "child.py"
+        child_path.write_text(
+            "import sys, time\n"
+            "print('[ops-log-mgmt][phase=before] ts=' + str(int(time.time())), flush=True)\n"
+            "time.sleep(11)\n"
+            "print('[ops-log-mgmt][phase=after] ts=' + str(int(time.time())), flush=True)\n"
+            "time.sleep(30)\n",
+            encoding="utf-8",
+        )
+        label = "DaemonSet/test-log-roll"
+        child_argv = [sys.executable, str(child_path)]
+        base_log_path = root / "test-log-roll.log"
+        stale_shard = root / "test-log-roll.2025-12-01.log"
+        stale_shard.write_text("stale\n", encoding="utf-8")
+        supervisor = None
+        try:  # overrides are set inside the try so a failed spawn cannot leak them to later checks
+            os.environ[window_env] = "10"
+            os.environ[anchor_env] = str(int(time.time()) - 2)
+            supervisor = _run_supervisor_command(
+                supervisor_path=supervisor_path,
+                label=label,
+                owner_ts_ms=1,
+                state_json=json.dumps(
+                    {
+                        "kind": "DaemonSet",
+                        "name": "test-log-roll",
+                        "service_name": "test-log-roll",
+                        "argv": child_argv,
+                        "cwd": str(root),
+                        "log_path": str(base_log_path),
+                    },
+                    sort_keys=True,
+                ),
+                child_argv=child_argv,
+                cwd=root,
+            )
+            _wait_until_present(module, label)
+            first_shard = root / "test-log-roll.2026-01-01.log"
+            second_shard = root / "test-log-roll.2026-01-02.log"
+            deadline = time.time() + 20.0
+            while time.time() < deadline:
+                if first_shard.exists() and second_shard.exists():
+                    first_text = first_shard.read_text(encoding="utf-8", errors="replace")
+                    second_text = second_shard.read_text(encoding="utf-8", errors="replace")
+                    if "[ops-log-mgmt][phase=before]" in first_text and "[ops-log-mgmt][phase=after]" in second_text:
+                        break
+                time.sleep(0.2)
+            assert first_shard.exists(), first_shard
+            assert second_shard.exists(), second_shard
+            assert not stale_shard.exists(), stale_shard
+            shard_names = sorted(path.name for path in root.glob("test-log-roll.*.log"))
+            assert shard_names == ["test-log-roll.2026-01-01.log", "test-log-roll.2026-01-02.log"], shard_names
+            first_text = first_shard.read_text(encoding="utf-8", errors="replace")
+            second_text = second_shard.read_text(encoding="utf-8", errors="replace")
+            assert "[ops-log-mgmt][phase=before]" in first_text, first_text
+            assert "[ops-log-mgmt][phase=after]" not in first_text, first_text
+            assert "[ops-log-mgmt][phase=after]" in second_text, second_text
+            assert "[ops-log-mgmt][phase=before]" not in second_text, second_text
+        finally:
+            if supervisor is not None:  # the spawn itself may have failed
+                _terminate_process(supervisor)
+            for env_key, previous in saved_env.items():
+                if previous is None:
+                    os.environ.pop(env_key, None)
+                else:
+                    os.environ[env_key] = previous
+
+
 def test_selection_present_checks_all_live_supervisors() -> None:
     module = _load_runtime_module()
     label = "DaemonSet/test-present-any-live-child"
@@ -569,7 +752,9 @@ def test_selection_present_checks_all_live_supervisors() -> None:
     original_iter_live_supervisors = module._iter_live_supervisors
     original_count_pid_tree_members = module._count_pid_tree_members
     try:
-        module._iter_live_supervisors = lambda current_label=None: [stale_new, old_live] if current_label == label else []
+        module._iter_live_supervisors = (
+            lambda current_label=None, scope_key=None: [stale_new, old_live] if current_label == label else []
+        )
         module._count_pid_tree_members = lambda pid: {11: 1, 22: 2}[pid]
         assert module._selection_present(label) is True
     finally:
@@ -1135,7 +1320,7 @@ def test_retire_adopted_children_stops_live_roots() -> None:
     calls: List[tuple[str, object]] = []
     try:
         module._direct_live_child_pids = lambda pid: [41, 42] if pid == module.os.getpid() else []
-        module._iter_live_supervisors = lambda label=None: []
+        module._iter_live_supervisors = lambda label=None, scope_key=None: []
         module._stop_pid_tree_batch = lambda roots, label: calls.append(("stop", (list(roots), label)))
         module._reap_terminated_children = lambda: [(41, 0), (42, 0)]
         module._log_reaped_children = lambda **kwargs: calls.append(("reap", kwargs))
@@ -1160,7 +1345,7 @@ def test_retire_adopted_children_preserves_live_supervisor_roots() -> None:
     calls: List[tuple[str, object]] = []
     try:
         module._direct_live_child_pids = lambda pid: [41, 42] if pid == module.os.getpid() else []
-        module._iter_live_supervisors = lambda label=None: [
+        module._iter_live_supervisors = lambda label=None, scope_key=None: [
             module.LiveSupervisor(
                 process_info=module.ProcessInfo(pid=42, ppid=module.os.getpid(), pgid=42, state="S", start_time_ticks=1),
                 owner_ts_ms=7,
diff --git a/deployment/tests/test_start_test_bed_bootstrap_log.py b/deployment/tests/test_start_test_bed_bootstrap_log.py
index 312deea..9f5ef49 100644
--- a/deployment/tests/test_start_test_bed_bootstrap_log.py
+++ b/deployment/tests/test_start_test_bed_bootstrap_log.py
@@ -3,6 +3,7 @@
 from __future__ import annotations
 
 import argparse
+import copy
 import importlib.util
 import io
 import sys
@@ -604,6 +605,7 @@ def test_normalize_bootstrap_deployconf_strips_legacy_master_p2p_listen_port() -
     ops_agent_entrypoint = normalized["service"]["ops_agent"]["entrypoint"]
     assert "p2p_listen_port: 31100" not in master_entrypoint, master_entrypoint
     assert "p2p_listen_port: 12102" in ops_agent_entrypoint, ops_agent_entrypoint
+    assert normalized["service"]["master"]["port"] == 51051, normalized["service"]["master"]
     assert notes == ["service.master.entrypoint: removed legacy master field p2p_listen_port"], notes
     assert "p2p_listen_port: 31100" in deployconf["service"]["master"]["entrypoint"], deployconf
     print("PASS: test_normalize_bootstrap_deployconf_strips_legacy_master_p2p_listen_port")
@@ -789,6 +791,7 @@ def test_normalize_bootstrap_deployconf_rewrites_same_host_local_multi_node_fixe
     assert "--http-addr 0.0.0.0:19390" in normalized["service"]["greptime"]["entrypoint"], normalized["service"]["greptime"]["entrypoint"]
     assert normalized["service"]["tikv_pd"]["port"] == 19400, normalized["service"]["tikv_pd"]
     assert normalized["service"]["tikv"]["port"] == 19410, normalized["service"]["tikv"]
+    assert normalized["service"]["master"]["port"] == 19290, normalized["service"]["master"]
     assert "port: 19290" in normalized["service"]["master"]["entrypoint"], normalized["service"]["master"]["entrypoint"]
     assert "OPS_AGENT_P2P_LISTEN_PORT=19320" in normalized["service"]["ops_agent"]["entrypoint"], normalized["service"]["ops_agent"]["entrypoint"]
     assert "OPS_AGENT_P2P_LISTEN_PORT=19321" in normalized["service"]["ops_agent"]["entrypoint"], normalized["service"]["ops_agent"]["entrypoint"]
@@ -845,11 +848,35 @@ def test_normalize_bootstrap_deployconf_keeps_non_local_or_single_node_ports_unc
         },
     }
     normalized, notes = module._normalize_bootstrap_deployconf(deployconf=deployconf)
-    assert normalized == deployconf, normalized
+    assert normalized["service"]["master"]["port"] == 51051, normalized["service"]["master"]
+    expected = copy.deepcopy(deployconf)
+    expected["service"]["master"]["port"] = 51051
+    assert normalized == expected, normalized
     assert notes == [], notes
     print("PASS: test_normalize_bootstrap_deployconf_keeps_non_local_or_single_node_ports_unchanged")
 
 
+def test_normalize_bootstrap_deployconf_promotes_master_port_from_entrypoint() -> None:
+    """A ``port:`` line inside the master entrypoint is surfaced as ``service.master.port``."""
+    module = _load_start_test_bed_module()
+    entrypoint = (
+        'cat > "${CONFIG_PATH}" <<YAML\n'
+        'instance_key: "unified_master"\n'
+        "port: 51051\n"
+        "YAML\n"
+    )
+    deployconf = {
+        "service": {"master": {"entrypoint": entrypoint}},
+    }
+    normalized, notes = module._normalize_bootstrap_deployconf(deployconf=deployconf)
+    master = normalized["service"]["master"]
+    assert master["port"] == 51051, master
+    assert notes == [], notes
+    # The input mapping itself must not gain the promoted key.
+    assert "port" not in deployconf["service"]["master"], deployconf
+    print("PASS: test_normalize_bootstrap_deployconf_promotes_master_port_from_entrypoint")
+
+
 def test_refresh_cluster_bare_deploy_scripts_copies_local_and_remote_nodes() -> None:
     module = _load_start_test_bed_module()
     with tempfile.TemporaryDirectory(prefix="test_start_test_bed_refresh_bare_") as td:
@@ -1476,6 +1503,10 @@ def main() -> int:
             "normalize_bootstrap_deployconf_keeps_non_local_or_single_node_ports_unchanged",
             test_normalize_bootstrap_deployconf_keeps_non_local_or_single_node_ports_unchanged,
         ),
+        (
+            "normalize_bootstrap_deployconf_promotes_master_port_from_entrypoint",
+            test_normalize_bootstrap_deployconf_promotes_master_port_from_entrypoint,
+        ),
         (
             "refresh_cluster_bare_deploy_scripts_copies_local_and_remote_nodes",
             test_refresh_cluster_bare_deploy_scripts_copies_local_and_remote_nodes,
diff --git a/deployment/utils/log_shard.py b/deployment/utils/log_shard.py
new file mode 100644
index 0000000..415d4ff
--- /dev/null
+++ b/deployment/utils/log_shard.py
@@ -0,0 +1,196 @@
+#!/usr/bin/env python3
+
+from __future__ import annotations
+
+import datetime
+import os
+from pathlib import Path
+from typing import Optional
+
+
+DEFAULT_DAILY_LOG_RETENTION_DAYS = 31
+TEST_LOG_SHARD_WINDOW_SECONDS_ENV = "FLUXON_TEST_LOG_SHARD_WINDOW_SECONDS"
+TEST_LOG_SHARD_ANCHOR_UNIX_SECONDS_ENV = "FLUXON_TEST_LOG_SHARD_ANCHOR_UNIX_SECONDS"
+TEST_LOG_SHARD_BASE_DATE = datetime.date(2026, 1, 1)
+
+
+def _read_test_log_shard_window_seconds() -> Optional[int]:
+    """Return the test-only shard window in seconds, or None when the variable is unset or blank."""
+    raw_value = os.environ.get(TEST_LOG_SHARD_WINDOW_SECONDS_ENV)
+    if raw_value is None or not raw_value.strip():
+        return None
+    # int() raises ValueError on non-numeric text; zero and negative values
+    # are rejected explicitly below with a message naming the variable.
+    window_seconds = int(raw_value.strip())
+    if window_seconds > 0:
+        return window_seconds
+    raise ValueError(
+        f"{TEST_LOG_SHARD_WINDOW_SECONDS_ENV} must be a positive integer, got: {raw_value!r}"
+    )
+
+
+def _read_test_log_shard_anchor_unix_seconds() -> int:
+    """Return the test shard anchor as Unix seconds; raise ValueError when it is unset or blank."""
+    anchor_text = (os.environ.get(TEST_LOG_SHARD_ANCHOR_UNIX_SECONDS_ENV) or "").strip()
+    if anchor_text:
+        return int(anchor_text)
+    raise ValueError(
+        f"{TEST_LOG_SHARD_ANCHOR_UNIX_SECONDS_ENV} is required when {TEST_LOG_SHARD_WINDOW_SECONDS_ENV} is set"
+    )
+
+
+def _resolve_shard_date(ts: datetime.datetime) -> datetime.date:
+    """Map ``ts`` to its shard date: ``ts.date()``, or base date + elapsed test windows when overridden."""
+    window_seconds = _read_test_log_shard_window_seconds()
+    if window_seconds is None:
+        return ts.date()
+    anchor = _read_test_log_shard_anchor_unix_seconds()
+    moment = int(ts.timestamp())
+    windows_elapsed = (moment - anchor) // window_seconds
+    if windows_elapsed >= 0:
+        return TEST_LOG_SHARD_BASE_DATE + datetime.timedelta(days=windows_elapsed)
+    raise ValueError(
+        f"test log shard anchor must not be in the future: anchor={anchor}, ts={moment}"
+    )
+
+
+def daily_sharded_log_path(
+    base_path: Path,
+    *,
+    now: Optional[datetime.datetime] = None,
+) -> Path:
+    """Return the resolved ``<stem>.<shard date>.log`` sibling of ``base_path`` for ``now`` (default: current UTC)."""
+    utc = datetime.timezone.utc
+    moment = datetime.datetime.now(utc) if now is None else now.astimezone(utc)
+    if not base_path.name.endswith(".log"):
+        raise ValueError(f"log base path must end with .log: {base_path}")
+    shard_name = f"{base_path.name[:-4]}.{_resolve_shard_date(moment).isoformat()}.log"
+    return (base_path.parent / shard_name).resolve()
+
+
+def latest_existing_daily_sharded_log_path(base_path: Path) -> Optional[Path]:
+    """Return the newest dated shard next to ``base_path``, else ``base_path`` itself, else None.
+
+    Only regular files named ``<stem>.<ISO date>.log`` in the parent directory count as
+    shards; returned paths are resolved.
+    """
+
+    def unsharded() -> Optional[Path]:
+        return base_path.resolve() if base_path.exists() else None
+
+    name, parent = base_path.name, base_path.parent
+    # Without a .log name or an existing parent directory there is nothing to scan.
+    if not name.endswith(".log") or not parent.exists():
+        return unsharded()
+    prefix, suffix = name[:-4] + ".", ".log"
+    dated = []
+    for entry in parent.iterdir():
+        entry_name = entry.name
+        if not (entry.is_file() and entry_name.startswith(prefix) and entry_name.endswith(suffix)):
+            continue
+        try:
+            shard_date = datetime.date.fromisoformat(entry_name[len(prefix):-len(suffix)])
+        except ValueError:
+            continue
+        dated.append((shard_date, entry))
+    if not dated:
+        return unsharded()
+    # max() returns the first of equal dates, matching a strict "newer than" scan.
+    return max(dated, key=lambda item: item[0])[1].resolve()
+
+
+def resolve_readable_log_path(base_path: Path) -> Optional[Path]:
+    """Return the current shard when it exists, else whatever the latest-existing lookup finds."""
+    todays_shard = daily_sharded_log_path(base_path)
+    found = todays_shard if todays_shard.exists() else latest_existing_daily_sharded_log_path(base_path)
+    return found
+
+
+def cleanup_old_daily_sharded_logs(
+    base_path: Path,
+    *,
+    retention_days: int = DEFAULT_DAILY_LOG_RETENTION_DAYS,
+) -> None:
+    """Delete dated shards of ``base_path`` that fall before the retention window.
+
+    The window covers ``retention_days`` shard dates counting back from the current one, and
+    shards dated on or after the current shard date are never deleted. Non-``.log`` base paths are ignored.
+    """
+    name = base_path.name
+    if not name.endswith(".log"):
+        return
+    today = _resolve_shard_date(datetime.datetime.now(datetime.timezone.utc))
+    oldest_kept = today - datetime.timedelta(days=max(int(retention_days) - 1, 0))
+    prefix, suffix = name[:-4] + ".", ".log"
+    base_path.parent.mkdir(parents=True, exist_ok=True)
+    for entry in base_path.parent.iterdir():
+        entry_name = entry.name
+        if not (entry.is_file() and entry_name.startswith(prefix) and entry_name.endswith(suffix)):
+            continue
+        try:
+            shard_date = datetime.date.fromisoformat(entry_name[len(prefix):-len(suffix)])
+        except ValueError:
+            continue  # the middle part is not an ISO date, so this is not a dated shard
+        if shard_date >= oldest_kept:
+            continue
+        try:
+            entry.unlink()
+        except FileNotFoundError:
+            pass  # the file vanished between listing and unlink
+
+
+def render_module_source() -> str:
+    """Return this module's own source text, read from disk as UTF-8."""
+    return Path(__file__).resolve().read_text(encoding="utf-8")
+
+
+def import_sibling_log_shard():
+    """Load ``log_shard.py`` from this file's directory once and return the cached module afterwards."""
+    import importlib.util
+    import sys
+
+    module_name = "_fluxon_log_shard_runtime"
+    cached = sys.modules.get(module_name)
+    if cached is not None:
+        return cached
+    helper_path = Path(__file__).resolve().with_name("log_shard.py")
+    spec = importlib.util.spec_from_file_location(module_name, helper_path)
+    if spec is None or spec.loader is None:
+        raise RuntimeError(f"failed to load log shard helper: {helper_path}")
+    sys.modules[module_name] = module = importlib.util.module_from_spec(spec)
+    spec.loader.exec_module(module)
+    return module
+
+
+def relay_fd_to_daily_sharded_logs(
+    *,
+    base_log_path: str,
+    read_fd: int,
+    retention_days: int = DEFAULT_DAILY_LOG_RETENTION_DAYS,
+) -> None:
+    """Copy ``read_fd`` into the current shard of ``base_log_path`` until EOF or a read error, then close the fd."""
+    base_path = Path(os.path.abspath(base_log_path))
+    active_path: Optional[Path] = None
+    sink = None
+    try:
+        while True:
+            try:
+                data = os.read(read_fd, 65536)
+            except OSError:
+                data = b""  # a read error ends the relay exactly like EOF
+            if not data:
+                break
+            target = daily_sharded_log_path(base_path)  # re-evaluated for every chunk
+            if target != active_path:
+                if sink is not None:
+                    sink.flush()
+                    sink.close()
+                cleanup_old_daily_sharded_logs(base_path, retention_days=retention_days)
+                target.parent.mkdir(parents=True, exist_ok=True)
+                sink, active_path = target.open("ab", buffering=0), target
+            sink.write(data)
+    finally:
+        if sink is not None:
+            sink.flush()
+            sink.close()
+        os.close(read_fd)
diff --git a/deployment/utils/proc_lifecycle_codegen.py b/deployment/utils/proc_lifecycle_codegen.py
index 31ef2b0..116b0c4 100644
--- a/deployment/utils/proc_lifecycle_codegen.py
+++ b/deployment/utils/proc_lifecycle_codegen.py
@@ -150,22 +150,19 @@ def render_bash_proc_lifecycle_funcs_pid_tree(*, timeouts: StopTimeouts) -> str:
 }}
 
 wait_service_probably_ready_pid_tree() {{
-  # "Probably ready" contract:
-  # - A service is considered probably-ready iff for N consecutive seconds:
-  #   - the supervisor PID exists, and
-  #   - the supervisor PID subtree has at least one other PID besides the supervisor.
-  # - If the child process restarts during the window, we reset the counter and keep waiting,
-  #   until the provided deadline is reached.
-  #
-  # This is used by atomic-group runners to enforce strict start ordering.
+  # Startup gate contract:
+  # - Success means the supervisor PID stays alive across the fixed startup window.
+  # - During this startup window we do not probe service ports or readiness endpoints.
+  # - We intentionally do not require the child to expose ports, endpoints, or even finish
+  #   spawning before the window ends.
   svc="$1"
   root_pid="$2"
-  stable_seconds="$3"
+  startup_window_seconds="$3"
   deadline_ts="$4"
   context="$5"
 
-  if [[ ! "$stable_seconds" =~ ^[0-9]+$ ]] || [ "$stable_seconds" -le 0 ]; then
-    echo "$context probable-ready: invalid stable_seconds=$stable_seconds svc=$svc"
+  if [[ ! "$startup_window_seconds" =~ ^[0-9]+$ ]] || [ "$startup_window_seconds" -le 0 ]; then
+    echo "$context probable-ready: invalid startup_window_seconds=$startup_window_seconds svc=$svc"
     return 1
   fi
   if [[ ! "$deadline_ts" =~ ^[0-9]+$ ]] || [ "$deadline_ts" -le 0 ]; then
@@ -173,30 +170,16 @@ def render_bash_proc_lifecycle_funcs_pid_tree(*, timeouts: StopTimeouts) -> str:
     return 1
   fi
 
-  ok_s=0
   while true; do
-    now=$(date +%s)
-    if [ "$now" -ge "$deadline_ts" ]; then
-      echo "$context probable-ready: deadline exceeded svc=$svc stable_seconds=$stable_seconds pid=$root_pid"
-      return 1
-    fi
-
     if ! _pid_exists "$root_pid"; then
       echo "$context probable-ready: supervisor pid exited svc=$svc pid=$root_pid"
       return 1
     fi
 
-    if _pid_tree_has_child_process "$root_pid"; then
-      ok_s=$((ok_s+1))
-      if [ "$ok_s" -ge "$stable_seconds" ]; then
-        echo "$context probable-ready: ok svc=$svc stable_seconds=$stable_seconds pid=$root_pid"
-        return 0
-      fi
-    else
-      if [ "$ok_s" -ne 0 ]; then
-        echo "$context probable-ready: reset svc=$svc ok_s=$ok_s missing_child=true"
-      fi
-      ok_s=0
+    now=$(date +%s)
+    if [ "$now" -ge "$deadline_ts" ]; then
+      echo "$context probable-ready: ok svc=$svc startup_window_seconds=$startup_window_seconds pid=$root_pid"
+      return 0
     fi
 
     sleep 1
diff --git a/deployment/utils/selection_supervisor_codegen.py b/deployment/utils/selection_supervisor_codegen.py
index 2945ff5..ab76dfc 100644
--- a/deployment/utils/selection_supervisor_codegen.py
+++ b/deployment/utils/selection_supervisor_codegen.py
@@ -13,6 +13,7 @@
 
 
 PYTHON_SELECTION_SUPERVISOR_FILENAME = "selection_supervisor.py"
+LOG_SHARD_HELPER_FILENAME = "log_shard.py"
 
 
 def render_python_selection_supervisor_module(*, timeouts) -> str:
@@ -42,11 +43,13 @@ def render_python_selection_supervisor_module(*, timeouts) -> str:
 import enum
 import fcntl
 import hashlib
+import importlib.util
 import json
 import os
 import signal
 import subprocess
 import sys
+import threading
 import time
 from dataclasses import dataclass
 from pathlib import Path
@@ -62,6 +65,37 @@ def render_python_selection_supervisor_module(*, timeouts) -> str:
 SANITIZED_CHILD_ENV_KEYS = ("RDMAV_DRIVERS", "IBV_DRIVERS")
 
 _shutdown_requested = False
+_STDIO_ROUTER_THREAD = None
+_STDIO_ROUTER_KEEPALIVE_FP = None
+
+
+def _load_log_shard_helper():
+    candidates = []
+    raw_file = globals().get("__file__")
+    if isinstance(raw_file, str) and raw_file:
+        candidates.append(Path(raw_file).resolve().with_name("__LOG_SHARD_HELPER_FILENAME__"))
+    cwd = Path.cwd().resolve()
+    candidates.append(cwd / "__LOG_SHARD_HELPER_FILENAME__")
+    candidates.append(cwd / "deployment" / "utils" / "__LOG_SHARD_HELPER_FILENAME__")
+    for entry in sys.path:
+        if not isinstance(entry, str) or not entry:
+            continue
+        candidates.append(Path(entry).resolve() / "__LOG_SHARD_HELPER_FILENAME__")
+    helper_path = candidates[0]
+    for candidate in candidates:
+        if candidate.is_file():
+            helper_path = candidate
+            break
+    spec = importlib.util.spec_from_file_location("_fluxon_selection_log_shard", helper_path)
+    if spec is None or spec.loader is None:
+        raise RuntimeError(f"failed to load log shard helper: {helper_path}")
+    module = importlib.util.module_from_spec(spec)
+    sys.modules[spec.name] = module
+    spec.loader.exec_module(module)
+    return module
+
+
+_LOG_SHARD = _load_log_shard_helper()
 
 
 def main() -> int:
@@ -96,6 +130,8 @@ def main() -> int:
     stop_parser.add_argument("--missing-ok", action="store_true")
 
     args = parser.parse_args()
+    runtime_state_for_stdio = _runtime_state_for_startup_stdio(args)
+    _redirect_process_stdio_to_runtime_log(runtime_state_for_stdio)
     # English note:
     # - The supervisor module is invoked both as a long-running `run` daemon and as a short-lived
     #   `stop` helper from ops-managed reconcile loops.
@@ -356,6 +392,16 @@ def _parse_run_command_spec(args: argparse.Namespace) -> RunCommandSpec:
     )
 
 
+def _runtime_state_for_startup_stdio(args: argparse.Namespace) -> Optional[SelectionRuntimeState]:
+    if str(args.command) != "run":
+        return None
+    label = _require_non_empty_str(args.label, "label")
+    state_json = args.state_json
+    if state_json is None:
+        return None
+    return _build_runtime_state(label=label, state_json=state_json)
+
+
 def _requested_phase1_overlap_with_applyless_owner(
     current_owner: Optional[LiveSupervisor],
     requested_runtime_state: Optional[SelectionRuntimeState],
@@ -438,6 +484,7 @@ def _run_supervisor(spec: RunCommandSpec, selection_lock_fp=None) -> int:
 
     restart_timestamps: List[float] = []
     backoff_seconds = spec.restart_delay_seconds
+    _redirect_process_stdio_to_runtime_log(runtime_state)
 
     while True:
         _log_reaped_children(
@@ -661,6 +708,10 @@ def _sanitize_child_ld_library_path(raw_value: Optional[str]) -> Optional[str]:
     return ":".join(sanitized_entries)
 
 
+def _expand_runtime_state_path(value: str) -> str:
+    return os.path.expandvars(value)
+
+
 def _spawn_child(command: List[str], workdir: Optional[Path]) -> subprocess.Popen[bytes]:
     def _set_pdeathsig_sigterm() -> None:
         libc = ctypes.CDLL("libc.so.6", use_errno=True)
@@ -687,6 +738,40 @@ def _set_pdeathsig_sigterm() -> None:
     )
 
 
+def _redirect_process_stdio_to_runtime_log(runtime_state: Optional[SelectionRuntimeState]) -> None:
+    global _STDIO_ROUTER_THREAD
+    global _STDIO_ROUTER_KEEPALIVE_FP
+    if runtime_state is None:
+        return
+    if _STDIO_ROUTER_THREAD is not None:
+        return
+    base_log_path = _require_non_empty_str(runtime_state.log_path, "state.log_path")
+    read_fd, write_fd = os.pipe()
+    router_keepalive = os.dup(write_fd)
+
+    def _router_loop() -> None:
+        _LOG_SHARD.relay_fd_to_daily_sharded_logs(
+            base_log_path=base_log_path,
+            read_fd=read_fd,
+            retention_days=_LOG_SHARD.DEFAULT_DAILY_LOG_RETENTION_DAYS,
+        )
+
+    router = threading.Thread(
+        target=_router_loop,
+        name="selection-supervisor-stdio-log-router",
+        daemon=True,
+    )
+    router.start()
+    os.dup2(write_fd, sys.stdout.fileno())
+    os.dup2(write_fd, sys.stderr.fileno())
+    sys.stdout = os.fdopen(sys.stdout.fileno(), "w", encoding="utf-8", buffering=1, closefd=False)
+    sys.stderr = os.fdopen(sys.stderr.fileno(), "w", encoding="utf-8", buffering=1, closefd=False)
+    try:
+        os.close(write_fd)
+    except OSError:
+        pass
+    _STDIO_ROUTER_KEEPALIVE_FP = os.fdopen(router_keepalive, "w", encoding="utf-8", buffering=1)
+    _STDIO_ROUTER_THREAD = router
 def _retired_and_preserved_adopted_roots(root_pid: int) -> Tuple[List[int], List[int]]:
     adopted_roots = _direct_live_child_pids(root_pid)
     if not adopted_roots:
@@ -788,7 +873,9 @@ def _selection_runtime_state_from_raw(
         apply_id=_require_optional_non_empty_str(raw.get("apply_id"), "state.apply_id"),
         argv=_require_non_empty_str_list(raw.get("argv"), "state.argv"),
         cwd=_require_optional_non_empty_str(raw.get("cwd"), "state.cwd"),
-        log_path=_require_non_empty_str(raw.get("log_path"), "state.log_path"),
+        log_path=_expand_runtime_state_path(
+            _require_non_empty_str(raw.get("log_path"), "state.log_path")
+        ),
         owner_ts_ms=owner_ts_ms,
         started_ts_ms=started_ts_ms,
     )
@@ -1337,6 +1424,7 @@ def _signal_pid_tree(root_pid: int, sig: signal.Signals, label: str) -> None:
 """
     return (
         textwrap.dedent(template)
+        .replace("__LOG_SHARD_HELPER_FILENAME__", LOG_SHARD_HELPER_FILENAME)
         .replace("__TERM_S__", str(term_s))
         .replace("__KILL_S__", str(kill_s))
         .replace("__SUPERSEDE_S__", str(supersede_s))
diff --git "a/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md" "b/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
new file mode 100644
index 0000000..852b73f
--- /dev/null
+++ "b/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
@@ -0,0 +1,217 @@
+# Fluxon 配置总览
+
+## 1. 结论
+
+本文只回答一件事：Fluxon 仓库里有哪些稳定配置入口，它们各自负责什么，校验后会变成什么运行时结构。
+
+**稳定结论：**
+
+- 配置输入和运行时结构是分开的，YAML 只负责声明意图，`verify()` / `parse_*()` 负责收敛成唯一可执行结果。
+- 共享契约优先放在 `fluxon_commu_contract` 和 `fluxon_cli::config` 这类公共模块里，业务包更多是复用或重导出。
+- `host:port`、`http(s)://...`、`cluster-scoped path` 这几类格式都被严格区分，不靠探测或模糊回退。
+- 仓库里的 checked-in YAML 分两类：运行时契约和环境/测试契约。前者要强校验，后者主要用于把开发、部署、测试流水线接起来。
+
+```mermaid
+flowchart TD
+    A[build_config_ext.yml<br/>build_config_ext_static.yml] --> B[setup_and_pack / repo_config_utils]
+    C[deployment/deployconf.yaml] --> D[deployment utils / fluxon_py tests]
+    E[fluxon_py/tests/test_config.yaml] --> D
+    F[fluxon_test_stack/*.yaml] --> G[teststack runner / start_test_bed]
+    H[fluxon_cli/src/config.rs] --> I[monitor / UI]
+    J[fluxon_kv/src/config.rs] --> K[KV runtime]
+    L[fluxon_fs_core/src/config.rs] --> M[FS runtime]
+    N[fluxon_commu_contract/src/config.rs] --> K
+    N --> M
+```
+
+## 2. 配置地图
+
+| 配置家族 | 入口文件 / 模块 | 主要消费者 | 作用 |
+| --- | --- | --- | --- |
+| 仓库环境配置 | `build_config_ext.yml` | Rust KV 测试族、`fluxon_py/tests/test_lib.py`、`setup_and_pack` 打包/校验脚本、TestStack 的 `bin_kvtest` 用例 staging | 提供 etcd、Prometheus、remote write 等开发/测试基线 |
+| 静态构建配置 | `build_config_ext_static.yml` | `setup_and_pack/pack_release.py`、`build_pack_fluxonkv_pylib_img.py`、Nix 打包链路 | 固定 wheel / manylinux 版本 |
+| 部署配置 | `deployment/deployconf.yaml` | 部署脚本、`fluxon_py` 测试入口、TestStack 生成/消费链路 | 提供集群节点、服务地址和全局环境变量 |
+| Python 测试配置 | `fluxon_py/tests/test_config.yaml` | `fluxon_py` 测试入口、测试辅助库、deployconf 解析链路 | 连接 deployconf，选择 KV backend 类型 |
+| 开发/打包环境配置 | `setup_and_pack/setup_dev_env/*.yaml`、`setup_and_pack/build_pack_fluxonkv_pylib_img/*.yaml`、`setup_and_pack/nix/*.yaml`、`pub_prepare_build.yaml` | `setup_and_pack` 脚本 | 提供开发机和打包流水线的环境输入 |
+| TestStack 配置 | `fluxon_test_stack/ci_test_list.yaml`、`start_test_bed.yaml`、`gitops.yaml` | `test_runner.py`、`start_test_bed.py` | 定义 suite、testbed、GitOps 和 UI 入口 |
+| CLI 监控配置 | `fluxon_cli/src/config.rs` | `master_ui_monitor`、`test_runner_ui` | 提供监控页和查询页配置 |
+| KV 配置 | `fluxon_kv/src/config.rs` | KV master / owner / external | 定义 KV 运行时角色和校验规则 |
+| FS 配置 | `fluxon_fs_core/src/config.rs` | FS master / agent / panel | 定义 FS cache、master、panel、权限和转移态 |
+| 共享传输配置 | `fluxon_commu_contract/src/config.rs`、`transfer_engine/surface.rs` | KV / FS / commu | 提供 `NetworkConfig`、`ProtocolType`、`TransferEngineType` |
+
+## 3. 通用规则
+
+| 规则 | 含义 |
+| --- | --- |
+| `serde(deny_unknown_fields)` | 运行时 YAML 默认拒绝未知字段 |
+| `from_file` / `from_str` + `verify` | 先解析，再收敛成强类型运行时配置 |
+| `YamlNullable<T>` | 只在需要区分“缺失 / null / value”时使用 |
+| `host:port` 与 `http(s)://...` 分离 | etcd / deployconf 常用前者，监控 / Prometheus 常用后者 |
+| 派生值要显式写回 | 例如 cluster-scoped 路径、默认表名、默认 transport_mode |
+
+## 4. 环境与部署配置
+
+### 4.1 `build_config_ext.yml`
+
+这是仓库级开发环境配置，不是业务 runtime config。
+
+| 字段 | 规则 | 主要用途 |
+| --- | --- | --- |
+| `etcd` | 必填，`host:port` | 供 Rust / Python / 测试工具读取 etcd 地址 |
+| `prom` | 必填，`http(s)://.../v1` 或 `.../api/v1` | 供 Grafana / TSDB 查询 URL 使用 |
+| `prom_remote_write_url` | 必填，`http(s)://...` | 供 remote write 使用 |
+
+`setup_and_pack/utils/repo_config_utils.py` 里保留了 `prometheus_remote_write_url` 的旧名兼容读取，但这是 build tooling 的过渡路径，不是推荐的新契约。
+
+### 4.2 `build_config_ext_static.yml`
+
+当前只固定一个值：
+
+| 字段 | 规则 |
+| --- | --- |
+| `manylinux_version` | 必填，当前只允许 `2_28` |
+
+### 4.3 `deployment/deployconf.yaml`
+
+这是部署和打包流水线的核心配置。当前稳定消费面主要有三块：
+
+| 区块 | 关键字段 | 作用 |
+| --- | --- | --- |
+| `cluster_nodes` | 节点列表 | 作为 placeholder 解析的基础 |
+| `service` | 服务节点映射 | 供部署脚本和测试脚本查 service ip:port |
+| `global_envs` | `ETCD_FULL_ADDRESS`、`FLUXON_PROMETHEUS_BASE_URL`、`MONITOR_GREPTIMEDB_WRITE_URL`、`FLUXON_CLUSTER_NAME`、`FLUXON_SHARED_MEM`、`FLUXON_SHARED_FILE` | 供部署/测试代码读取集群级 authority |
+
+`global_envs` 允许占位符解析，先由 `cluster_nodes` + `service` 构造映射，再把变量落成最终值。
+
+### 4.4 `fluxon_py/tests/test_config.yaml`
+
+这是一层测试入口配置，不是 runtime 部署配置。
+
+| 字段 | 规则 |
+| --- | --- |
+| `deployconf_path` | 必填，指向共享 deployconf |
+| `kv_svc_type` | 必填，当前测试助手只接受已知 backend 类型 |
+
+测试代码里还保留了 mooncake 相关读取函数，但 checked-in 的最小样例只使用上面两个字段。
+
+### 4.5 `fluxon_test_stack/*`
+
+TestStack 的配置已经单独有设计文档，这里只收口成四条要点：
+
+- `ci_test_list.yaml` 定义 suite 空间。
+- `start_test_bed.yaml` 定义共享 testbed 和 UI。
+- `gitops.yaml` 定义 GitOps 轮询和记录。
+- 生成的 `deployconf_testbed.yml` 是派生产物，不是手工主配置。
+
+## 5. 运行时配置
+
+### 5.1 KV
+
+KV 的入口在 `fluxon_kv/src/config.rs`，对外分成 master 和 client 两个稳定 YAML：
+
+| 类型 | 作用 |
+| --- | --- |
+| `MasterConfigYaml` | master 节点输入 |
+| `ClientConfigYaml` | owner / external 输入 |
+| `TestSpecConfig` | 测试和实验分支开关 |
+| `MonitoringConfigYaml` | master 监控块 |
+| `NetworkConfig` | 网络白名单和 IP 映射，共享自 `fluxon_commu_contract` |
+
+核心分流规则：
+
+- `contribute_to_cluster_pool_size` 缺失或全零时，进入 external。
+- `contribute_to_cluster_pool_size.dram > 0` 时，进入 owner。
+- `test_spec_config.side_transfer_role = worker` 时，走 side-transfer worker 分支，强制 `TransferEngineType::P2p`。
+
+主要约束：
+
+- `monitoring` 在 master 上必填。
+- `master_ui` 依赖 `monitoring`，并作为嵌入式 monitor HTTP 服务启动。
+- `shared_memory_path` / `shared_file_path` 会拼成 `cluster_name` 作用域路径。
+- `etcd_addresses` 在 client 侧保留 raw `host:port` 和归一化 `http://host:port` 两份视图。
+- zero-contribution `external` / side worker 的 `etcd_addresses`、`sub_cluster`、`large_file_paths` 由 owner 发布的 `shared.json` 继承；本地配置面只保留 attach owner 所需的共享 bundle 锚点和本进程参数。
+
+更细的调用时序、持有生命周期和并发规则分别在 `kv_1_概览与分层.md`、`kv_2_调用时序.md`、`kv_3_参数与并发.md`、`kv_4_allocation_segment_holder生命周期.md` 里展开。
+
+### 5.2 FS
+
+FS 的配置集中在 `fluxon_fs_core/src/config.rs`，上层 `fluxon_fs/src/config.rs` 只是重导出。
+
+| 配置块 | 入口 | 结果 |
+| --- | --- | --- |
+| cache | `fluxon_fs.cache` | `FluxonFsGlobalConfig` |
+| master | `fluxon_fs.master` | `FluxonFsMasterConfig` |
+| master_panel | `fluxon_fs.master_panel` | `FluxonFsMasterPanelConfig` |
+
+`fluxon_fs.cache` 的核心字段：
+
+- `stale_window_ms` 必须 `> 0`。
+- `write_session_target_inflight_bytes` 可缺省，默认 128 MiB。
+- `rules[*]` 需要绝对路径、合法 cache/write 模式、合法前缀和非零 cache 上限。
+- `exports[*]` 需要绝对路径；`nodes` 缺失时表示 `AgentRegistry`，给出时表示 `StaticNodes`。
+
+`fluxon_fs.master` 的核心字段：
+
+- `instance_key` 必填。
+- `pull_interval_ms` 可选，但如果给出必须 `> 0`。
+- 旧的 `fluxon_fs.rpc` 和 `rpc_timeout_ms` 已移除。
+
+`fluxon_fs.master_panel` 的核心字段：
+
+- `listen_addr`、`public_base_url`、`prometheus_base_url`、`access_db_path` 都是必需基线。
+- `bootstrap_access_model` 是面板的启动授权模型。
+- `transfer_state_store` 当前稳定实现是 `tikv`。
+- `s3_gateway` 负责对象请求和 KV miss 策略。
+
+FS 还把访问模型拆成两层：
+
+- `access_model` 是用户/权限的输入模型。
+- `runtime_access_model` 是 runtime 使用的派生模型，密码会被哈希，不再原样保留。
+
+### 5.3 CLI 监控
+
+`fluxon_cli/src/config.rs` 定义统一监控页配置，KV 的 `master_ui` 和 TestStack 的 UI 都复用它。
+
+| 类型 | 关键字段 |
+| --- | --- |
+| `MonitorConfigYaml` | `etcd_endpoints`、`prometheus_base_url`、`cluster_name`、`member_kind`、`output` |
+| 可选项 | `mq_unique_key_prefixes`、`http_listen_addr`、`greptime_sql` |
+
+主要约束：
+
+- `etcd_endpoints` 必须非空且带 scheme。
+- `prometheus_base_url` 必须带 scheme。
+- `mq_unique_key_prefixes` 给出时不能为空，也不能带前后空白。
+- `greptime_sql` 可以显式提供；如果 `prometheus_base_url` 指向 Greptime 的 `/v1/prometheus`，会自动派生默认 SQL 连接信息。
+
+### 5.4 共享传输契约
+
+`fluxon_commu_contract` 提供多个被 KV / FS 共同复用的基础类型：
+
+| 类型 | 取值 | 作用 |
+| --- | --- | --- |
+| `ProtocolType` | `Tcp` / `Rdma` | 输入协议选择 |
+| `TransferEngineType` | `Closed` / `P2p` | 传输引擎分支 |
+| `TransferBackendActivationMode` | 三个显式分支 | 控制 backend 激活方式 |
+| `NetworkConfig` | `subnet_whitelist`、`primary_ip_to_extended_ips` | 网络白名单和 IP 扩展映射 |
+
+这些类型是共享契约，不属于某一个子系统的私有配置。
+
+## 6. 配置之间的关系
+
+| 关系 | 说明 |
+| --- | --- |
+| build_config_ext -> deployment/test | 先确定环境基线，再给 runtime 配置提供 host、URL、路径 |
+| deployconf -> test_config | Python 测试配置通过 `deployconf_path` 指向共享部署配置 |
+| deployconf -> teststack | `start_test_bed` 和 `test_runner` 读取派生后的 testbed deployconf |
+| commu_contract -> KV / FS | `ProtocolType`、`TransferEngineType`、`NetworkConfig` 是共享底座 |
+| CLI config -> KV / TestStack UI | master UI、runner UI 复用同一个 monitor config 契约 |
+
+## 7. 读法建议
+
+如果你只想看某一块的细节，按这个顺序读：
+
+1. 环境/部署先看 `deployment/utils/deployconf_config_utils.py` 和 `fluxon_util/src/dev_config.rs`。
+2. KV 先看 `fluxon_kv/src/config.rs`，再接 `kv_1` 到 `kv_4`。
+3. FS 先看 `fluxon_fs_core/src/config.rs`，再看 `用户 - 5 - FS接口.md`。
+4. TestStack 直接看 `teststack_1_当前架构与CI测试流程.md`。
diff --git "a/fluxon_doc_cn/design/log_1_\346\234\254\345\234\260\346\226\207\344\273\266\346\227\245\345\277\227\344\270\216Greptime_OTLP\345\257\274\345\207\272\351\223\276\350\267\257.md" "b/fluxon_doc_cn/design/log_1_\346\234\254\345\234\260\346\226\207\344\273\266\346\227\245\345\277\227\344\270\216Greptime_OTLP\345\257\274\345\207\272\351\223\276\350\267\257.md"
new file mode 100644
index 0000000..fd81c45
--- /dev/null
+++ "b/fluxon_doc_cn/design/log_1_\346\234\254\345\234\260\346\226\207\344\273\266\346\227\245\345\277\227\344\270\216Greptime_OTLP\345\257\274\345\207\272\351\223\276\350\267\257.md"
@@ -0,0 +1,414 @@
+# Fluxon Log 设计 1 - 统一 log 标准与 Greptime OTLP 导出链路
+
+## 0. 总起
+本文定义 Fluxon 服务平面的统一日志标准。主线代码落在 `fluxon_rs/fluxon_kv/src/config.rs`、`fluxon_rs/fluxon_kv/src/lib.rs`、`fluxon_rs/fluxon_util/src/log.rs`、`fluxon_rs/fluxon_observability/src/greptime_otlp_tracing.rs`、`fluxon_rs/fluxon_observability/src/greptime_otlp_log_orchestrator.rs` 和 `fluxon_rs/fluxon_observability/src/greptime_otlp_log.rs`。
+
+稳定结论先说死：
+
+- 本地文件日志始终启用，作为可回放的安全网。
+- Greptime OTLP 导出由 `master.monitoring.otlp_log_api` 控制，`master` 负责配置源，`owner` / `external` 只消费广播。
+- `testbed` 是独立的 `log_service_kind`，启动器、runner、UI 和 workload 统一按同一套日志语义落盘。
+- 当前导出链路采用 best-effort 策略，不阻塞主业务路径。
+
+本文重点回答四个问题：
+
+1. 各条日志链路当前落在哪些目录边界里。
+2. 当前 canonical 文件名、按天分片和 31 天清理语义是什么。
+3. Rust / Python 之间哪些 contract 已经对齐，哪些还没有。
+4. 当前实现里哪些地方已经收口，哪些地方仍是未完全收口点。
+
+KV 里的 `external` 与 side worker 都只消费 owner 感知结果。当前稳定 contract 是：它们显式配置 `shared_memory_path` / `shared_file_path` 作为 attach owner 的共享 bundle 锚点，`large_file_paths` 则从 owner 发布的 `shared.json` 继承；日志和 cache 从启动起就直接落到 owner 派生出来的大文件目录，不再要求 zero-contribution 侧另配一份本地 large root。
+
+## 1. 目录边界
+目录边界只管物理隔离，不管统一 root。统一的是命名、元数据、归档窗口和清理语义。
+
+### 1.1 KV
+- `master` 以 `log_dir` 作为本地主日志根，并在其下派生 cluster-scoped runtime 日志目录。
+- `owner`、`external` 和 side worker 共享同一个 share 根，用来放 `mmap.file`、`shared.json`、peer metadata 和 side transfer 相关文件；目标态是单一 `share_path`，当前实现仍由 `shared_memory_path` 与 `shared_file_path` 两条配置承载（见 6.1）。
+- `owner` 的 `large_file_paths` 定义 runtime log、cache 等大文件资产的物理根目录。
+- `external` 和 side worker 不再单独声明自己的 `large_file_paths`。它们在 zero-contribution bootstrap 阶段从 owner `shared.json` 继承同一组大文件根目录，然后直接复用 owner 派生出来的 runtime log / cache 边界。
+
+### 1.2 ops / bare shared supervisor control plane
+这里不要把 `ops` 和 `bare` 理解成两套彼此独立的面。两者确实共用同一个 `selection_supervisor.py + log_shard.py` 实现源，但当前实际落盘边界不是一棵完全统一的目录树。
+
+先区分两个层次：
+
+| 层次 | 稳定根 | 主要内容 |
+| --- | --- | --- |
+| `deployconf -> gen_bare -> bare bootstrap` | `hostworkdir` | generated control scripts、bare 服务日志 |
+| `ops` runtime | `workdir` | runtime config、embedded supervisor runtime、ops-managed workload 日志 |
+
+其中：
+
+- `hostworkdir` 是节点级宿主根，用来承载 deployer 下发产物、bare 控制脚本和其他需要跨进程稳定复用的目录。
+- `workdir` 是某个具体进程实例自己的运行子目录，用来承载该实例的 runtime config、embedded supervisor runtime 和它托管出来的 workload 日志。
+- 位置关系上，当前 self-host deployconf 里 `workdir` 通常是 `hostworkdir` 的子目录；语义关系上，`workdir` 仍然只是“某个实例的运行子树”，不能反过来代表整个 `hostworkdir`。
+
+bare 稳定根当前可以直观看成：
+
+```text
+${HOSTWORKDIR}/
+  log/
+    ops_controller.<YYYY-MM-DD>.log
+    ops_agent.<YYYY-MM-DD>.log
+    <bare_service_name>.<YYYY-MM-DD>.log
+  gen_bare_deploy_bash/
+    start_ops_controller.sh
+    start_ops_agent.sh
+    start_<service>.sh
+    stop_ops_controller.sh
+    stop_ops_agent.sh
+    stop_<service>.sh
+    start_<atomic_group>.sh
+    stop_<atomic_group>.sh
+    selection_supervisor.py
+    log_shard.py
+    entrypoint__<workload_name>.sh
+```
+
+当前 self-host deployconf 下，`hostworkdir` 与 `ops workdir` 的实际位置关系可以直观看成：
+
+```text
+${HOSTWORKDIR}/
+  gen_bare_deploy_bash/
+    ...
+  log/
+    ops_controller.<YYYY-MM-DD>.log
+    ops_agent.<YYYY-MM-DD>.log
+    <bare_service_name>.<YYYY-MM-DD>.log
+  ops_controller/
+    ops_controller.yaml
+    selection_supervisor/
+      selection_supervisor.py
+      log_shard.py
+    log/
+      workload__<workload_kind>__<workload_name>.<YYYY-MM-DD>.log
+  ops_agent/
+    <NODE_ID>/
+      ops_agent.yaml
+      selection_supervisor/
+        selection_supervisor.py
+        log_shard.py
+      log/
+        workload__<workload_kind>__<workload_name>.<YYYY-MM-DD>.log
+```
+
+这里再把 contract 说清楚：
+
+- `${HOSTWORKDIR}/gen_bare_deploy_bash/` 里的 `start_*.sh` / `stop_*.sh` 是 generated control scripts，是这套 shared supervisor 控制面的入口脚本，不是另一套独立 authority。
+- bare 这一层的稳定逻辑基名仍然是 `${HOSTWORKDIR}/log/<service_name>.log`，shared supervisor runtime 再把它收口为 `${HOSTWORKDIR}/log/<service_name>.<YYYY-MM-DD>.log`。
+- ops-managed workload 这一层的稳定逻辑基名则是 `${WORKDIR}/log/workload__<workload_kind>__<workload_name>.log`，shared supervisor runtime 再把它收口为 `${WORKDIR}/log/workload__<workload_kind>__<workload_name>.<YYYY-MM-DD>.log`。
+- 两层真正共享的是 `selection_supervisor.py + log_shard.py` 这组控制与滚动实现，不是“所有路径和文件名完全一样”。
+
+在当前 self-host deployconf 示例里：
+
+- `ops_controller` 的 workdir 是 `${HOSTWORKDIR}/ops_controller`
+- `ops_agent` 的 workdir 是 `${HOSTWORKDIR}/ops_agent/${NODE_ID}`
+
+### 1.3 testbed
+- `workdir`、`run_dir` 分别承担 launcher、runner、UI、workload 的 run-scoped 落盘边界。
+- `testbed` 必须显式作为 `log_service_kind` 出现，不再用泛化名称代替。
+- launcher 和 workload 的目录语义要和 ops 对齐。
+- 当前优先级不是先把 testbed 做到完美支持，而是先把 ops 长时服务日志 contract 讲清楚并收口；testbed 继续按“服务级日志”和“case artifact”分开讨论。
+
+### 1.4 FS
+- `shared_file_path` 与 `export.remote_root_dir_abs` 分开使用。
+- 前者负责共享 attachment 边界。
+- 后者负责业务数据边界。
+
+这里的目标很明确：目录可以不同，语义必须一致。`log`、`cache`、`shared attachment`、`workload data` 不能混在同一个边界里。
+
+## 2. 文件命名
+当前实现里的文件命名还没有完全统一，但已经可以明确分成下面几类。
+
+| 类别 | 当前逻辑基名 | 当前实际落盘 |
+| --- | --- | --- |
+| KV runtime | `fluxon-kv-<instance_key>.log` | `fluxon-kv-<instance_key>.<YYYY-MM-DD>.log` |
+| bare 服务日志 | `<service_name>.log` | `<service_name>.<YYYY-MM-DD>.log` |
+| ops-managed workload | `workload__<workload_kind>__<workload_name>.log` | `workload__<workload_kind>__<workload_name>.<YYYY-MM-DD>.log` |
+| testbed 服务日志 | `test_runner.log` / `test_runner_ui.log` | `test_runner.<YYYY-MM-DD>.log` / `test_runner_ui.<YYYY-MM-DD>.log` |
+| KV side worker stdio | `side_worker_<worker_idx>.stdout.log` / `side_worker_<worker_idx>.stderr.log` | 当前还没补日期分片 |
+
+补充说明：
+
+- KV runtime 日志当前仍由 `fluxon_util::init_log(...)` 创建，`run_master_impl(...)` 和 `run_client_impl(...)` 都会初始化这套本地文件日志，所以 `master`、`owner`、`external` 这些 KV 运行时进程当前确实都会产生这类文件。
+- `ops` 里还保留一些特例命名，例如 `smoke.log`、`smoke_bare.log`、`smoke_workloads_bare.log`。这些都属于当前实现尚未收口的历史命名。
+- `testbed` 当前仍然没有单一 canonical log filename。服务级日志已经补上时间分片，但 `ci_runner` 等 case 级日志仍主要落在 `results/<case_id>/run_<N>/logs/**` 与 `summary.yaml`、`exception.txt`、`ci.log` 这类 run artifact 里。
+
+清理只依据文件名里约定好的日期分片字段，不按目录数量、文件大小或历史批次做判断。这样本地清理和 Greptime retention 才能共享同一时间窗口。
+
+## 3. 元数据字段
+这一节描述的是当前 KV OTLP 导出链路已经实际写入 Greptime 的元数据字段。
+
+| 字段 | 含义 |
+| --- | --- |
+| `service.name` | 当前固定为 `fluxon` |
+| `fluxon_cluster_name` | 集群名 |
+| `fluxon_member_kind` | 当前业务类型标签，例如 `kv` |
+| `fluxon_role` | 当前进程角色标签，例如 `master`、`owner_client`、`external_client` |
+| `fluxon_member_id` | 当前实例标识 |
+
+当前实现里的日志元数据仍然是围绕 `cluster_name`、`member_kind`、`role`、`member_id` 这组字段组织的；`log_service_kind`、`log_kind`、`process_role`、`instance_key`、`workload_kind`、`workload_name` 这些更细的统一字段，目前还没有完整进入导出链路。
+
+## 4. 归档、超时与清理
+本地文件日志按天滚动归档，默认保留 31 天。清理时只扫描 canonical log file name，并按命名约定提取日期分片删除过期文件，不按文件数量或目录总量触发。
+
+流式备份和 OTLP 导出也服从同一套窗口：
+
+| 项目 | 规则 |
+| --- | --- |
+| 导出策略 | best-effort，不阻塞主业务路径 |
+| 队列满 | 允许丢弃，并保留可观测信号 |
+| 发送失败 | 允许跳过当前 batch，本地文件仍在 |
+| 停机行为 | shutdown 时执行 best-effort flush |
+| 超时语义 | 单次导出必须有硬上界，不能无限挂起 |
+
+Greptime 侧的 retention / TTL 也按同一日期窗口收口，保证本地与远端的保留语义一致。这里要把远端清理语义说死：写入 `fluxon_logs` 的日志记录默认只保留与本地相同的 31 天窗口（约 1 个月），超过窗口的数据必须由 Greptime 表级 TTL 或定时清理任务删除，不能只依赖查询层按时间过滤“看不见旧数据”。
+
+如果后续本地窗口仍保持 31 天，那么 Greptime 侧也应保持同一 31 天窗口；如果本地窗口改为新的 canonical 值，远端 TTL 也必须同步调整。`disable_observability=true` 只关闭 OTLP 层，不关闭本地文件日志。
+
+如果某条 stream 只是“备份副本”，它不能绕开本地日志的归档窗口单独永久存活。超时后应停止 tailing、释放资源，并交回本地文件归档策略处理历史文件。
+
+## 5. 当前实现里已经收口的点
+这一节只写已经可以当作当前事实使用的内容。
+
+### 5.1 本地文件按天分片与 31 天窗口
+- KV runtime 已具备稳定的按天滚动与保留窗口。
+- bare 服务日志已经接到 shared supervisor 的按天分片与同口径清理。
+- ops-managed workload 日志已经接到 shared supervisor 的按天分片与同口径清理。
+- `test_runner` / `test_runner_ui` 这类 testbed 服务级日志已补齐按天分片与本地 31 天保留窗口。
+
+### 5.2 shared supervisor 已经统一到一个实现源
+- bare bootstrap 与 ops-managed workload 现在都复用 `selection_supervisor.py + log_shard.py` 这组实现。
+- `gen_bare_deploy_bash.py` 会把同一个 `log_shard.py` helper 下发到生成目录。
+- bare 启动脚本层保留的是稳定逻辑基名，真正的 stdio 重定向和实际分片写入都在共享 `selection_supervisor.py` 运行时里生效。
+
+### 5.3 Rust / Python 已经有三类明确对齐
+- 按天分片与 31 天清理
+- 日志目录派生规则
+- OTLP 基础字段与 Greptime header
+
+## 6. 当前还没有完全收口的点
+这一节只写未完全收口点，避免把“当前事实”和“目标态”混在一起。
+
+### 6.1 KV 目录边界还没有完全收口到单一 `share_path`
+- 预期 KV 最终收口为单一 `share_path`，统一承载 `mmap.file`、`shared.json` 和 side transfer metadata。
+- 当前 Rust 实现仍保留 `shared_memory_path` 与 `shared_file_path` 两条配置，并分别用于 `mmap.file` 与 `shared.json` / `peer metadata` 的就绪探测和发布。
+
+### 6.2 side worker stdio 仍未收口到统一按天分片
+- zero-contribution bootstrap 已经在启动前继承 owner 的 `large_file_paths`，因此 KV runtime logger 不再依赖 attach 后热切换文件路径。
+- 但 side worker stdio 当前仍然直接写 `side_worker_<worker_idx>.stdout.log` / `side_worker_<worker_idx>.stderr.log`，还没有补到统一的按天分片命名。
+
+### 6.3 side worker stdio 与历史 `smoke` 文件还没纳入这轮收口
+- side worker stdio 当前仍是 `side_worker_<worker_idx>.stdout.log` / `side_worker_<worker_idx>.stderr.log`。
+- `smoke.log`、`smoke_bare.log`、`smoke_workloads_bare.log` 一类历史命名仍然存在。
+
+### 6.4 testbed 只有服务级日志收口到了同类语义
+- `test_runner`、`test_runner_ui` 已改为“稳定逻辑基名 + 按天分片落盘”。
+- case 级 `run_dir/logs/**`、`summary.yaml`、`resolved_case.yaml`、`benchmark_result.json` 等仍按 run artifact 生命周期消费。
+- `history_lookback_days` 仍只是控制 UI 回看哪些 workdir；`gitops retention.max_age_days` 仍然清理 gitops run 目录，不是 testbed 服务日志文件的统一 TTL。
+
+### 6.5 OTLP 统一字段和统一状态机还没有全部收口
+- 当前导出链路仍以 `cluster_name`、`member_kind`、`role`、`member_id` 为主。
+- `log_service_kind`、`log_kind`、`process_role`、`instance_key`、`workload_kind`、`workload_name` 这组更细的 canonical 字段还没有完整进入导出链路。
+- Rust 通用链路已经把 `disabled`、`direct`、`proxy`、失败分支显式枚举出来；Python benchmark exporter 仍是直连特化路径，还没有进入同一套通用发送状态机。
+
+## 7. rs / py 模块对齐与防漂移
+稳定结论先说死：
+
+- 共享 log contract 以 Rust canonical 模块为准，Python 优先复用 Rust 已经导出的结果。
+- 当前已经能从代码直接看出三类对齐：按天分片与 31 天清理、日志目录派生、OTLP 基础字段与 header。
+- 当前还没有完全收口的是通用 OTLP 发送状态机。Rust 已经显式枚举发送分支，Python 侧 benchmark exporter 仍是直连特化路径。
+
+### 7.1 按天分片与本地保留窗口
+Rust `fluxon_rs/fluxon_util/src/log.rs`：
+
+```rust
+const LOG_RETENTION_DAYS: usize = 31;
+
+pub fn current_daily_sharded_log_path(base_path: &Path) -> anyhow::Result<PathBuf> {
+    daily_sharded_log_path(base_path, current_shard_date()?)
+}
+
+fn cleanup_old_daily_sharded_logs(base_path: &Path, retention_days: usize) -> anyhow::Result<()> {
+    let keep_since = current_shard_date()? - chrono::Days::new(retention_days.saturating_sub(1) as u64);
+    ...
+    if shard_date < keep_since {
+        fs::remove_file(&path)?;
+    }
+}
+
+impl DailyShardedFileWriter {
+    fn rotate_if_needed(&self, state: &mut DailyShardedFileWriterState) -> io::Result<()> {
+        let next_path = self.current_path()?;
+        cleanup_old_daily_sharded_logs(&self.base_path, self.retention_days)?;
+        let file = fs::OpenOptions::new().create(true).append(true).open(&next_path)?;
+        state.current_path = Some(next_path);
+        state.current_file = Some(file);
+        Ok(())
+    }
+}
+```
+
+Python `deployment/utils/log_shard.py`：
+
+```python
+DEFAULT_DAILY_LOG_RETENTION_DAYS = 31
+
+def daily_sharded_log_path(base_path: Path, *, now: Optional[datetime.datetime] = None) -> Path:
+    shard_date = _resolve_shard_date(ts)
+    return (base_path.parent / f"{stem}.{shard_date.isoformat()}.log").resolve()
+
+def cleanup_old_daily_sharded_logs(base_path: Path, *, retention_days: int = DEFAULT_DAILY_LOG_RETENTION_DAYS) -> None:
+    current_shard_date = _resolve_shard_date(datetime.datetime.now(datetime.timezone.utc))
+    keep_since = current_shard_date - datetime.timedelta(
+        days=max(int(retention_days) - 1, 0)
+    )
+```
+
+这两段现在对齐的是同一个显式 contract：逻辑基名保持不变，日期字段统一落在 `.<YYYY-MM-DD>.log`，默认本地窗口都是 31 天，而且过期删除都显式按日期分片判断。这里不要机械要求两边 helper 名称完全一样；对齐的是“按天分片 + 31 天窗口 + 同口径清理”这条 contract。
+
+### 7.2 KV 主日志是 Rust；Python 侧要分 bare 服务日志和 ops-managed workload 日志两层
+先把边界说死：KV runtime 主日志当前基本都是 Rust 在输出。`master`、`owner`、`external` 这些 KV 进程走的是 `fluxon_util::init_log(...)` 这条链。Python 一侧真正需要单独检查的，当前已经分成两层：
+
+- `deployconf -> gen_bare -> bare bootstrap` 这一层，负责 `ops_controller`、`ops_agent` 和其他 bare service 自身的 stdout/stderr。
+- `ops_agent` 进入 desired-runtime 管理之后，再去托管 workload；这一层的日志 contract 不再沿用 bare `${service_name}.log`，而是 `workload__<kind>__<name>.log`。
+
+先看 bare 这一层：
+
+Python `deployment/gen_bare_deploy_bash.py`：
+
+```python
+from log_shard import render_module_source as render_log_shard_module_source
+
+(outdir / LOG_SHARD_HELPER_FILENAME).write_text(
+    render_log_shard_module_source(),
+    encoding="utf-8",
+)
+```
+
+```python
+runtime_state_json = _bare_runtime_state_json(
+    workload_name=workload_name,
+    authority_name=...,
+    service_name=service_name,
+    log_path=f"${{HOSTWORKDIR}}/log/{service_name}.log",
+)
+
+LOG_DIR="$HOSTWORKDIR/log"
+LOGFILE="$LOG_DIR/${SERVICE}.log"
+...
+SUPERVISOR_PID=$( ... < /dev/null & echo "$!" )
+```
+
+Python `deployment/utils/selection_supervisor_codegen.py`：
+
+```python
+def _redirect_process_stdio_to_runtime_log(runtime_state: Optional[SelectionRuntimeState]) -> None:
+    base_log_path = _require_non_empty_str(runtime_state.log_path, "state.log_path")
+
+    def _router_loop() -> None:
+        _LOG_SHARD.relay_fd_to_daily_sharded_logs(
+            base_log_path=base_log_path,
+            read_fd=read_fd,
+            retention_days=_LOG_SHARD.DEFAULT_DAILY_LOG_RETENTION_DAYS,
+        )
+
+    os.dup2(write_fd, sys.stdout.fileno())
+    os.dup2(write_fd, sys.stderr.fileno())
+
+...
+
+_redirect_process_stdio_to_runtime_log(runtime_state)
+```
+
+再看 ops-managed workload 这一层：
+
+Rust `fluxon_rs/fluxon_ops/src/lib.rs`：
+
+```rust
+fn workload_log_filename(kind: WorkloadKind, name: &str) -> anyhow::Result<String> {
+    Ok(format!("workload__{}__{}.log", kind.as_str(), name))
+}
+
+let runtime_dir = workdir.join(OPS_SELECTION_SUPERVISOR_DIR_NAME);
+let log_dir = workdir.join(OPS_LOG_DIR_NAME);
+let log_path = self.log_dir.join(log_filename);
+```
+
+这组代码说明当前现状是：
+
+- bare bootstrap 与 ops-managed workload 确实已经复用了同一个 `selection_supervisor.py + log_shard.py` 实现源。
+- bare 服务日志与 ops-managed workload 日志也都已经真正接到这套滚动管理 helper 上。
+- 但两层当前并不是同一个 path contract：
+  - bare 服务日志保留的是 `${HOSTWORKDIR}/log/${service_name}.log`
+  - ops-managed workload 保留的是 `${WORKDIR}/log/workload__<workload_kind>__<workload_name>.log`
+
+### 7.3 OTLP 基础字段与 header 已经同名对齐
+Rust `fluxon_rs/fluxon_observability/src/greptime_otlp_log.rs`：
+
+```rust
+let kvs = vec![
+    KeyValue { key: KEY_CLUSTER_NAME.to_string(), value: Some(...) },
+    KeyValue { key: KEY_MEMBER_KIND.to_string(), value: Some(...) },
+    KeyValue { key: KEY_ROLE.to_string(), value: Some(...) },
+    KeyValue { key: KEY_MEMBER_ID.to_string(), value: Some(...) },
+];
+
+let mut reqb = self
+    .http
+    .post(&self.endpoint)
+    .header("X-Greptime-DB-Name", &self.db_name)
+    .header("X-Greptime-Log-Extract-Keys", GREPTIME_LOG_EXTRACT_KEYS_HEADER_VALUE);
+```
+
+Python `fluxon_test_stack/distributed_benchmark_node.py`：
+
+```python
+log_attrs: Dict[str, Any] = {
+    "fluxon_cluster_name": self._cfg.cluster_name,
+    "fluxon_member_kind": self._cfg.member_kind,
+    "fluxon_role": self._cfg.role,
+    "fluxon_member_id": self._cfg.member_id,
+}
+
+headers = {
+    "Content-Type": "application/x-protobuf",
+    "X-Greptime-DB-Name": self._cfg.db_name,
+    "X-Greptime-Log-Extract-Keys": ",".join(extract_keys),
+}
+```
+
+这两边已经对齐到同一个最小公共集合：`fluxon_cluster_name`、`fluxon_member_kind`、`fluxon_role`、`fluxon_member_id` 这组基础属性同名同义，Greptime header 也保持同一协议面。Python benchmark exporter 可以补 phase summary 字段，但不能改写这组基础字段的含义。
+
+### 7.4 发送状态机还没有完全收口
+Rust `fluxon_rs/fluxon_observability/src/greptime_otlp_log_orchestrator.rs`：
+
+```rust
+pub enum GreptimeOtlpLogAttemptResult<N> {
+    Disabled,
+    Sent { path: GreptimeOtlpLogSendPath, proxy_node: Option<N> },
+    SkippedNoProxy { detail: String },
+    ProxyFailed { proxy_node: N, detail: String },
+}
+```
+
+Python `fluxon_test_stack/distributed_benchmark_node.py`：
+
+```python
+with urllib.request.urlopen(req, timeout=GREPTIME_OTLP_LOG_TIMEOUT_SECONDS) as resp:
+    status = getattr(resp, "status", 200)
+    if int(status) < 200 or int(status) >= 300:
+        body_text = resp.read().decode("utf-8", errors="replace")
+        raise RuntimeError(f"greptime otlp http {status}: {body_text}")
+```
+
+这组对照反映的是当前边界：Rust 通用链路已经把 `disabled`、`direct`、`proxy`、失败分支显式枚举出来；Python 这里只是 benchmark phase summary 的直连特化路径，还没有进入同一套通用发送状态机。后续如果 Python 需要承担通用 service-plane 导出，应该复用 Rust 这组有限分支，而不是再发明一套平行状态模型。
+
+### 7.5 防止未来漂移
+只保留四条工程规则：
+
+1. 共享 contract 只保留一个真相源。目录派生、canonical 字段、发送状态、TTL 这类会跨语言消费的语义，优先由 Rust 定义，Python 复用导出结果或逐项镜像实现。
+2. 任何改动如果影响 canonical 文件名、OTLP 字段、Greptime header、发送分支或 retention，必须同一个 PR 同时更新 Rust 代码、Python 代码、设计文档和至少一层 contract test。
+3. Python 特化路径必须显式标出作用域。`test_runner` 服务日志和 benchmark phase summary 可以保留自己的实现，但不能反向成为公共 contract 的定义源。
+4. 多语言边界坚持一个概念一个名字。不要在 rs / py 两边分别引入近义字段、别名参数或平行配置面，否则文档、查询、清理和告警都会漂移。
diff --git a/fluxon_py/config.py b/fluxon_py/config.py
index 9b7b447..51e0d7d 100644
--- a/fluxon_py/config.py
+++ b/fluxon_py/config.py
@@ -110,6 +110,9 @@ def _yaml_template():
   cluster_name:                       # Cluster name (str)
   shared_memory_path:                 # Shared memory path (str)
   shared_file_path:                   # Shared file path for shared.json/logs/profiles (str)
+  large_file_paths:                   # Owner-mode large file roots (dict(optional))
+    log_root_path:                    # Log root path for owner/client large-file outputs (str)
+    cache_root_path:                  # Cache root path for owner/client large-file outputs (str)
   p2p_listen_port:                    # P2P QUIC listen port override (int(optional))
   redis_compat:                       # Enable Redis protocol shim (dict(optional))
     listen_addr:                      # TCP listen addr, e.g. "127.0.0.1:16379" (str)
@@ -584,6 +587,18 @@ def to_fluxon_kv_client_config_yaml_str(self) -> str:
 
             return yaml.safe_dump(cfg, sort_keys=False)
 
+        if "large_file_paths" not in spec:
+            raise ValueError("fluxonkv_spec.large_file_paths is required for owner mode")
+        large_file_paths = spec.get("large_file_paths")
+        if not isinstance(large_file_paths, dict):
+            raise ValueError("fluxonkv_spec.large_file_paths must be a mapping in owner mode")
+        for field_name in ("log_root_path", "cache_root_path"):
+            field_value = large_file_paths.get(field_name)
+            if not isinstance(field_value, str) or not field_value.strip():
+                raise ValueError(
+                    f"fluxonkv_spec.large_file_paths.{field_name} must be a non-empty string in owner mode"
+                )
+
         return yaml.safe_dump(cfg, sort_keys=False)
     
 
diff --git a/fluxon_py/tests/test_config.py b/fluxon_py/tests/test_config.py
index 379e3e0..2979d8e 100644
--- a/fluxon_py/tests/test_config.py
+++ b/fluxon_py/tests/test_config.py
@@ -47,6 +47,7 @@ def _build_checks(selected_test_id: Optional[str]) -> List[Tuple[str, Callable[[
         ("to_yaml_str_roundtrip", _run_test_to_yaml_str_roundtrip),
         ("fluxonkv_sub_cluster_config", test_fluxonkv_sub_cluster_config),
         ("fluxonkv_owner_requires_sub_cluster", test_fluxonkv_owner_requires_sub_cluster),
+        ("fluxonkv_owner_requires_large_file_paths", test_fluxonkv_owner_requires_large_file_paths),
         ("fluxonkv_p2p_relay_removed", test_fluxonkv_p2p_relay_removed),
         ("fluxon_client_config_yaml_shape", test_fluxon_client_config_yaml_shape),
         ("fluxonkv_protocol_field", test_fluxonkv_protocol_field),
@@ -270,6 +271,54 @@ def test_fluxonkv_owner_requires_sub_cluster():
         print(f"❌ FAIL: test_fluxonkv_owner_requires_sub_cluster - {e}")
 
 
+def test_fluxonkv_owner_requires_large_file_paths():
+    """Ensure owner mode requires explicit large_file_paths roots."""
+    try:
+        base = {
+            "instance_key": "test_instance",
+            "contribute_to_cluster_pool_size": {"dram": 16777216, "vram": {}},
+            "fluxonkv_spec": {
+                "etcd_addresses": ["localhost:2379"],
+                "cluster_name": "test_cluster",
+                "shared_memory_path": "/tmp/kvcache_shared_memory/test",
+                "shared_file_path": "/tmp/kvcache_shared_files/test",
+                "sub_cluster": "rack-a",
+            },
+        }
+
+        try:
+            FluxonKvClientConfig(copy.deepcopy(base)).to_fluxon_kv_client_config_yaml_str()
+            print("❌ FAIL: test_fluxonkv_owner_requires_large_file_paths - missing large_file_paths should be rejected")
+            return
+        except ValueError:
+            pass
+
+        invalid_blank = copy.deepcopy(base)
+        invalid_blank["fluxonkv_spec"]["large_file_paths"] = {
+            "log_root_path": "   ",
+            "cache_root_path": "/tmp/kvcache_large_cache/test",
+        }
+        try:
+            FluxonKvClientConfig(invalid_blank).to_fluxon_kv_client_config_yaml_str()
+            print("❌ FAIL: test_fluxonkv_owner_requires_large_file_paths - blank log_root_path should be rejected")
+            return
+        except ValueError:
+            pass
+
+        valid = copy.deepcopy(base)
+        valid["fluxonkv_spec"]["large_file_paths"] = {
+            "log_root_path": "/tmp/kvcache_large_logs/test",
+            "cache_root_path": "/tmp/kvcache_large_cache/test",
+        }
+        rendered = FluxonKvClientConfig(valid).to_fluxon_kv_client_config_yaml_str()
+        assert "large_file_paths:" in rendered
+        assert "log_root_path: /tmp/kvcache_large_logs/test" in rendered
+        assert "cache_root_path: /tmp/kvcache_large_cache/test" in rendered
+        print("✅ PASS: test_fluxonkv_owner_requires_large_file_paths")
+    except Exception as e:
+        print(f"❌ FAIL: test_fluxonkv_owner_requires_large_file_paths - {e}")
+
+
 def test_fluxonkv_p2p_relay_removed():
     """Ensure removed fluxonkv_spec.p2p_relay is rejected as an unknown key."""
     try:
diff --git a/fluxon_rs/Cargo.lock b/fluxon_rs/Cargo.lock
index 4ddcf9b..a4b0ecd 100644
--- a/fluxon_rs/Cargo.lock
+++ b/fluxon_rs/Cargo.lock
@@ -1320,6 +1320,7 @@ dependencies = [
  "anyhow",
  "askama",
  "base64 0.21.7",
+ "chrono",
  "clap",
  "etcd-client",
  "fluxon_cli",
@@ -1336,6 +1337,7 @@ dependencies = [
  "serde_json",
  "serde_yaml",
  "sha2",
+ "tempfile",
  "thiserror 1.0.69",
  "tokio",
  "tracing",
diff --git a/fluxon_rs/fluxon_fs/src/agent.rs b/fluxon_rs/fluxon_fs/src/agent.rs
index eca583e..03a3dd0 100644
--- a/fluxon_rs/fluxon_fs/src/agent.rs
+++ b/fluxon_rs/fluxon_fs/src/agent.rs
@@ -1407,20 +1407,20 @@ impl FluxonFsAgent {
             .get_self_info()
             .id
             .to_string();
-        let shared_file_path = if self.kv_framework.is_external_mode() {
+        let cache_root_base = if self.kv_framework.is_external_mode() {
             self.kv_framework
                 .external_client_api_view()
                 .external_client_api()
                 .inner()
-                .shared_file_path()
+                .cache_root_path()
         } else {
             self.kv_framework
                 .client_seg_pool_view()
                 .client_seg_pool()
-                .shared_file_path()
+                .cache_root_path()
                 .to_string()
         };
-        let cache_root = resolve_disk_cache_root(Path::new(&shared_file_path), &instance_key);
+        let cache_root = resolve_disk_cache_root(Path::new(&cache_root_base), &instance_key);
         let cache =
             RemoteDiskCacheManager::new(cache_root.clone(), disk_cache_max_bytes_from_env())
                 .map_err(|err| {
diff --git a/fluxon_rs/fluxon_kv/src/client_seg_pool/mod.rs b/fluxon_rs/fluxon_kv/src/client_seg_pool/mod.rs
index 7902beb..fb54c06 100644
--- a/fluxon_rs/fluxon_kv/src/client_seg_pool/mod.rs
+++ b/fluxon_rs/fluxon_kv/src/client_seg_pool/mod.rs
@@ -46,6 +46,8 @@ pub struct ClientSegPoolNewArg {
     pub contribute_size: ContributeToClusterPoolSize,
     pub shared_memory_path: String,
     pub shared_file_path: String,
+    pub log_root_path: String,
+    pub cache_root_path: String,
     pub cluster_name: String,
     pub etcd_addresses: Vec<String>,
     pub attach_existing_meta: Option<SharedJsonMeta>,
@@ -64,6 +66,7 @@ pub struct SharedJsonMeta {
     pub etcd_addresses: Vec<String>,
     pub shared_memory_path: String,
     pub shared_file_path: String,
+    pub large_file_paths: crate::config::LargeFilePaths,
     pub protocol_version: String,
     pub write_ts: Option<i64>,
 }
@@ -203,6 +206,10 @@ pub struct ClientSegPoolInner {
     shared_memory_path: String,
     /// Directory path for regular files (shared.json, side-transfer metadata).
     shared_file_path: String,
+    /// Base directory for runtime logs and profile outputs.
+    log_root_path: String,
+    /// Base directory for large cache files.
+    cache_root_path: String,
     side_transfer_worker: bool,
     attach_owner_ref: Option<ShareGroupOwnerRef>,
 
@@ -262,6 +269,8 @@ impl ClientSegPool {
         let contribute_size = arg.contribute_size;
         let shared_memory_path = arg.shared_memory_path;
         let shared_file_path = arg.shared_file_path;
+        let log_root_path = arg.log_root_path;
+        let cache_root_path = arg.cache_root_path;
         let cluster_name = arg.cluster_name;
         let etcd_addresses = arg.etcd_addresses;
         let attach_existing_meta = arg.attach_existing_meta;
@@ -356,6 +365,8 @@ impl ClientSegPool {
                 view: std::sync::OnceLock::new(),
                 shared_memory_path: shared_memory_path.clone(),
                 shared_file_path: shared_file_path.clone(),
+                log_root_path: log_root_path.clone(),
+                cache_root_path: cache_root_path.clone(),
                 side_transfer_worker,
                 attach_owner_ref,
                 cluster_name: cluster_name.clone(),
@@ -372,6 +383,8 @@ impl ClientSegPool {
                 view: std::sync::OnceLock::new(),
                 shared_memory_path: shared_memory_path.clone(),
                 shared_file_path: shared_file_path.clone(),
+                log_root_path: log_root_path.clone(),
+                cache_root_path: cache_root_path.clone(),
                 side_transfer_worker,
                 attach_owner_ref,
                 cluster_name: cluster_name.clone(),
@@ -535,6 +548,8 @@ impl ClientSegPool {
             view: std::sync::OnceLock::new(),
             shared_memory_path: base_path.to_string(),
             shared_file_path: shared_file_path.clone(),
+            log_root_path,
+            cache_root_path,
             side_transfer_worker,
             attach_owner_ref,
             cluster_name,
@@ -553,6 +568,10 @@ impl ClientSegPool {
         &self.inner().shared_file_path
     }
 
+    pub fn cache_root_path(&self) -> &str {
+        &self.inner().cache_root_path
+    }
+
     fn transfer_rpc_fast_path_eligible_members(&self) -> Vec<ClusterMember> {
         let inner = self.inner();
         let self_info = inner.view().cluster_manager().get_self_info();
@@ -1161,6 +1180,10 @@ impl ClientSegPool {
             etcd_addresses: inner.etcd_addresses.clone(),
             shared_memory_path: shared_memory_canonical,
             shared_file_path: shared_file_canonical,
+            large_file_paths: crate::config::LargeFilePaths {
+                log_root_path: inner.log_root_path.clone(),
+                cache_root_path: inner.cache_root_path.clone(),
+            },
 
             protocol_version,
 
diff --git a/fluxon_rs/fluxon_kv/src/config.rs b/fluxon_rs/fluxon_kv/src/config.rs
index 218ef69..2df094c 100644
--- a/fluxon_rs/fluxon_kv/src/config.rs
+++ b/fluxon_rs/fluxon_kv/src/config.rs
@@ -379,6 +379,17 @@ fn cluster_scoped_shared_path(root: &str, cluster_name: &str) -> KvResult<String
     Ok(scoped.to_string_lossy().into_owned())
 }
 
+fn verify_non_empty_root_path(root: &str, field_name: &str) -> KvResult<String> {
+    let trimmed = root.trim();
+    if trimmed.is_empty() {
+        return Err(ConfigError::InvalidClientConfig {
+            detail: format!("{field_name} cannot be empty"),
+        }
+        .into_kverror());
+    }
+    Ok(trimmed.to_string())
+}
+
 fn resolve_compiled_rdma_transfer_engine() -> KvResult<TransferEngineType> {
     Ok(TransferEngineType::Closed)
 }
@@ -552,6 +563,8 @@ pub struct FluxonKvSpecYaml {
     pub shared_memory_path: String,
     pub shared_file_path: String,
     #[serde(skip_serializing_if = "Option::is_none")]
+    pub large_file_paths: Option<LargeFilePathsYaml>,
+    #[serde(skip_serializing_if = "Option::is_none")]
     pub p2p_listen_port: Option<u16>,
     #[serde(skip_serializing_if = "Option::is_none")]
     pub redis_compat: Option<YamlNullable<RedisCompatConfigYaml>>,
@@ -559,6 +572,13 @@ pub struct FluxonKvSpecYaml {
     pub sub_cluster: Option<YamlNullable<String>>,
 }
 
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
+#[serde(deny_unknown_fields)]
+pub struct LargeFilePathsYaml {
+    pub log_root_path: String,
+    pub cache_root_path: String,
+}
+
 #[derive(Debug, Clone, Serialize, Deserialize)]
 #[serde(deny_unknown_fields)]
 pub struct RedisCompatConfigYaml {
@@ -608,6 +628,12 @@ pub struct FluxonKvSpec {
     pub sub_cluster: Option<String>,
 }
 
+#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
+pub struct LargeFilePaths {
+    pub log_root_path: String,
+    pub cache_root_path: String,
+}
+
 /// KV client backend types supported by the system
 #[derive(Debug, Clone, PartialEq)]
 pub enum KvClientType {
@@ -627,6 +653,7 @@ pub struct ClientConfig {
     pub fluxonkv_spec: FluxonKvSpec,
     pub shared_memory_path: String, // Mandatory shared memory path
     pub shared_file_path: String,   // Mandatory shared file path
+    pub large_file_paths: LargeFilePaths, // Mandatory large-file roots for logs and caches
     pub test_spec_config: TestSpecConfig,
 }
 
@@ -893,7 +920,7 @@ impl ClientConfigYaml {
             .into_kverror());
         }
 
-        // External (zero-contribution) mode forbids additional knobs to keep the schema minimal.
+        // External (zero-contribution) mode forbids additional owner-derived knobs to keep the schema minimal.
         if is_external {
             if self.fluxonkv_spec.redis_compat.is_some() {
                 return Err(ConfigError::InvalidClientConfig {
@@ -914,6 +941,12 @@ impl ClientConfigYaml {
                 }
                 .into_kverror());
             }
+            if self.fluxonkv_spec.large_file_paths.is_some() {
+                return Err(ConfigError::InvalidClientConfig {
+                    detail: "fluxonkv_spec.large_file_paths is forbidden in zero-contribution mode (it is inherited from owner shared.json)".to_string(),
+                }
+                .into_kverror());
+            }
         }
 
         // Preserve historical behavior for configs that omit `protocol`, but allow
@@ -1053,6 +1086,32 @@ impl ClientConfigYaml {
             }
             .into_kverror());
         }
+        let large_file_paths = if is_external {
+            LargeFilePaths {
+                log_root_path: String::new(),
+                cache_root_path: String::new(),
+            }
+        } else {
+            let Some(large_file_paths_yaml) = self.fluxonkv_spec.large_file_paths.as_ref() else {
+                return Err(ConfigError::InvalidClientConfig {
+                    detail: "fluxonkv_spec.large_file_paths is required for owner mode"
+                        .to_string(),
+                }
+                .into_kverror());
+            };
+            let log_root_path = verify_non_empty_root_path(
+                &large_file_paths_yaml.log_root_path,
+                "large_file_paths.log_root_path",
+            )?;
+            let cache_root_path = verify_non_empty_root_path(
+                &large_file_paths_yaml.cache_root_path,
+                "large_file_paths.cache_root_path",
+            )?;
+            LargeFilePaths {
+                log_root_path,
+                cache_root_path,
+            }
+        };
 
         let shared_memory_path = cluster_scoped_shared_path(
             &self.fluxonkv_spec.shared_memory_path,
@@ -1062,7 +1121,6 @@ impl ClientConfigYaml {
             &self.fluxonkv_spec.shared_file_path,
             &fluxonkv_spec.cluster_name,
         )?;
-
         let redis_compat_listen_addr = match self.fluxonkv_spec.redis_compat.as_ref() {
             None | Some(YamlNullable::Null) => None,
             Some(YamlNullable::Value(rc)) => {
@@ -1094,6 +1152,7 @@ impl ClientConfigYaml {
             fluxonkv_spec,
             shared_memory_path,
             shared_file_path,
+            large_file_paths,
             test_spec_config,
         })
     }
@@ -1434,6 +1493,9 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
+  large_file_paths:
+    log_root_path: /tmp/test_owner_logs
+    cache_root_path: /tmp/test_owner_cache
   sub_cluster: rack-a
 test_spec_config:
   disable_observability: true
@@ -1480,6 +1542,9 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
+  large_file_paths:
+    log_root_path: /tmp/test_owner_logs
+    cache_root_path: /tmp/test_owner_cache
   sub_cluster: rack-a
 "#,
         )
@@ -1492,6 +1557,45 @@ fluxonkv_spec:
         assert!(verified.fluxonkv_spec.enable_transfer_rpc_fast_path);
     }
 
+    #[test]
+    fn client_config_zero_contribution_allows_owner_bootstrapped_large_file_paths() {
+        let cfg = ClientConfigYaml::from_str(
+            r#"
+instance_key: test_external
+fluxonkv_spec:
+  cluster_name: test_cluster
+  shared_memory_path: /tmp/test_external
+  shared_file_path: /tmp/test_external_files
+"#,
+        )
+        .unwrap();
+        let verified = cfg.verify().unwrap();
+        assert_eq!(verified.large_file_paths.log_root_path, "");
+        assert_eq!(verified.large_file_paths.cache_root_path, "");
+        assert_eq!(verified.fluxonkv_spec.etcd_addresses, Vec::<String>::new());
+        assert_eq!(verified.fluxonkv_spec.sub_cluster, None);
+    }
+
+    #[test]
+    fn client_config_zero_contribution_rejects_large_file_paths_in_yaml() {
+        let cfg = ClientConfigYaml::from_str(
+            r#"
+instance_key: test_external
+fluxonkv_spec:
+  cluster_name: test_cluster
+  shared_memory_path: /tmp/test_external
+  shared_file_path: /tmp/test_external_files
+  large_file_paths:
+    log_root_path: /tmp/test_external_logs
+    cache_root_path: /tmp/test_external_cache
+"#,
+        )
+        .unwrap();
+        let err = cfg.verify().unwrap_err();
+        let text = format!("{err}");
+        assert!(text.contains("fluxonkv_spec.large_file_paths is forbidden in zero-contribution mode"));
+    }
+
     #[test]
     fn client_test_spec_config_accepts_explicit_rdma_device_names() {
         let cfg = ClientConfigYaml::from_str(
@@ -1505,6 +1609,9 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
+  large_file_paths:
+    log_root_path: /tmp/test_owner_logs
+    cache_root_path: /tmp/test_owner_cache
   sub_cluster: rack-a
 test_spec_config:
   transport_mode: transfer_with_rpc
@@ -1558,6 +1665,9 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
+  large_file_paths:
+    log_root_path: /tmp/test_owner_logs
+    cache_root_path: /tmp/test_owner_cache
   sub_cluster: rack-a
 test_spec_config:
   rdma_device_names: ["mlx5_0"]
@@ -1593,6 +1703,9 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
+  large_file_paths:
+    log_root_path: /tmp/test_owner_logs
+    cache_root_path: /tmp/test_owner_cache
   sub_cluster: rack-a
 test_spec_config:
   transport_mode: transfer_with_rpc
@@ -1624,6 +1737,9 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
+  large_file_paths:
+    log_root_path: /tmp/test_owner_logs
+    cache_root_path: /tmp/test_owner_cache
   sub_cluster: rack-a
 test_spec_config:
   require_transfer_rpc_fast_path_ready_timeout_seconds: 45
@@ -1649,6 +1765,9 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
+  large_file_paths:
+    log_root_path: /tmp/test_owner_logs
+    cache_root_path: /tmp/test_owner_cache
   sub_cluster: rack-a
 test_spec_config:
   tcp_thread_control_lane_count: 0
@@ -1675,6 +1794,9 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
+  large_file_paths:
+    log_root_path: /tmp/test_owner_logs
+    cache_root_path: /tmp/test_owner_cache
   sub_cluster: rack-a
 test_spec_config:
   transport_mode: transfer_with_rpc
@@ -1706,6 +1828,9 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
+  large_file_paths:
+    log_root_path: /tmp/test_owner_logs
+    cache_root_path: /tmp/test_owner_cache
   sub_cluster: rack-a
 test_spec_config:
   transport_mode: transfer_with_rpc
@@ -1730,6 +1855,9 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
+  large_file_paths:
+    log_root_path: /tmp/test_owner_logs
+    cache_root_path: /tmp/test_owner_cache
   sub_cluster: rack-a
 test_spec_config:
   rdma_device_names: ["mlx5_0"]
@@ -1784,6 +1912,9 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_side_worker
   shared_file_path: /tmp/test_side_worker_files
+  large_file_paths:
+    log_root_path: /tmp/test_side_worker_logs
+    cache_root_path: /tmp/test_side_worker_cache
   p2p_listen_port: 18081
 test_spec_config:
   enable_side_transfer: true
@@ -1823,6 +1954,9 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_side_worker
   shared_file_path: /tmp/test_side_worker_files
+  large_file_paths:
+    log_root_path: /tmp/test_side_worker_logs
+    cache_root_path: /tmp/test_side_worker_cache
 test_spec_config:
   enable_side_transfer: true
   side_transfer_role: worker
@@ -1854,6 +1988,9 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_side_worker
   shared_file_path: /tmp/test_side_worker_files
+  large_file_paths:
+    log_root_path: /tmp/test_side_worker_logs
+    cache_root_path: /tmp/test_side_worker_cache
 test_spec_config:
   enable_side_transfer: true
   side_transfer_role: worker
@@ -1883,6 +2020,9 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
+  large_file_paths:
+    log_root_path: /tmp/test_owner_logs
+    cache_root_path: /tmp/test_owner_cache
   p2p_listen_port: 18081
   sub_cluster: rack-a
 test_spec_config:
@@ -1915,6 +2055,9 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
+  large_file_paths:
+    log_root_path: /tmp/test_owner_logs
+    cache_root_path: /tmp/test_owner_cache
   sub_cluster: rack-a
 "#,
         )
@@ -1940,6 +2083,9 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
+  large_file_paths:
+    log_root_path: /tmp/test_owner_logs
+    cache_root_path: /tmp/test_owner_cache
   sub_cluster: rack-a
 test_spec_config:
   transport_mode: transfer_with_rpc
diff --git a/fluxon_rs/fluxon_kv/src/external_client_api/external_client_test.rs b/fluxon_rs/fluxon_kv/src/external_client_api/external_client_test.rs
index f811424..6a36ca7 100644
--- a/fluxon_rs/fluxon_kv/src/external_client_api/external_client_test.rs
+++ b/fluxon_rs/fluxon_kv/src/external_client_api/external_client_test.rs
@@ -2,8 +2,8 @@ use std::collections::HashMap;
 
 use crate::cluster_manager::NodeID;
 use crate::config::{
-    ClientConfig, ContributeToClusterPoolSize, FluxonKvSpec, MasterConfig, MonitoringConfig,
-    ProtocolConfig, ProtocolType, TestSpecConfig, TransferEngineType,
+    ClientConfig, ContributeToClusterPoolSize, FluxonKvSpec, LargeFilePaths, MasterConfig,
+    MonitoringConfig, ProtocolConfig, ProtocolType, TestSpecConfig, TransferEngineType,
 };
 use crate::master_kv_router::MasterKvRouterView;
 use crate::{ConfigArg, run_client, run_master};
@@ -82,6 +82,10 @@ fn new_client_config(
         },
         shared_memory_path: shm_path.to_string(),
         shared_file_path: format!("{}_files", shm_path),
+        large_file_paths: LargeFilePaths {
+            log_root_path: format!("{}_logs", shm_path),
+            cache_root_path: format!("{}_cache", shm_path),
+        },
         test_spec_config: TestSpecConfig::default(),
     }
 }
@@ -124,6 +128,10 @@ fn new_zero_contribution_client_config(
         },
         shared_memory_path: shm_path.to_string(),
         shared_file_path: format!("{}_files", shm_path),
+        large_file_paths: LargeFilePaths {
+            log_root_path: String::new(),
+            cache_root_path: String::new(),
+        },
         test_spec_config: TestSpecConfig::default(),
     }
 }
diff --git a/fluxon_rs/fluxon_kv/src/external_client_api/mod.rs b/fluxon_rs/fluxon_kv/src/external_client_api/mod.rs
index f2634be..0758ab5 100644
--- a/fluxon_rs/fluxon_kv/src/external_client_api/mod.rs
+++ b/fluxon_rs/fluxon_kv/src/external_client_api/mod.rs
@@ -253,6 +253,7 @@ define_module!(
 pub struct ExternalClientApiNewArg {
     pub shared_memory_path: String,
     pub shared_file_path: String,
+    pub cache_root_path: String,
     pub expected_cluster_name: String,
     pub expected_protocol_version: String,
     pub enable_side_transfer: bool,
@@ -312,6 +313,7 @@ pub struct ExternalInner {
     expected_protocol_version: String,
     external_shared_memory_path: String,
     external_shared_file_path: String,
+    external_cache_root_path: String,
     _enable_side_transfer: bool,
     short_circuit_put_payload_path: bool,
     side_rr_next: AtomicUsize,
@@ -363,6 +365,7 @@ impl ExternalClientApi {
             expected_protocol_version: arg.expected_protocol_version,
             external_shared_memory_path: arg.shared_memory_path,
             external_shared_file_path: arg.shared_file_path,
+            external_cache_root_path: arg.cache_root_path,
             _enable_side_transfer: arg.enable_side_transfer,
             short_circuit_put_payload_path: arg.short_circuit_put_payload_path,
             side_rr_next: AtomicUsize::new(0),
@@ -1237,6 +1240,10 @@ impl ExternalInner {
         self.external_shared_file_path.clone()
     }
 
+    pub fn cache_root_path(&self) -> String {
+        self.external_cache_root_path.clone()
+    }
+
     fn should_fallback_side_p2p_error(err: &crate::p2p::P2PError) -> bool {
         matches!(
             err,
diff --git a/fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs b/fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs
index 355ca6e..1b5754d 100644
--- a/fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs
+++ b/fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs
@@ -147,6 +147,10 @@ fn new_client_config_with_cluster_and_dram(
         },
         shared_memory_path,
         shared_file_path,
+        large_file_paths: crate::config::LargeFilePaths {
+            log_root_path: format!("{}/large_logs/{}", base, instance_key),
+            cache_root_path: format!("{}/large_cache/{}", base, instance_key),
+        },
         test_spec_config: TestSpecConfig::default(),
     };
     println!("fluxonkv core created client config for test: {:?}", conf);
diff --git a/fluxon_rs/fluxon_kv/src/lib.rs b/fluxon_rs/fluxon_kv/src/lib.rs
index b46fd85..96e9b28 100644
--- a/fluxon_rs/fluxon_kv/src/lib.rs
+++ b/fluxon_rs/fluxon_kv/src/lib.rs
@@ -105,6 +105,13 @@ use std::sync::Arc;
 use std::time::{Duration, Instant};
 use tracing::{info, warn};
 
+struct ExternalBootstrapBundle {
+    meta: SharedJsonMeta,
+    shared_memory_path: String,
+    shared_file_path: String,
+    etcd_endpoints: Vec<String>,
+}
+
 fn cluster_manager_rdma_control_init_from_transfer_config(
     _transfer_engine: TransferEngineType,
     _protocol: &ProtocolConfig,
@@ -585,7 +592,7 @@ fn tcp_thread_transport_tuning_from_test_spec_config(
 }
 
 pub async fn load_client_config(config_arg: ConfigArg<ClientConfig>) -> KvResult<ClientConfig> {
-    match config_arg {
+    let config = match config_arg {
         ConfigArg::None => {
             // Try to find default config file
             match find_default_config_file() {
@@ -594,13 +601,13 @@ pub async fn load_client_config(config_arg: ConfigArg<ClientConfig>) -> KvResult
                     let config_yaml = ClientConfigYaml::from_file(&path)?;
                     let config = config_yaml.verify()?;
                     println!("Client configuration loaded and validated successfully");
-                    Ok(config)
+                    config
                 }
                 None => Err(ConfigError::FileReadError {
                     detail: "No config file found. Please provide a config file with -f option"
                         .to_string(),
                 }
-                .into_kverror()),
+                .into_kverror())?,
             }
         }
         ConfigArg::File(config_path) => {
@@ -608,13 +615,15 @@ pub async fn load_client_config(config_arg: ConfigArg<ClientConfig>) -> KvResult
             let config_yaml = ClientConfigYaml::from_file(&config_path)?;
             let config = config_yaml.verify()?;
             println!("Client configuration loaded and validated successfully");
-            Ok(config)
+            config
         }
         ConfigArg::Config(config) => {
             println!("Using provided client configuration");
-            Ok(config)
+            config
         }
-    }
+    };
+
+    bootstrap_zero_contribution_client_config(config).await
 }
 
 pub async fn load_master_config(config_arg: ConfigArg<MasterConfig>) -> KvResult<MasterConfig> {
@@ -785,6 +794,7 @@ fn build_side_transfer_worker_config(
         },
         shared_memory_path: owner_config.shared_memory_path.clone(),
         shared_file_path: owner_config.shared_file_path.clone(),
+        large_file_paths: owner_config.large_file_paths.clone(),
         test_spec_config,
     })
 }
@@ -829,6 +839,7 @@ fn build_side_transfer_worker_config_yaml(
             cluster_name: side_config.cluster_name,
             shared_memory_path: side_config.shared_memory_path,
             shared_file_path: side_config.shared_file_path,
+            large_file_paths: None,
             p2p_listen_port: side_config.fluxonkv_spec.p2p_listen_port,
             redis_compat: None,
             sub_cluster: None,
@@ -838,7 +849,7 @@ fn build_side_transfer_worker_config_yaml(
 }
 
 fn side_transfer_runtime_dir(owner_config: &ClientConfig) -> PathBuf {
-    Path::new(&owner_config.shared_file_path)
+    Path::new(&owner_config.large_file_paths.log_root_path)
         .join(format!("{}_cluster_kv_logs", owner_config.cluster_name))
         .join("side_transfer_runtime")
         .join(&owner_config.instance_key)
@@ -1569,6 +1580,265 @@ fn merge_startup_member_metadata(
     Ok(())
 }
 
+/// Finalizes a loaded `ClientConfig` for clients that contribute no memory to the pool.
+/// A client contributing DRAM or any VRAM gets its config back unchanged; a zero-contribution
+/// client waits for the owner's shared bundle and inherits the owner's etcd settings,
+/// sub-cluster, shared paths and large-file paths.
+async fn bootstrap_zero_contribution_client_config(config: ClientConfig) -> KvResult<ClientConfig> {
+    // Zero contribution means `dram == 0` and every `vram` entry is 0 (an empty map counts).
+    let pool = &config.contribute_to_cluster_pool_size;
+    if pool.dram != 0 || pool.vram.values().any(|&size| size != 0) {
+        return Ok(config);
+    }
+
+    // Failures from the wait are propagated to the caller with `?`.
+    let owner = wait_for_external_bootstrap_bundle(&config).await?;
+    let mut inherited = config;
+    inherited.shared_memory_path = owner.shared_memory_path;
+    inherited.shared_file_path = owner.shared_file_path;
+    inherited.etcd_addresses_raw = owner.meta.etcd_addresses.clone();
+    inherited.fluxonkv_spec.etcd_addresses = owner.etcd_endpoints;
+    inherited.fluxonkv_spec.sub_cluster = owner.meta.sub_cluster.clone();
+    inherited.large_file_paths = owner.meta.large_file_paths;
+    Ok(inherited)
+}
+
+/// Polls the owner's shared bundle until every validation check passes, then returns it.
+///
+/// The bundle is `shared.json` under `config.shared_file_path` plus `mmap.file` under
+/// `config.shared_memory_path`. It is accepted only when `shared.json` parses as
+/// `SharedJsonMeta`, its `protocol_version` equals the local build commit id, its
+/// `cluster_name` equals `config.cluster_name`, its shared paths canonicalize to the same
+/// locations as the configured ones, and `etcd_addresses` is non-empty and normalizes.
+///
+/// Every failed check is treated as "not ready yet": the loop sleeps 200 ms and retries,
+/// logging at most once per 25 ticks. There is no timeout and no error path, so the
+/// returned `KvResult` is always `Ok` once the loop exits.
+///
+/// # Panics
+/// Panics if `get_current_git_commitid()` fails, because its result is unwrapped.
+async fn wait_for_external_bootstrap_bundle(
+    config: &ClientConfig,
+) -> KvResult<ExternalBootstrapBundle> {
+    let build_version = fluxon_util::git_version_build_record::get_current_git_commitid().unwrap();
+    let shared_memory_dir = Path::new(&config.shared_memory_path);
+    let shared_file_dir = Path::new(&config.shared_file_path);
+    let shared_json_path = shared_file_dir.join("shared.json");
+    let mmap_file_path = shared_memory_dir.join("mmap.file");
+
+    // One tick is one 200 ms sleep, so `waited_ticks / 5` is the elapsed wait in seconds.
+    let mut waited_ticks: u64 = 0;
+    loop {
+        // Both bundle files must exist before anything is read.
+        if !shared_json_path.exists() || !mmap_file_path.exists() {
+            if external_bootstrap_poll_tick(&mut waited_ticks).await {
+                info!(
+                    "Waiting owner shared bundle to be ready... ({}s), shm_dir={} file_dir={} (shared.json={}, mmap.file={})",
+                    waited_ticks / 5,
+                    shared_memory_dir.to_string_lossy(),
+                    shared_file_dir.to_string_lossy(),
+                    shared_json_path.exists(),
+                    mmap_file_path.exists()
+                );
+            }
+            continue;
+        }
+
+        let shared_json_buf = match std::fs::read_to_string(&shared_json_path) {
+            Ok(v) => v,
+            Err(e) => {
+                if external_bootstrap_poll_tick(&mut waited_ticks).await {
+                    warn!(
+                        "Waiting owner shared.json readable... ({}s), path={}, err={}",
+                        waited_ticks / 5,
+                        shared_json_path.to_string_lossy(),
+                        e
+                    );
+                }
+                continue;
+            }
+        };
+
+        let meta: crate::SharedJsonMeta = match serde_json::from_str(&shared_json_buf) {
+            Ok(v) => v,
+            Err(e) => {
+                if external_bootstrap_poll_tick(&mut waited_ticks).await {
+                    warn!(
+                        "Waiting owner shared.json schema ready... ({}s), path={}, err={}",
+                        waited_ticks / 5,
+                        shared_json_path.to_string_lossy(),
+                        e
+                    );
+                }
+                continue;
+            }
+        };
+
+        if meta.protocol_version != build_version {
+            if external_bootstrap_poll_tick(&mut waited_ticks).await {
+                warn!(
+                    "Waiting protocol_version match... ({}s), shm_dir='{}' file_dir='{}', shared='{}', local='{}'",
+                    waited_ticks / 5,
+                    shared_memory_dir.to_string_lossy(),
+                    shared_file_dir.to_string_lossy(),
+                    meta.protocol_version,
+                    build_version
+                );
+            }
+            continue;
+        }
+
+        if meta.cluster_name != config.cluster_name {
+            if external_bootstrap_poll_tick(&mut waited_ticks).await {
+                warn!(
+                    "Waiting cluster_name match... ({}s), shm_dir='{}' file_dir='{}', config='{}', shared.json='{}'",
+                    waited_ticks / 5,
+                    shared_memory_dir.to_string_lossy(),
+                    shared_file_dir.to_string_lossy(),
+                    config.cluster_name,
+                    meta.cluster_name
+                );
+            }
+            continue;
+        }
+
+        // Compare canonical forms of the configured and advertised directories.
+        let shared_memory_path_canonical = match std::fs::canonicalize(&config.shared_memory_path) {
+            Ok(v) => v.to_string_lossy().into_owned(),
+            Err(e) => {
+                if external_bootstrap_poll_tick(&mut waited_ticks).await {
+                    warn!(
+                        "Waiting shared_memory_path canonicalizable... ({}s), shm_dir='{}', path='{}', err={}",
+                        waited_ticks / 5,
+                        shared_memory_dir.to_string_lossy(),
+                        config.shared_memory_path,
+                        e
+                    );
+                }
+                continue;
+            }
+        };
+
+        let meta_shm_canonical = match std::fs::canonicalize(&meta.shared_memory_path) {
+            Ok(v) => v.to_string_lossy().into_owned(),
+            Err(e) => {
+                if external_bootstrap_poll_tick(&mut waited_ticks).await {
+                    warn!(
+                        "Waiting shared.json shared_memory_path canonicalizable... ({}s), shm_dir='{}', path='{}', err={}",
+                        waited_ticks / 5,
+                        shared_memory_dir.to_string_lossy(),
+                        meta.shared_memory_path,
+                        e
+                    );
+                }
+                continue;
+            }
+        };
+
+        let shared_file_path_canonical = match std::fs::canonicalize(&config.shared_file_path) {
+            Ok(v) => v.to_string_lossy().into_owned(),
+            Err(e) => {
+                if external_bootstrap_poll_tick(&mut waited_ticks).await {
+                    warn!(
+                        "Waiting shared_file_path canonicalizable... ({}s), file_dir='{}', path='{}', err={}",
+                        waited_ticks / 5,
+                        shared_file_dir.to_string_lossy(),
+                        config.shared_file_path,
+                        e
+                    );
+                }
+                continue;
+            }
+        };
+        let meta_file_canonical = match std::fs::canonicalize(&meta.shared_file_path) {
+            Ok(v) => v.to_string_lossy().into_owned(),
+            Err(e) => {
+                if external_bootstrap_poll_tick(&mut waited_ticks).await {
+                    warn!(
+                        "Waiting shared.json shared_file_path canonicalizable... ({}s), file_dir='{}', path='{}', err={}",
+                        waited_ticks / 5,
+                        shared_file_dir.to_string_lossy(),
+                        meta.shared_file_path,
+                        e
+                    );
+                }
+                continue;
+            }
+        };
+
+        if meta_shm_canonical != shared_memory_path_canonical {
+            if external_bootstrap_poll_tick(&mut waited_ticks).await {
+                warn!(
+                    "Waiting shared_memory_path match... ({}s), shm_dir='{}', config='{}', shared.json='{}'",
+                    waited_ticks / 5,
+                    shared_memory_dir.to_string_lossy(),
+                    shared_memory_path_canonical,
+                    meta_shm_canonical
+                );
+            }
+            continue;
+        }
+        if meta_file_canonical != shared_file_path_canonical {
+            if external_bootstrap_poll_tick(&mut waited_ticks).await {
+                warn!(
+                    "Waiting shared_file_path match... ({}s), file_dir='{}', config='{}', shared.json='{}'",
+                    waited_ticks / 5,
+                    shared_file_dir.to_string_lossy(),
+                    shared_file_path_canonical,
+                    meta_file_canonical
+                );
+            }
+            continue;
+        }
+
+        if meta.etcd_addresses.is_empty() {
+            if external_bootstrap_poll_tick(&mut waited_ticks).await {
+                warn!(
+                    "Waiting shared.json etcd_addresses non-empty... ({}s), shm_dir='{}' file_dir='{}', shared_memory_path='{}'",
+                    waited_ticks / 5,
+                    shared_memory_dir.to_string_lossy(),
+                    shared_file_dir.to_string_lossy(),
+                    meta_shm_canonical
+                );
+            }
+            continue;
+        }
+
+        let etcd_endpoints = match normalize_etcd_addresses(&meta.etcd_addresses) {
+            Ok(v) => v,
+            Err(e) => {
+                if external_bootstrap_poll_tick(&mut waited_ticks).await {
+                    warn!(
+                        "Waiting shared.json etcd_addresses valid... ({}s), shm_dir='{}' file_dir='{}', raw={:?}, err={}",
+                        waited_ticks / 5,
+                        shared_memory_dir.to_string_lossy(),
+                        shared_file_dir.to_string_lossy(),
+                        meta.etcd_addresses,
+                        e
+                    );
+                }
+                continue;
+            }
+        };
+
+        // All checks passed: return the metadata, canonical paths and normalized endpoints.
+        return Ok(ExternalBootstrapBundle {
+            meta,
+            shared_memory_path: meta_shm_canonical,
+            shared_file_path: meta_file_canonical,
+            etcd_endpoints,
+        });
+    }
+}
+
+/// Sleeps one 200 ms poll interval, increments `waited_ticks`, and returns `true` on every
+/// 25th tick so the caller can rate-limit its "still waiting" log line.
+async fn external_bootstrap_poll_tick(waited_ticks: &mut u64) -> bool {
+    limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
+    *waited_ticks += 1;
+    *waited_ticks % 25 == 0
+}
+
 async fn run_client_impl(
     config_arg: ConfigArg<ClientConfig>,
     test_overrides: Option<ClientRunTestOverrides>,
@@ -1598,9 +1868,8 @@ async fn run_client_impl(
     let build_version = fluxon_util::git_version_build_record::get_current_git_commitid().unwrap();
     let source_sha256 = fluxon_util::build_info::SOURCE_SHA256;
 
-    // 初始化日志系统：将日志放到共享文件根目录
-    // 下的 {cluster_name}_cluster_kv_logs 子目录，避免在 shm 根目录下展开普通文件。
-    let kv_logs_dir = Path::new(&config.shared_file_path)
+    // Logs and other large files are isolated from shared.json/peer metadata.
+    let kv_logs_dir = Path::new(&config.large_file_paths.log_root_path)
         .join(format!("{}_cluster_kv_logs", config.cluster_name));
     let observability_disabled = config.test_spec_config.disable_observability;
     let greptime_tracing_rx = if observability_disabled {
@@ -1651,263 +1920,10 @@ async fn run_client_impl(
             config.test_spec_config.side_transfer_role,
             Some(SideTransferRole::Worker)
         );
-    let mut bootstrapped_shared_meta: Option<SharedJsonMeta> = None;
-
-    let config = if is_external {
-        let shared_memory_dir = Path::new(&config.shared_memory_path);
-        let shared_file_dir = Path::new(&config.shared_file_path);
-        let shared_json_path = shared_file_dir.join("shared.json");
-        let mmap_file_path = shared_memory_dir.join("mmap.file");
-
-        let mut waited_ticks: u64 = 0;
-        let (meta, meta_shm_canonical, meta_file_canonical, etcd_endpoints) = loop {
-            if !shared_json_path.exists() || !mmap_file_path.exists() {
-                limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
-                waited_ticks += 1;
-                if waited_ticks % 25 == 0 {
-                    info!(
-                        "Waiting owner shared bundle to be ready... ({}s), shm_dir={} file_dir={} (shared.json={}, mmap.file={})",
-                        waited_ticks / 5,
-                        shared_memory_dir.to_string_lossy(),
-                        shared_file_dir.to_string_lossy(),
-                        shared_json_path.exists(),
-                        mmap_file_path.exists()
-                    );
-                }
-                continue;
-            }
-
-            let shared_json_buf = match std::fs::read_to_string(&shared_json_path) {
-                Ok(v) => v,
-                Err(e) => {
-                    limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200))
-                        .await;
-                    waited_ticks += 1;
-                    if waited_ticks % 25 == 0 {
-                        warn!(
-                            "Waiting owner shared.json readable... ({}s), path={}, err={}",
-                            waited_ticks / 5,
-                            shared_json_path.to_string_lossy(),
-                            e
-                        );
-                    }
-                    continue;
-                }
-            };
-
-            let meta: crate::SharedJsonMeta = match serde_json::from_str(&shared_json_buf) {
-                Ok(v) => v,
-                Err(e) => {
-                    limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200))
-                        .await;
-                    waited_ticks += 1;
-                    if waited_ticks % 25 == 0 {
-                        warn!(
-                            "Waiting owner shared.json schema ready... ({}s), path={}, err={}",
-                            waited_ticks / 5,
-                            shared_json_path.to_string_lossy(),
-                            e
-                        );
-                    }
-                    continue;
-                }
-            };
-
-            if meta.protocol_version != build_version {
-                limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
-                waited_ticks += 1;
-                if waited_ticks % 25 == 0 {
-                    warn!(
-                        "Waiting protocol_version match... ({}s), shm_dir='{}' file_dir='{}', shared='{}', local='{}'",
-                        waited_ticks / 5,
-                        shared_memory_dir.to_string_lossy(),
-                        shared_file_dir.to_string_lossy(),
-                        meta.protocol_version,
-                        build_version
-                    );
-                }
-                continue;
-            }
-
-            if meta.cluster_name != config.cluster_name {
-                limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
-                waited_ticks += 1;
-                if waited_ticks % 25 == 0 {
-                    warn!(
-                        "Waiting cluster_name match... ({}s), shm_dir='{}' file_dir='{}', config='{}', shared.json='{}'",
-                        waited_ticks / 5,
-                        shared_memory_dir.to_string_lossy(),
-                        shared_file_dir.to_string_lossy(),
-                        config.cluster_name,
-                        meta.cluster_name
-                    );
-                }
-                continue;
-            }
-
-            let shared_memory_path_canonical = match std::fs::canonicalize(
-                &config.shared_memory_path,
-            ) {
-                Ok(v) => v.to_string_lossy().into_owned(),
-                Err(e) => {
-                    limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200))
-                        .await;
-                    waited_ticks += 1;
-                    if waited_ticks % 25 == 0 {
-                        warn!(
-                            "Waiting shared_memory_path canonicalizable... ({}s), shm_dir='{}', path='{}', err={}",
-                            waited_ticks / 5,
-                            shared_memory_dir.to_string_lossy(),
-                            config.shared_memory_path,
-                            e
-                        );
-                    }
-                    continue;
-                }
-            };
-
-            let meta_shm_canonical = match std::fs::canonicalize(&meta.shared_memory_path) {
-                Ok(v) => v.to_string_lossy().into_owned(),
-                Err(e) => {
-                    limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200))
-                        .await;
-                    waited_ticks += 1;
-                    if waited_ticks % 25 == 0 {
-                        warn!(
-                            "Waiting shared.json shared_memory_path canonicalizable... ({}s), shm_dir='{}', path='{}', err={}",
-                            waited_ticks / 5,
-                            shared_memory_dir.to_string_lossy(),
-                            meta.shared_memory_path,
-                            e
-                        );
-                    }
-                    continue;
-                }
-            };
-            let shared_file_path_canonical = match std::fs::canonicalize(&config.shared_file_path) {
-                Ok(v) => v.to_string_lossy().into_owned(),
-                Err(e) => {
-                    limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200))
-                        .await;
-                    waited_ticks += 1;
-                    if waited_ticks % 25 == 0 {
-                        warn!(
-                            "Waiting shared_file_path canonicalizable... ({}s), file_dir='{}', path='{}', err={}",
-                            waited_ticks / 5,
-                            shared_file_dir.to_string_lossy(),
-                            config.shared_file_path,
-                            e
-                        );
-                    }
-                    continue;
-                }
-            };
-            let meta_file_canonical = match std::fs::canonicalize(&meta.shared_file_path) {
-                Ok(v) => v.to_string_lossy().into_owned(),
-                Err(e) => {
-                    limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200))
-                        .await;
-                    waited_ticks += 1;
-                    if waited_ticks % 25 == 0 {
-                        warn!(
-                            "Waiting shared.json shared_file_path canonicalizable... ({}s), file_dir='{}', path='{}', err={}",
-                            waited_ticks / 5,
-                            shared_file_dir.to_string_lossy(),
-                            meta.shared_file_path,
-                            e
-                        );
-                    }
-                    continue;
-                }
-            };
-
-            if meta_shm_canonical != shared_memory_path_canonical {
-                limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
-                waited_ticks += 1;
-                if waited_ticks % 25 == 0 {
-                    warn!(
-                        "Waiting shared_memory_path match... ({}s), shm_dir='{}', config='{}', shared.json='{}'",
-                        waited_ticks / 5,
-                        shared_memory_dir.to_string_lossy(),
-                        shared_memory_path_canonical,
-                        meta_shm_canonical
-                    );
-                }
-                continue;
-            }
-            if meta_file_canonical != shared_file_path_canonical {
-                limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
-                waited_ticks += 1;
-                if waited_ticks % 25 == 0 {
-                    warn!(
-                        "Waiting shared_file_path match... ({}s), file_dir='{}', config='{}', shared.json='{}'",
-                        waited_ticks / 5,
-                        shared_file_dir.to_string_lossy(),
-                        shared_file_path_canonical,
-                        meta_file_canonical
-                    );
-                }
-                continue;
-            }
-
-            if meta.etcd_addresses.is_empty() {
-                limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
-                waited_ticks += 1;
-                if waited_ticks % 25 == 0 {
-                    warn!(
-                        "Waiting shared.json etcd_addresses non-empty... ({}s), shm_dir='{}' file_dir='{}', shared_memory_path='{}'",
-                        waited_ticks / 5,
-                        shared_memory_dir.to_string_lossy(),
-                        shared_file_dir.to_string_lossy(),
-                        meta_shm_canonical
-                    );
-                }
-                continue;
-            }
-
-            let etcd_endpoints = match normalize_etcd_addresses(&meta.etcd_addresses) {
-                Ok(v) => v,
-                Err(e) => {
-                    limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200))
-                        .await;
-                    waited_ticks += 1;
-                    if waited_ticks % 25 == 0 {
-                        warn!(
-                            "Waiting shared.json etcd_addresses valid... ({}s), shm_dir='{}' file_dir='{}', raw={:?}, err={}",
-                            waited_ticks / 5,
-                            shared_memory_dir.to_string_lossy(),
-                            shared_file_dir.to_string_lossy(),
-                            meta.etcd_addresses,
-                            e
-                        );
-                    }
-                    continue;
-                }
-            };
-
-            break (
-                meta,
-                meta_shm_canonical,
-                meta_file_canonical,
-                etcd_endpoints,
-            );
-        };
-        bootstrapped_shared_meta = Some(meta.clone());
-        // External bootstrap contract:
-        // - Config provides: instance_key, fluxonkv_spec.cluster_name, fluxonkv_spec.shared_memory_path,
-        //   fluxonkv_spec.shared_file_path, fluxonkv_spec.p2p_listen_port.
-        // - shared.json provides: cluster_name, etcd_addresses (raw), shared_memory_path (canonical),
-        //   shared_file_path (canonical), protocol_version, sub_cluster.
-        // - pprof_duration_seconds is not inherited; it is controlled solely by config.
-        let mut final_config = config.clone();
-        final_config.etcd_addresses_raw = meta.etcd_addresses.clone();
-        final_config.fluxonkv_spec.etcd_addresses = etcd_endpoints;
-        final_config.fluxonkv_spec.sub_cluster = meta.sub_cluster;
-        final_config.shared_memory_path = meta_shm_canonical;
-        final_config.shared_file_path = meta_file_canonical;
-        final_config
+    let bootstrapped_shared_meta = if is_external {
+        Some(wait_for_external_bootstrap_bundle(&config).await?.meta)
     } else {
-        config
+        None
     };
 
     if !is_external && config.test_spec_config.side_transfer_worker_count > 0 {
@@ -2012,6 +2028,7 @@ async fn run_client_impl(
             external_client_api_arg: ExternalClientApiNewArg {
                 shared_memory_path: config.shared_memory_path.clone(),
                 shared_file_path: config.shared_file_path.clone(),
+                cache_root_path: config.large_file_paths.cache_root_path.clone(),
                 expected_cluster_name: config.cluster_name.clone(),
                 expected_protocol_version: build_version.clone(),
                 enable_side_transfer: config.test_spec_config.enable_side_transfer,
@@ -2063,6 +2080,8 @@ async fn run_client_impl(
                 // Read shared memory path from config (must not be empty).
                 shared_memory_path: config.shared_memory_path.clone(),
                 shared_file_path: config.shared_file_path.clone(),
+                log_root_path: config.large_file_paths.log_root_path.clone(),
+                cache_root_path: config.large_file_paths.cache_root_path.clone(),
                 cluster_name: config.cluster_name.clone(),
                 etcd_addresses: config.etcd_addresses_raw.clone(),
                 attach_existing_meta: if is_side_transfer_worker {
@@ -2405,7 +2424,7 @@ async fn run_client_impl(
     }
 
     let shutdown_waiter = framework.cluster_manager_view().register_shutdown_waiter();
-    let kv_profiles_dir = Path::new(&config.shared_file_path)
+    let kv_profiles_dir = Path::new(&config.large_file_paths.log_root_path)
         .join(format!("{}_cluster_kv_profiles", config.cluster_name));
     profile::spawn_pprof_flamegraph_on_timeout_or_shutdown(
         config.pprof_duration_seconds,
@@ -2485,6 +2504,10 @@ mod tests {
             },
             shared_memory_path: "/tmp/fluxon_side_transfer_test".to_string(),
             shared_file_path: "/tmp/fluxon_side_transfer_test_files".to_string(),
+            large_file_paths: crate::config::LargeFilePaths {
+                log_root_path: "/tmp/fluxon_side_transfer_test_large/log".to_string(),
+                cache_root_path: "/tmp/fluxon_side_transfer_test_large/cache".to_string(),
+            },
             test_spec_config: TestSpecConfig {
                 enable_side_transfer: true,
                 side_transfer_worker_count: 4,
@@ -2720,6 +2743,7 @@ mod tests {
         );
         assert!(side_cfg_yaml.contribute_to_cluster_pool_size.is_none());
         assert!(side_cfg_yaml.fluxonkv_spec.etcd_addresses.is_none());
+        assert!(side_cfg_yaml.fluxonkv_spec.large_file_paths.is_none());
         assert!(side_cfg_yaml.fluxonkv_spec.sub_cluster.is_none());
         assert_eq!(side_cfg_yaml.fluxonkv_spec.p2p_listen_port, Some(42001));
         assert_eq!(
@@ -2728,6 +2752,101 @@ mod tests {
         );
     }
 
+    #[tokio::test]
+    async fn zero_contribution_bootstrap_inherits_large_file_paths_from_owner_shared_json() {
+        // Arrange: lay out an owner bundle (directories plus `mmap.file`) in a scratch dir.
+        let scratch = new_test_dir("fluxon_external_bootstrap_large_paths");
+        let shm_dir = scratch.join("shared_mem");
+        let file_dir = scratch.join("shared_file");
+        let log_dir = scratch.join("owner_logs");
+        let cache_dir = scratch.join("owner_cache");
+        for dir in [&shm_dir, &file_dir, &log_dir, &cache_dir] {
+            std::fs::create_dir_all(dir).unwrap();
+        }
+        std::fs::write(shm_dir.join("mmap.file"), vec![0u8; 4096]).unwrap();
+        let shm_canonical = std::fs::canonicalize(&shm_dir).unwrap();
+        let file_canonical = std::fs::canonicalize(&file_dir).unwrap();
+
+        // The owner's `shared.json` advertises canonical shared paths, its own log/cache
+        // roots, a sub-cluster, one etcd address and the current build's commit id.
+        let owner_meta = SharedJsonMeta {
+            owner_id: "owner-a".to_string(),
+            node_start_time: 123,
+            segment_len: 4096,
+            segment_label: Some("cpu:0".to_string()),
+            sub_cluster: Some("owner-sub".to_string()),
+            cluster_name: "test_cluster".to_string(),
+            etcd_addresses: vec!["127.0.0.1:2379".to_string()],
+            shared_memory_path: shm_canonical.to_string_lossy().into_owned(),
+            shared_file_path: file_canonical.to_string_lossy().into_owned(),
+            large_file_paths: crate::config::LargeFilePaths {
+                log_root_path: log_dir.to_string_lossy().into_owned(),
+                cache_root_path: cache_dir.to_string_lossy().into_owned(),
+            },
+            protocol_version:
+                fluxon_util::git_version_build_record::get_current_git_commitid().unwrap(),
+            write_ts: Some(chrono::Utc::now().timestamp_micros()),
+        };
+        let shared_json_bytes = serde_json::to_vec(&owner_meta).unwrap();
+        std::fs::write(file_dir.join("shared.json"), shared_json_bytes).unwrap();
+
+        // The joining client contributes nothing and starts with empty etcd settings, no
+        // sub-cluster and empty large-file roots.
+        let external_config = ClientConfig {
+            cluster_name: "test_cluster".to_string(),
+            etcd_addresses_raw: Vec::new(),
+            instance_key: "external-a".to_string(),
+            contribute_to_cluster_pool_size: ContributeToClusterPoolSize {
+                dram: 0,
+                vram: HashMap::new(),
+            },
+            protocol: ProtocolConfig {
+                protocol_type: ProtocolType::Tcp,
+                rdma_device_names: None,
+            },
+            pprof_duration_seconds: None,
+            redis_compat_listen_addr: None,
+            fluxonkv_spec: FluxonKvSpec {
+                etcd_addresses: Vec::new(),
+                cluster_name: "test_cluster".to_string(),
+                p2p_listen_port: Some(41001),
+                transfer_engine: TransferEngineType::P2p,
+                enable_transfer_rpc_fast_path: false,
+                sub_cluster: None,
+            },
+            shared_memory_path: shm_dir.to_string_lossy().into_owned(),
+            shared_file_path: file_dir.to_string_lossy().into_owned(),
+            large_file_paths: crate::config::LargeFilePaths {
+                log_root_path: String::new(),
+                cache_root_path: String::new(),
+            },
+            test_spec_config: TestSpecConfig::default(),
+        };
+
+        // Act.
+        let bootstrapped = bootstrap_zero_contribution_client_config(external_config)
+            .await
+            .expect("bootstrap zero-contribution config");
+
+        // Assert: roots and sub-cluster match the owner; the etcd address gains `http://`.
+        assert_eq!(
+            bootstrapped.large_file_paths.log_root_path,
+            log_dir.to_string_lossy()
+        );
+        assert_eq!(
+            bootstrapped.large_file_paths.cache_root_path,
+            cache_dir.to_string_lossy()
+        );
+        assert_eq!(
+            bootstrapped.fluxonkv_spec.sub_cluster,
+            Some("owner-sub".to_string())
+        );
+        assert_eq!(
+            bootstrapped.fluxonkv_spec.etcd_addresses,
+            vec!["http://127.0.0.1:2379".to_string()]
+        );
+    }
+
     #[test]
     fn current_exe_name_helpers_detect_python_and_fluxon_kv() {
         assert!(current_exe_looks_like_python(Path::new(
diff --git a/fluxon_rs/fluxon_kv/src/memholder/memholder_test.rs b/fluxon_rs/fluxon_kv/src/memholder/memholder_test.rs
index 377a1c2..5b260c3 100644
--- a/fluxon_rs/fluxon_kv/src/memholder/memholder_test.rs
+++ b/fluxon_rs/fluxon_kv/src/memholder/memholder_test.rs
@@ -94,6 +94,10 @@ fn new_client_config_with_size(
         },
         shared_memory_path: format!("/tmp/kvcache_shared_memory/{}", instance_key),
         shared_file_path: format!("/tmp/kvcache_shared_files/{}", instance_key),
+        large_file_paths: crate::config::LargeFilePaths {
+            log_root_path: format!("/tmp/kvcache_large_logs/{}", instance_key),
+            cache_root_path: format!("/tmp/kvcache_large_cache/{}", instance_key),
+        },
         test_spec_config: TestSpecConfig::default(),
     }
 }
@@ -127,6 +131,10 @@ fn new_zero_contribution_client_config(
         },
         shared_memory_path: format!("/tmp/kvcache_shared_memory/{}", owner_instance_key),
         shared_file_path: format!("/tmp/kvcache_shared_files/{}", owner_instance_key),
+        large_file_paths: crate::config::LargeFilePaths {
+            log_root_path: String::new(),
+            cache_root_path: String::new(),
+        },
         test_spec_config: TestSpecConfig::default(),
     }
 }
diff --git a/fluxon_rs/fluxon_ops/Cargo.toml b/fluxon_rs/fluxon_ops/Cargo.toml
index 0d54fc5..f4f772a 100644
--- a/fluxon_rs/fluxon_ops/Cargo.toml
+++ b/fluxon_rs/fluxon_ops/Cargo.toml
@@ -5,6 +5,7 @@ edition = "2024"
 
 [dependencies]
 anyhow = { workspace = true }
+chrono = { workspace = true }
 serde = { workspace = true }
 serde_json = { workspace = true }
 serde_yaml = { workspace = true }
@@ -28,3 +29,6 @@ fluxon_framework = { path = "../fluxon_framework" }
 fluxon_util = { path = "../fluxon_util" }
 fluxon_cli = { path = "../fluxon_cli" }
 fluxon_proxy = { path = "../fluxon_proxy" }
+
+[dev-dependencies]
+tempfile = { workspace = true }
diff --git a/fluxon_rs/fluxon_ops/build.rs b/fluxon_rs/fluxon_ops/build.rs
index ae424ef..585fbfc 100644
--- a/fluxon_rs/fluxon_ops/build.rs
+++ b/fluxon_rs/fluxon_ops/build.rs
@@ -58,14 +58,23 @@ print(
     String::from_utf8(output.stdout).expect("selection supervisor output must be utf-8")
 }
 
+fn render_log_shard_helper(repo_root: &Path) -> String {
+    let helper_path = repo_root.join("deployment").join("utils").join("log_shard.py");
+    fs::read_to_string(&helper_path)
+        .unwrap_or_else(|e| panic!("read log shard helper failed: {} ({})", helper_path.display(), e))
+}
+
 fn main() {
     let manifest_dir = PathBuf::from(env::var("CARGO_MANIFEST_DIR").expect("CARGO_MANIFEST_DIR"));
     let repo_root = repo_root(&manifest_dir);
     let source = render_selection_supervisor(&repo_root);
+    let log_shard_source = render_log_shard_helper(&repo_root);
 
     let out_dir = PathBuf::from(env::var("OUT_DIR").expect("OUT_DIR"));
     let out_path = out_dir.join("selection_supervisor.py");
     fs::write(&out_path, source).expect("write embedded selection supervisor source");
+    let helper_out_path = out_dir.join("log_shard.py");
+    fs::write(&helper_out_path, log_shard_source).expect("write embedded log shard helper");
 
     println!("cargo:rerun-if-changed=build.rs");
     println!(
@@ -76,4 +85,8 @@ fn main() {
             .join("selection_supervisor_codegen.py")
             .display()
     );
+    println!(
+        "cargo:rerun-if-changed={}",
+        repo_root.join("deployment").join("utils").join("log_shard.py").display()
+    );
 }
diff --git a/fluxon_rs/fluxon_ops/src/lib.rs b/fluxon_rs/fluxon_ops/src/lib.rs
index 40f646a..b27420b 100644
--- a/fluxon_rs/fluxon_ops/src/lib.rs
+++ b/fluxon_rs/fluxon_ops/src/lib.rs
@@ -28,7 +28,8 @@ use fluxon_kv::{ConfigArg, Framework, run_client};
 
 use fluxon_proxy::{HeaderKv, PanelProxyMethod, PanelProxyResp};
 use fluxon_util::{
-    FluxonCliProxyDescriptorV2, FluxonCliProxyTransportV2, fluxon_cli_proxy_desc_etcd_key_v2,
+    FluxonCliProxyDescriptorV2, FluxonCliProxyTransportV2, display_runtime_log_path,
+    fluxon_cli_proxy_desc_etcd_key_v2, resolve_readable_log_path,
 };
 
 pub const OPS_SERVICE_NAME: &str = "ops";
@@ -57,6 +58,7 @@ const OPS_ATOMIC_GROUP_ANNOTATION_KEY: &str = "fluxon.io/atomic_group";
 const OPS_ATOMIC_GROUP_PHASE_ANNOTATION_KEY: &str = "fluxon.io/atomic_group_phase";
 const OPS_ATOMIC_GROUP_ORDER_ANNOTATION_KEY: &str = "fluxon.io/atomic_group_order";
 const OPS_SELECTION_SUPERVISOR_FILENAME: &str = "selection_supervisor.py";
+const OPS_LOG_SHARD_HELPER_FILENAME: &str = "log_shard.py";
 const OPS_SELECTION_SUPERVISOR_DIR_NAME: &str = "selection_supervisor";
 const OPS_SELECTION_SUPERVISOR_RUN_RESTART_DELAY_SECONDS: u64 = 5;
 const OPS_SELECTION_SUPERVISOR_RUN_MAX_BACKOFF_SECONDS: u64 = 30;
@@ -78,6 +80,7 @@ const DELETE_APPLY_NO_WAIT_DELAY_SECONDS: u64 = 30;
 
 const EMBEDDED_SELECTION_SUPERVISOR_SOURCE: &str =
     include_str!(concat!(env!("OUT_DIR"), "/selection_supervisor.py"));
+const EMBEDDED_LOG_SHARD_HELPER_SOURCE: &str = include_str!(concat!(env!("OUT_DIR"), "/log_shard.py"));
 
 // Ops controller uses Fluxon user-RPC to talk to ops agents.
 // Keep the timeout as a fixed constant to avoid config surface area.
@@ -970,7 +973,7 @@ fn resolve_python_host_executable(python_exe: &Path) -> anyhow::Result<PathBuf>
     Ok(resolved)
 }
 
-fn ensure_embedded_selection_supervisor(workdir: &Path) -> anyhow::Result<PathBuf> {
+fn ensure_embedded_selection_supervisor_runtime(workdir: &Path) -> anyhow::Result<(PathBuf, PathBuf)> {
     let runtime_dir = workdir.join(OPS_SELECTION_SUPERVISOR_DIR_NAME);
     std::fs::create_dir_all(&runtime_dir).with_context(|| {
         format!(
@@ -979,6 +982,7 @@ fn ensure_embedded_selection_supervisor(workdir: &Path) -> anyhow::Result<PathBu
         )
     })?;
     let script_path = runtime_dir.join(OPS_SELECTION_SUPERVISOR_FILENAME);
+    let helper_path = runtime_dir.join(OPS_LOG_SHARD_HELPER_FILENAME);
     let should_write = match std::fs::read_to_string(&script_path) {
         Ok(existing) => existing != EMBEDDED_SELECTION_SUPERVISOR_SOURCE,
         Err(e) => {
@@ -992,6 +996,19 @@ fn ensure_embedded_selection_supervisor(workdir: &Path) -> anyhow::Result<PathBu
             }
         }
     };
+    let should_write_helper = match std::fs::read_to_string(&helper_path) {
+        Ok(existing) => existing != EMBEDDED_LOG_SHARD_HELPER_SOURCE,
+        Err(e) => {
+            if e.kind() == std::io::ErrorKind::NotFound {
+                true
+            } else {
+                return Err(anyhow::Error::new(e).context(format!(
+                    "read embedded log shard helper failed: {}",
+                    helper_path.display()
+                )));
+            }
+        }
+    };
     if should_write {
         std::fs::write(&script_path, EMBEDDED_SELECTION_SUPERVISOR_SOURCE).with_context(|| {
             format!(
@@ -1019,13 +1036,21 @@ fn ensure_embedded_selection_supervisor(workdir: &Path) -> anyhow::Result<PathBu
             })?;
         }
     }
-    Ok(script_path)
+    if should_write_helper {
+        std::fs::write(&helper_path, EMBEDDED_LOG_SHARD_HELPER_SOURCE).with_context(|| {
+            format!(
+                "write embedded log shard helper failed: {}",
+                helper_path.display()
+            )
+        })?;
+    }
+    Ok((script_path, helper_path))
 }
 
 impl SelectionSupervisorRuntime {
     fn materialize(workdir: &Path, hostworkdir: &Path, python_exe: &Path) -> anyhow::Result<Self> {
         let python_exe = resolve_python_host_executable(python_exe)?;
-        let script_path = ensure_embedded_selection_supervisor(workdir)?;
+        let (script_path, _helper_path) = ensure_embedded_selection_supervisor_runtime(workdir)?;
         if !hostworkdir.is_absolute() {
             anyhow::bail!(
                 "hostworkdir must be absolute for shared selection supervisor runtime: {}",
@@ -1647,7 +1672,9 @@ fn selection_status_from_live_supervisor(
         apply_id: runtime_state.as_ref().and_then(|v| v.apply_id.clone()),
         argv: runtime_state.as_ref().map(|v| v.argv.clone()),
         cwd: runtime_state.as_ref().and_then(|v| v.cwd.clone()),
-        log_path: runtime_state.as_ref().map(|v| v.log_path.clone()),
+        log_path: runtime_state
+            .as_ref()
+            .map(|v| display_runtime_log_path(v.log_path.as_str())),
         started_ts_ms: None,
         owner_ts_ms: Some(supervisor.owner_ts_ms),
         supervisor_start_time_ticks: Some(supervisor.start_time_ticks()),
@@ -2970,7 +2997,8 @@ impl UserRpcHandler for ReadWorkloadLogChunkHandler {
             }
         };
 
-        let path = self.log_dir.join(log_filename);
+        let logical_path = self.log_dir.join(log_filename);
+        let path = resolve_readable_log_path(&logical_path).unwrap_or(logical_path.clone());
         let meta = match std::fs::metadata(&path) {
             Ok(v) => v,
             Err(e) => {
@@ -3773,8 +3801,12 @@ fn desired_workload_matches_running(
     workloads: &SupervisorBackedWorkloads,
     desired: &AgentDesiredWorkload,
 ) -> bool {
-    let _ = workloads;
-    let Ok(status) = observe_selection_status(desired.kind, &desired.name, &desired.authority)
+    let Ok(status) = observe_selection_status_for_scope(
+        desired.kind,
+        &desired.name,
+        &desired.authority,
+        Some(workloads.scope_key.as_str()),
+    )
     else {
         return false;
     };
@@ -3854,7 +3886,6 @@ fn desired_workload_recovery_superseded(
     workloads: &SupervisorBackedWorkloads,
     desired: &AgentDesiredWorkload,
 ) -> anyhow::Result<bool> {
-    let _ = workloads;
     // English note:
     // - A newer apply-owned generation overlapping an older applyless bare owner is the expected
     //   phase-1 state of the self-host two-phase handover.
@@ -3863,7 +3894,12 @@ fn desired_workload_recovery_superseded(
     //   phase 2 has a chance to cut over.
     // - Only an owner_ts that is newer than the requested workload and is not this intentional
     //   phase-1 overlap is treated as a hard superseding fact.
-    let status = observe_selection_status(desired.kind, &desired.name, &desired.authority)?;
+    let status = observe_selection_status_for_scope(
+        desired.kind,
+        &desired.name,
+        &desired.authority,
+        Some(workloads.scope_key.as_str()),
+    )?;
     if phase1_overlap_with_applyless_owner(&status, desired) {
         return Ok(false);
     }
@@ -13938,6 +13974,90 @@ mod tests {
         assert!(err_text.contains("owner_ts_ms collision"), "{err_text}");
     }
 
+    #[test]
+    fn live_selection_supervisors_isolate_same_label_collision_by_scope_key() {
+        let snapshot = SelectionSupervisorProcSnapshot {
+            infos_by_pid: std::collections::HashMap::from([
+                (
+                    11,
+                    ProcessInfoObservation {
+                        pid: 11,
+                        ppid: 1,
+                        pgid: 11,
+                        state: 'S',
+                        start_time_ticks: 100,
+                    },
+                ),
+                (
+                    22,
+                    ProcessInfoObservation {
+                        pid: 22,
+                        ppid: 1,
+                        pgid: 22,
+                        state: 'S',
+                        start_time_ticks: 200,
+                    },
+                ),
+            ]),
+            children_by_ppid: std::collections::HashMap::new(),
+            cmdlines: vec![
+                (
+                    11,
+                    vec![
+                        "/usr/bin/python3".to_string(),
+                        "selection_supervisor.py".to_string(),
+                        "run".to_string(),
+                        "--label".to_string(),
+                        "DaemonSet/target".to_string(),
+                        "--scope-key".to_string(),
+                        "/tmp/scope-a".to_string(),
+                        "--owner-ts-ms".to_string(),
+                        "2".to_string(),
+                    ],
+                ),
+                (
+                    22,
+                    vec![
+                        "/usr/bin/python3".to_string(),
+                        "selection_supervisor.py".to_string(),
+                        "run".to_string(),
+                        "--label".to_string(),
+                        "DaemonSet/target".to_string(),
+                        "--scope-key".to_string(),
+                        "/tmp/scope-b".to_string(),
+                        "--owner-ts-ms".to_string(),
+                        "2".to_string(),
+                    ],
+                ),
+            ],
+            zombie_infos: Vec::new(),
+        };
+
+        let scoped_a =
+            live_selection_supervisors(&snapshot, Some("DaemonSet/target"), Some("/tmp/scope-a"))
+                .unwrap();
+        assert_eq!(scoped_a.len(), 1);
+        assert_eq!(scoped_a[0].pid(), 11);
+
+        let scoped_b =
+            live_selection_supervisors(&snapshot, Some("DaemonSet/target"), Some("/tmp/scope-b"))
+                .unwrap();
+        assert_eq!(scoped_b.len(), 1);
+        assert_eq!(scoped_b[0].pid(), 22);
+
+        let listed_a = observe_all_selection_statuses_for_snapshot(&snapshot, Some("/tmp/scope-a"))
+            .unwrap();
+        assert_eq!(listed_a.len(), 1);
+        assert_eq!(listed_a[0].label, "DaemonSet/target");
+        assert_eq!(listed_a[0].pid, Some(11));
+
+        let listed_b = observe_all_selection_statuses_for_snapshot(&snapshot, Some("/tmp/scope-b"))
+            .unwrap();
+        assert_eq!(listed_b.len(), 1);
+        assert_eq!(listed_b[0].label, "DaemonSet/target");
+        assert_eq!(listed_b[0].pid, Some(22));
+    }
+
     #[test]
     fn live_selection_supervisors_reject_matching_legacy_entry_without_owner_ts_ms() {
         let snapshot = SelectionSupervisorProcSnapshot {
@@ -14405,6 +14525,95 @@ mod tests {
             .unwrap();
     }
 
+    #[test]
+    fn materialize_selection_supervisor_runtime_writes_log_shard_helper() {
+        let python_exe = PathBuf::from("/usr/bin/python3");
+        assert!(
+            python_exe.is_file(),
+            "python executable does not exist: {}",
+            python_exe.display()
+        );
+        let workdir = tempfile::tempdir().unwrap();
+        let runtime =
+            SelectionSupervisorRuntime::materialize(workdir.path(), workdir.path(), python_exe.as_path())
+                .unwrap();
+        assert!(runtime.script_path.exists());
+        assert!(
+            runtime
+                .script_path
+                .parent()
+                .unwrap()
+                .join(OPS_LOG_SHARD_HELPER_FILENAME)
+                .is_file()
+        );
+    }
+
+    #[test]
+    fn detached_selection_supervisor_preserves_early_startup_logs() {
+        let python_exe = PathBuf::from("/usr/bin/python3");
+        assert!(
+            python_exe.is_file(),
+            "python executable does not exist: {}",
+            python_exe.display()
+        );
+        let workdir = tempfile::tempdir().unwrap();
+        let runtime =
+            SelectionSupervisorRuntime::materialize(workdir.path(), workdir.path(), python_exe.as_path())
+                .unwrap();
+        let log_path = workdir.path().join("startup.log");
+        let command = vec![
+            python_exe.display().to_string(),
+            runtime.script_path.display().to_string(),
+            "run".to_string(),
+            "--label".to_string(),
+            "Deployment/startup_demo".to_string(),
+            "--scope-key".to_string(),
+            workdir.path().display().to_string(),
+            "--owner-ts-ms".to_string(),
+            "0".to_string(),
+            "--restart-policy".to_string(),
+            "always".to_string(),
+            "--restart-delay-seconds".to_string(),
+            "5".to_string(),
+            "--max-backoff-seconds".to_string(),
+            "30".to_string(),
+            "--crashloop-consecutive-restarts".to_string(),
+            "0".to_string(),
+            "--crashloop-interval-lt-seconds".to_string(),
+            "0".to_string(),
+            "--".to_string(),
+            "/bin/true".to_string(),
+        ];
+        let pid = runtime.spawn_detached_command(&log_path, command.as_slice()).unwrap();
+        let deadline = Instant::now() + Duration::from_secs(10);
+        let expected = "owner-ts-ms must be positive";
+        let mut saw_expected = false;
+        while Instant::now() < deadline {
+            if let Some(path) = resolve_readable_log_path(&log_path) {
+                let text = std::fs::read_to_string(path).unwrap_or_default();
+                if text.contains(expected) {
+                    saw_expected = true;
+                    break;
+                }
+            }
+            std::thread::sleep(Duration::from_millis(100));
+        }
+        if let Some(path) = resolve_readable_log_path(&log_path) {
+            let text = std::fs::read_to_string(path).unwrap_or_default();
+            assert!(
+                text.contains(expected),
+                "expected detached supervisor startup logs to reach runtime log, got: {text:?}"
+            );
+        } else {
+            panic!("runtime log path did not materialize");
+        }
+        assert!(saw_expected, "startup log was not observed before timeout");
+        let _ = std::process::Command::new("kill")
+            .arg("-TERM")
+            .arg(pid.to_string())
+            .status();
+    }
+
     #[test]
     fn atomic_group_non_agent_requires_present_before_running_match() {
         let desired = AgentDesiredWorkload {
@@ -14616,4 +14825,25 @@ mod tests {
         };
         assert!(!phase1_overlap_with_applyless_owner(&status, &desired));
     }
+
+    #[test]
+    fn resolve_readable_log_path_prefers_latest_daily_shard() {
+        let td = tempfile::tempdir().unwrap();
+        let base_path = td.path().join("workload__Deployment__demo.log");
+        std::fs::write(
+            td.path().join("workload__Deployment__demo.2026-06-19.log"),
+            "old\n",
+        )
+        .unwrap();
+        std::fs::write(
+            td.path().join("workload__Deployment__demo.2026-06-20.log"),
+            "new\n",
+        )
+        .unwrap();
+        let resolved = resolve_readable_log_path(&base_path).unwrap();
+        assert_eq!(
+            resolved.file_name().and_then(|v| v.to_str()),
+            Some("workload__Deployment__demo.2026-06-20.log")
+        );
+    }
 }
diff --git a/fluxon_rs/fluxon_util/build.rs b/fluxon_rs/fluxon_util/build.rs
index 0f586d3..2bf7b87 100644
--- a/fluxon_rs/fluxon_util/build.rs
+++ b/fluxon_rs/fluxon_util/build.rs
@@ -88,12 +88,15 @@ fn collect_crates_for_runtime(ws: &CargoWorkspace) {
     println!("cargo:rerun-if-changed=Cargo.toml");
 }
 
-fn try_discover_git_dir(manifest_dir: &Path) -> Option<PathBuf> {
+fn try_discover_git_dir(manifest_dir: &Path, workspace_root: &Path) -> Option<PathBuf> {
+    let workspace_search_ceiling = workspace_root.parent().unwrap_or(workspace_root);
     let mut cur = Some(manifest_dir);
     while let Some(dir) = cur {
         let candidate = dir.join(".git");
         if candidate.is_dir() {
-            return Some(candidate);
+            if candidate.join("HEAD").is_file() {
+                return Some(candidate);
+            }
         }
         if candidate.is_file() {
             // Worktree/submodule style: .git is a file containing `gitdir: <path>`
@@ -106,11 +109,17 @@ fn try_discover_git_dir(manifest_dir: &Path) -> Option<PathBuf> {
                 .unwrap_or_else(|| panic!("invalid .git file format: {}", candidate.display()))
                 .trim();
             let gitdir_path = Path::new(gitdir);
-            return Some(if gitdir_path.is_absolute() {
+            let resolved = if gitdir_path.is_absolute() {
                 gitdir_path.to_path_buf()
             } else {
                 dir.join(gitdir_path)
-            });
+            };
+            if resolved.join("HEAD").is_file() {
+                return Some(resolved);
+            }
+        }
+        if dir == workspace_search_ceiling {
+            break;
         }
         cur = dir.parent();
     }
@@ -309,7 +318,7 @@ fn main() {
             v
         }
         Err(_) => {
-            match try_discover_git_dir(&manifest_dir) {
+            match try_discover_git_dir(&manifest_dir, &ws.workspace_root) {
                 Some(git_dir) => {
                     emit_rerun_hints(&git_dir);
                     resolve_head_commit_id(&git_dir)
diff --git a/fluxon_rs/fluxon_util/src/lib.rs b/fluxon_rs/fluxon_util/src/lib.rs
index 2f4f9fa..e575a75 100644
--- a/fluxon_rs/fluxon_util/src/lib.rs
+++ b/fluxon_rs/fluxon_util/src/lib.rs
@@ -36,7 +36,12 @@ pub mod limitrate;
 // PyO3 helpers: run long-time Python call without holding GIL in caller thread.
 pub mod pyo3;
 // Re-export for stable public API: existing call sites can keep using `fluxon_util::init_log`.
-pub use log::{current_log_file_path, init_log, init_log_test, init_log_with_extra_layer};
+pub use log::{
+    current_daily_sharded_log_path, current_log_file_path, daily_sharded_log_path,
+    display_runtime_log_path, init_log, init_log_test, init_log_with_extra_layer,
+    latest_existing_daily_sharded_log_path, resolve_readable_log_path,
+    DEFAULT_DAILY_LOG_RETENTION_DAYS,
+};
 #[cfg(test)]
 mod test_util_test;
 
diff --git a/fluxon_rs/fluxon_util/src/log.rs b/fluxon_rs/fluxon_util/src/log.rs
index db3d88f..648650f 100644
--- a/fluxon_rs/fluxon_util/src/log.rs
+++ b/fluxon_rs/fluxon_util/src/log.rs
@@ -3,6 +3,7 @@ use std::io;
 use std::path::{Path, PathBuf};
 use std::sync::OnceLock;
 
+use parking_lot::Mutex;
 use tracing_appender::non_blocking;
 use tracing_appender::non_blocking::WorkerGuard;
 use tracing_subscriber::EnvFilter;
@@ -20,6 +21,9 @@ mod generated_crates {
 // RPC fast-path traffic actually entered the closed transfer / verbs backend. Keep the scope explicit:
 // only these dependency targets are promoted to DEBUG alongside workspace crates.
 const RDMA_DEBUG_TARGETS: &[&str] = &["fabric_lib", "libfabric_sys", "libibverbs_sys"];
+const LOG_RETENTION_DAYS: usize = 31;
+const TEST_LOG_SHARD_WINDOW_SECONDS_ENV: &str = "FLUXON_TEST_LOG_SHARD_WINDOW_SECONDS";
+const TEST_LOG_SHARD_ANCHOR_UNIX_SECONDS_ENV: &str = "FLUXON_TEST_LOG_SHARD_ANCHOR_UNIX_SECONDS";
 
 // Simple UTC timer in RFC3339 seconds (no subsecond precision)
 struct UtcSecondTimer;
@@ -37,6 +41,191 @@ static GLOBAL_CONSOLE_LOG_GUARD: OnceLock<WorkerGuard> = OnceLock::new();
 // Expose the current process log file path for sidecar collectors (e.g. OTLP tailer).
 static GLOBAL_LOG_FILE_PATH: OnceLock<PathBuf> = OnceLock::new();
 
+pub const DEFAULT_DAILY_LOG_RETENTION_DAYS: usize = LOG_RETENTION_DAYS;
+
+#[derive(Clone, Copy, Debug)]
+struct LogShardWindowConfig {
+    window_seconds: i64,
+    anchor_unix_seconds: i64,
+}
+
+fn read_test_log_shard_window_config() -> anyhow::Result<Option<LogShardWindowConfig>> {
+    let Some(raw_window) = std::env::var_os(TEST_LOG_SHARD_WINDOW_SECONDS_ENV) else {
+        return Ok(None);
+    };
+    let raw_window = raw_window
+        .into_string()
+        .map_err(|_| anyhow::anyhow!("{TEST_LOG_SHARD_WINDOW_SECONDS_ENV} must be valid utf-8"))?;
+    let window_text = raw_window.trim();
+    if window_text.is_empty() {
+        return Ok(None);
+    }
+    let window_seconds: i64 = window_text.parse().map_err(|e| {
+        anyhow::anyhow!(
+            "{TEST_LOG_SHARD_WINDOW_SECONDS_ENV} must be a positive integer: {e}"
+        )
+    })?;
+    if window_seconds <= 0 {
+        anyhow::bail!("{TEST_LOG_SHARD_WINDOW_SECONDS_ENV} must be > 0");
+    }
+
+    let raw_anchor = std::env::var(TEST_LOG_SHARD_ANCHOR_UNIX_SECONDS_ENV).map_err(|_| {
+        anyhow::anyhow!(
+            "{TEST_LOG_SHARD_ANCHOR_UNIX_SECONDS_ENV} is required when {TEST_LOG_SHARD_WINDOW_SECONDS_ENV} is set"
+        )
+    })?;
+    let anchor_unix_seconds: i64 = raw_anchor.trim().parse().map_err(|e| {
+        anyhow::anyhow!(
+            "{TEST_LOG_SHARD_ANCHOR_UNIX_SECONDS_ENV} must be an integer unix timestamp: {e}"
+        )
+    })?;
+    Ok(Some(LogShardWindowConfig {
+        window_seconds,
+        anchor_unix_seconds,
+    }))
+}
+
+/// Map `now` to its shard date: the UTC calendar date, or, when a test shard window is
+/// configured, 2026-01-01 plus one day per whole window elapsed since the anchor.
+fn resolve_shard_date_from_datetime(now: chrono::DateTime<chrono::Utc>) -> anyhow::Result<chrono::NaiveDate> {
+    let Some(config) = read_test_log_shard_window_config()? else {
+        return Ok(now.date_naive());
+    };
+    let (anchor, ts) = (config.anchor_unix_seconds, now.timestamp());
+    if ts - anchor < 0 {
+        anyhow::bail!("test log shard anchor must not be in the future: anchor={anchor}, ts={ts}");
+    }
+    let bucket_index = (ts - anchor) / config.window_seconds;
+    let base_date = chrono::NaiveDate::from_ymd_opt(2026, 1, 1)
+        .expect("valid hard-coded synthetic base date");
+    // `NaiveDate + Days` panics past the representable range; report it as an error instead.
+    base_date
+        .checked_add_days(chrono::Days::new(bucket_index as u64))
+        .ok_or_else(|| anyhow::anyhow!("test log shard bucket {bucket_index} overflows the date range"))
+}
+
+fn current_shard_date() -> anyhow::Result<chrono::NaiveDate> {
+    resolve_shard_date_from_datetime(chrono::Utc::now())
+}
+
+/// Delete sibling shards `<stem>.<YYYY-MM-DD>.log` of `base_path` dated before the
+/// retention window (`retention_days` days ending at the current shard date).
+/// A `base_path` without parent, UTF-8 file name, or `.log` suffix is a no-op.
+fn cleanup_old_daily_sharded_logs(
+    base_path: &Path,
+    retention_days: usize,
+) -> anyhow::Result<()> {
+    let Some(parent) = base_path.parent() else {
+        return Ok(());
+    };
+    let file_name = base_path.file_name().and_then(|v| v.to_str());
+    let Some(stem) = file_name.and_then(|name| name.strip_suffix(".log")) else {
+        return Ok(());
+    };
+    fs::create_dir_all(parent)?;
+    let keep_since = current_shard_date()? - chrono::Days::new(retention_days.saturating_sub(1) as u64);
+    let prefix = format!("{stem}.");
+    for entry in std::fs::read_dir(parent)? {
+        let entry = entry?;
+        let path = entry.path();
+        if !path.is_file() {
+            continue;
+        }
+        let entry_name = entry.file_name();
+        // Strip affixes, don't index-slice: the undated `<stem>.log` made that slice panic.
+        let date_text = entry_name
+            .to_str()
+            .and_then(|name| name.strip_prefix(prefix.as_str()))
+            .and_then(|rest| rest.strip_suffix(".log"));
+        let Some(date_text) = date_text else {
+            continue;
+        };
+        let Ok(shard_date) = chrono::NaiveDate::parse_from_str(date_text, "%Y-%m-%d") else {
+            continue;
+        };
+        if shard_date < keep_since {
+            match fs::remove_file(&path) {
+                Ok(()) => {}
+                Err(err) if err.kind() == io::ErrorKind::NotFound => {}
+                Err(err) => return Err(err.into()),
+            }
+        }
+    }
+    Ok(())
+}
+
+#[derive(Debug)]
+struct DailyShardedFileWriter {
+    base_path: PathBuf,
+    retention_days: usize,
+    state: Mutex<DailyShardedFileWriterState>,
+}
+
+#[derive(Debug, Default)]
+struct DailyShardedFileWriterState {
+    current_path: Option<PathBuf>,
+    current_file: Option<fs::File>,
+}
+
+impl DailyShardedFileWriter {
+    fn new(base_path: PathBuf, retention_days: usize) -> Self {
+        Self {
+            base_path,
+            retention_days,
+            state: Mutex::new(DailyShardedFileWriterState::default()),
+        }
+    }
+
+    fn current_path(&self) -> anyhow::Result<PathBuf> {
+        current_daily_sharded_log_path(&self.base_path)
+    }
+
+    fn rotate_if_needed(
+        &self,
+        state: &mut DailyShardedFileWriterState,
+    ) -> io::Result<()> {
+        let next_path = self
+            .current_path()
+            .map_err(|err| io::Error::new(io::ErrorKind::Other, err.to_string()))?;
+        if state.current_path.as_ref() == Some(&next_path) && state.current_file.is_some() {
+            return Ok(());
+        }
+        cleanup_old_daily_sharded_logs(&self.base_path, self.retention_days)
+            .map_err(|err| io::Error::new(io::ErrorKind::Other, err.to_string()))?;
+        if let Some(parent) = next_path.parent() {
+            fs::create_dir_all(parent)?;
+        }
+        let file = fs::OpenOptions::new()
+            .create(true)
+            .append(true)
+            .open(&next_path)?;
+        state.current_path = Some(next_path);
+        state.current_file = Some(file);
+        Ok(())
+    }
+}
+
+impl io::Write for DailyShardedFileWriter {
+    fn write(&mut self, buf: &[u8]) -> io::Result<usize> {
+        let mut state = self.state.lock();
+        self.rotate_if_needed(&mut state)?;
+        state
+            .current_file
+            .as_mut()
+            .expect("log writer file must exist after rotation")
+            .write(buf)
+    }
+
+    fn flush(&mut self) -> io::Result<()> {
+        let mut state = self.state.lock();
+        if let Some(file) = state.current_file.as_mut() {
+            file.flush()
+        } else {
+            Ok(())
+        }
+    }
+}
+
 fn setup_global_log_guards(file_guard: WorkerGuard, console_guard: WorkerGuard) {
     let _ = GLOBAL_FILE_LOG_GUARD.set(file_guard);
     let _ = GLOBAL_CONSOLE_LOG_GUARD.set(console_guard);
@@ -90,9 +279,9 @@ fn third_party_log_target_overrides(
     targets
 }
 
-/// Init log for production
+/// Init log for production.
 /// - `log_path`: directory to write log files
-/// - `instance_key`: used in file names to disambiguate instances
+/// - `instance_key`: used in daily file names to disambiguate instances
 pub fn init_log(log_path: &Path, instance_key: &str) {
     init_log_impl(log_path, instance_key, NoopLayer);
 }
@@ -113,6 +302,95 @@ struct NoopLayer;
 
 impl<S> tracing_subscriber::Layer<S> for NoopLayer where S: tracing::Subscriber {}
 
+fn current_daily_log_file_path(log_path: &Path, instance_key: &str) -> PathBuf {
+    current_daily_sharded_log_path(&log_path.join(format!("fluxon-kv-{instance_key}.log")))
+        .unwrap_or_else(|_| {
+            let date = chrono::Utc::now().format("%Y-%m-%d");
+            log_path.join(format!("fluxon-kv-{instance_key}.{date}.log"))
+        })
+}
+
+/// Build the dated shard path `<stem>.<YYYY-MM-DD>.log` next to `base_path`.
+///
+/// Errors when `base_path` has no UTF-8 file name or the name lacks a `.log` suffix.
+pub fn daily_sharded_log_path(
+    base_path: &Path,
+    date: chrono::NaiveDate,
+) -> anyhow::Result<PathBuf> {
+    let Some(file_name) = base_path.file_name().and_then(|v| v.to_str()) else {
+        anyhow::bail!(
+            "log path must end with a valid utf-8 filename: {}",
+            base_path.display()
+        );
+    };
+    let Some(stem) = file_name.strip_suffix(".log") else {
+        anyhow::bail!("log path must end with .log: {}", base_path.display());
+    };
+    let shard_name = format!("{}.{}.log", stem, date.format("%Y-%m-%d"));
+    Ok(base_path.with_file_name(shard_name))
+}
+
+pub fn current_daily_sharded_log_path(base_path: &Path) -> anyhow::Result<PathBuf> {
+    daily_sharded_log_path(base_path, current_shard_date()?)
+}
+
+/// Return the newest existing `<stem>.<YYYY-MM-DD>.log` sibling of `base_path`.
+/// `None` when `base_path` has no parent or no UTF-8 `*.log` file name, when the
+/// directory cannot be listed, or when no dated shard exists. Entries that cannot
+/// be read or are not dated shards are skipped instead of aborting the scan.
+pub fn latest_existing_daily_sharded_log_path(base_path: &Path) -> Option<PathBuf> {
+    let parent = base_path.parent()?;
+    let stem = base_path.file_name()?.to_str()?.strip_suffix(".log")?;
+    let prefix = format!("{}.", stem);
+    let mut latest: Option<(chrono::NaiveDate, PathBuf)> = None;
+    for entry in std::fs::read_dir(parent).ok()? {
+        // `continue`, not `?`: one stray `<stem>.<other>.log` must not hide every real shard.
+        let Ok(entry) = entry else {
+            continue;
+        };
+        let path = entry.path();
+        if !path.is_file() {
+            continue;
+        }
+        let entry_name = entry.file_name();
+        let date = entry_name
+            .to_str()
+            .and_then(|name| name.strip_prefix(prefix.as_str()))
+            .and_then(|rest| rest.strip_suffix(".log"))
+            .and_then(|text| chrono::NaiveDate::parse_from_str(text, "%Y-%m-%d").ok());
+        let Some(date) = date else {
+            continue;
+        };
+        if latest.as_ref().map_or(true, |(prev, _)| date > *prev) {
+            latest = Some((date, path));
+        }
+    }
+    latest.map(|(_, path)| path)
+}
+
+/// Pick the file a reader should open for the logical log `base_path`.
+///
+/// Preference order: the current shard if it exists, else the newest existing dated
+/// shard, else `base_path` itself if it exists; `None` when none of them exist.
+pub fn resolve_readable_log_path(base_path: &Path) -> Option<PathBuf> {
+    current_daily_sharded_log_path(base_path)
+        .ok()
+        .filter(|current| current.exists())
+        .or_else(|| latest_existing_daily_sharded_log_path(base_path))
+        .or_else(|| {
+            let undated = base_path.to_path_buf();
+            undated.exists().then_some(undated)
+        })
+}
+
+/// Render the path a reader should open for the logical log path `base_path_text`;
+/// falls back to `base_path_text` itself when no readable file resolves.
+pub fn display_runtime_log_path(base_path_text: &str) -> String {
+    let base_path = Path::new(base_path_text);
+    let shown = resolve_readable_log_path(base_path).unwrap_or_else(|| base_path.to_path_buf());
+    shown.display().to_string()
+}
+
 fn init_log_impl<L>(log_path: &Path, instance_key: &str, extra_layer: L)
 where
     L: tracing_subscriber::Layer<Registry> + Send + Sync + 'static,
@@ -238,83 +516,9 @@ where
         }
     }
 
-    // Archive existing logs for the same instance into a sibling history directory.
-    // Scope is strictly within the provided `log_path` (cluster is implied by the dir path),
-    // and only files of the current `instance_key` are moved. This avoids any cross-instance
-    // interference and keeps behavior explicit and bounded.
-    {
-        let history_dir = log_path.join("history");
-        if let Err(e) = fs::create_dir_all(&history_dir) {
-            panic!(
-                "[fluxon] Create history directory failed: {:?}. Base log_path: {:?}. \
-This log_path is provided by the caller's configuration. \
-For Master mode it is derived from MasterConfigYaml.log_dir with a subdirectory '<cluster_name>_cluster_kv_logs'; \
-for Client mode it is derived from ClientConfigYaml.fluxonkv_spec.shared_memory_path with subdirectory '<cluster_name>_cluster_kv_logs'. \
-Please ensure the directory exists and is writable. Underlying OS error: {:?}",
-                history_dir, log_path, e
-            );
-        }
-
-        // Pattern: fluxon-kv-<instance_key>.<timestamp>.log
-        // No fallback patterns: keep rule strict and explicit.
-        let prefix = format!("fluxon-kv-{}.", instance_key);
-        let mut moved = 0usize;
-
-        let iter = fs::read_dir(log_path).unwrap_or_else(|e| {
-            panic!(
-                "[fluxon] Read log directory failed at {:?}. This directory is the configured log_path described above. OS error: {:?}",
-                log_path, e
-            )
-        });
-
-        for entry in iter {
-            let entry = entry.unwrap_or_else(|e| {
-                panic!(
-                    "[fluxon] Failed to read a directory entry under {:?}. OS error: {:?}",
-                    log_path, e
-                )
-            });
-            let path = entry.path();
-            if !path.is_file() {
-                continue;
-            }
-            let name_os = match path.file_name() {
-                Some(n) => n,
-                None => continue,
-            };
-            let name = match name_os.to_str() {
-                Some(s) => s,
-                None => continue,
-            };
-            let is_target = name.starts_with(&prefix) && name.ends_with(".log");
-            if !is_target {
-                continue;
-            }
-            let dst = history_dir.join(name);
-            if let Err(err) = fs::rename(&path, &dst) {
-                panic!(
-                    "[fluxon] Move old log failed: {:?} -> {:?}. Base log_path: {:?}. OS error: {:?}",
-                    path, dst, log_path, err
-                );
-            }
-            moved += 1;
-        }
-
-        if moved > 0 {
-            println!(
-                "[fluxon] Archived {moved} existing logs for instance_key='{instance_key}' into {:?}",
-                history_dir
-            );
-        }
-    }
-
-    // Files named with UTC timestamp once per process run
-    let ts = chrono::Utc::now().format("%Y-%m-%d_%H-%M-%S");
-
     // File log keeps workspace crates at DEBUG; non-workspace crates default to WARN.
     // This avoids dumping verbose dependency debug logs (e.g. h2/tower) into file output.
-    let file_name = format!("fluxon-kv-{instance_key}.{ts}.log");
-    let file_path = log_path.join(&file_name);
+    let file_path = current_daily_log_file_path(log_path, instance_key);
     // Keep a copy for the whole process lifetime; collectors can clone it.
     if let Some(prev) = GLOBAL_LOG_FILE_PATH.get() {
         if prev != &file_path {
@@ -326,18 +530,11 @@ Please ensure the directory exists and is writable. Underlying OS error: {:?}",
     } else {
         let _ = GLOBAL_LOG_FILE_PATH.set(file_path.clone());
     }
-    let file = match std::fs::OpenOptions::new()
-        .create(true)
-        .append(true)
-        .open(&file_path)
-    {
-        Ok(f) => f,
-        Err(e) => {
-            eprintln!("Failed to open log file {:?}, err: {:?}", file_path, e);
-            return;
-        }
-    };
-    let (file_writer, file_guard) = non_blocking(file);
+    let file_appender = DailyShardedFileWriter::new(
+        log_path.join(format!("fluxon-kv-{instance_key}.log")),
+        LOG_RETENTION_DAYS,
+    );
+    let (file_writer, file_guard) = non_blocking(file_appender);
     let enable_iceoryx_logs = matches!(
         std::env::var("FLUXON_ENABLE_ICEORYX_LOGS")
             .ok()
@@ -380,10 +577,9 @@ Please ensure the directory exists and is writable. Underlying OS error: {:?}",
     setup_global_log_guards(file_guard, console_guard);
 
     // Success notice: tell users where logs are written.
-    let history_dir_for_print = log_path.join("history");
     println!(
-        "[fluxon] Logging initialized. base_dir={:?}, history_dir={:?}, instance_key='{}'",
-        log_path, history_dir_for_print, instance_key
+        "[fluxon] Logging initialized. base_dir={:?}, retention_days={}, current_file={:?}, instance_key='{}'",
+        log_path, LOG_RETENTION_DAYS, file_path, instance_key
     );
 }
 
diff --git a/fluxon_rs/fluxon_util/tests/log_mgmt.rs b/fluxon_rs/fluxon_util/tests/log_mgmt.rs
new file mode 100644
index 0000000..03de37c
--- /dev/null
+++ b/fluxon_rs/fluxon_util/tests/log_mgmt.rs
@@ -0,0 +1,120 @@
+use std::fs;
+use std::path::Path;
+use std::time::{Duration, SystemTime, UNIX_EPOCH};
+
+use fluxon_util::DEFAULT_DAILY_LOG_RETENTION_DAYS;
+use tempfile::TempDir;
+
+const TEST_LOG_SHARD_WINDOW_SECONDS_ENV: &str = "FLUXON_TEST_LOG_SHARD_WINDOW_SECONDS";
+const TEST_LOG_SHARD_ANCHOR_UNIX_SECONDS_ENV: &str = "FLUXON_TEST_LOG_SHARD_ANCHOR_UNIX_SECONDS";
+
+struct EnvVarGuard { // remembers what `Drop` needs to put an environment variable back
+    key: &'static str, // name of the variable that was overwritten
+    previous: Option<String>, // value read before the overwrite; None when that read failed
+}
+
+impl EnvVarGuard {
+    fn set(key: &'static str, value: impl Into<String>) -> Self { // overwrite `key`, keeping its old value for restore
+        let previous = std::env::var(key).ok(); // Err (unset or not valid Unicode) is stored as None
+        unsafe { // NOTE(review): mutates process-wide state shared with every other test thread
+            std::env::set_var(key, value.into());
+        }
+        Self { key, previous }
+    }
+}
+
+impl Drop for EnvVarGuard {
+    fn drop(&mut self) { // undo the overwrite done in `set`
+        match self.previous.as_deref() {
+            Some(value) => unsafe { // a value was recorded: write it back
+                std::env::set_var(self.key, value);
+            },
+            None => unsafe { // nothing recorded (also the non-Unicode case): remove the variable
+                std::env::remove_var(self.key);
+            },
+        }
+    }
+}
+
+fn count_service_shards(root: &Path, prefix: &str) -> usize { // count entries in `root` named `<prefix>….log`
+    fs::read_dir(root)
+        .expect("read log directory") // panics when `root` cannot be listed
+        .filter_map(|entry| entry.ok()) // unreadable directory entries are skipped
+        .map(|entry| entry.file_name().to_string_lossy().to_string())
+        .filter(|name| name.starts_with(prefix) && name.ends_with(".log")) // name match only; no file-type check
+        .count()
+}
+
+#[test]
+fn kv_log_shards_roll_and_cleanup_with_test_window() { // end-to-end: shard roll-over plus stale-shard removal
+    let temp_dir = TempDir::new().expect("create temp dir");
+    let log_path = temp_dir.path();
+    let instance_key = "log_mgmt_window";
+    let base_prefix = format!("fluxon-kv-{instance_key}");
+    let stale_path = log_path.join(format!("{base_prefix}.2025-12-01.log")); // shard asserted below to be gone
+    fs::write(&stale_path, "stale\n").expect("write stale shard");
+
+    let now = SystemTime::now()
+        .duration_since(UNIX_EPOCH)
+        .expect("unix epoch")
+        .as_secs() as i64;
+    let _window_guard = EnvVarGuard::set(TEST_LOG_SHARD_WINDOW_SECONDS_ENV, "10"); // guard restores the env on drop
+    let _anchor_guard = EnvVarGuard::set(TEST_LOG_SHARD_ANCHOR_UNIX_SECONDS_ENV, (now - 2).to_string()); // anchor 2 s in the past
+
+    fluxon_util::init_log(log_path, instance_key);
+    tracing::info!(target: "fluxon_util", "[kv-log-mgmt][phase=before] ts={}", now);
+    std::thread::sleep(Duration::from_millis(300));
+    std::thread::sleep(Duration::from_secs(11)); // 11 s exceeds the 10 s window configured above
+    let after_ts = SystemTime::now()
+        .duration_since(UNIX_EPOCH)
+        .expect("unix epoch")
+        .as_secs();
+    tracing::info!(target: "fluxon_util", "[kv-log-mgmt][phase=after] ts={after_ts}");
+    std::thread::sleep(Duration::from_millis(500)); // NOTE(review): presumably lets the non-blocking writer flush — confirm
+
+    let shard_1 = log_path.join(format!("{base_prefix}.2026-01-01.log")); // NOTE(review): dates look synthetic, derived from the test env vars — confirm in the writer
+    let shard_2 = log_path.join(format!("{base_prefix}.2026-01-02.log"));
+    assert!(shard_1.exists(), "missing shard: {}", shard_1.display());
+    assert!(shard_2.exists(), "missing shard: {}", shard_2.display());
+    assert!(
+        !stale_path.exists(),
+        "stale shard should be removed once retention cleanup runs"
+    );
+    assert_eq!(
+        count_service_shards(log_path, base_prefix.as_str()),
+        2,
+        "expected exactly two retained shard files within the synthetic test window"
+    );
+
+    let shard_1_text = fs::read_to_string(&shard_1).expect("read first shard");
+    let shard_2_text = fs::read_to_string(&shard_2).expect("read second shard");
+    assert!(
+        shard_1_text.contains("[kv-log-mgmt][phase=before]"),
+        "first shard should contain the before marker"
+    );
+    assert!(
+        !shard_1_text.contains("[kv-log-mgmt][phase=after]"),
+        "first shard should not contain the after marker"
+    );
+    assert!(
+        shard_2_text.contains("[kv-log-mgmt][phase=after]"),
+        "second shard should contain the after marker"
+    );
+    assert!(
+        !shard_2_text.contains("[kv-log-mgmt][phase=before]"),
+        "second shard should not contain the before marker"
+    );
+    assert_eq!(DEFAULT_DAILY_LOG_RETENTION_DAYS, 31); // pins the exported retention default
+}
+
+#[test]
+fn resolve_readable_log_path_ignores_plain_base_log_when_daily_shards_exist() { // a dated shard wins over the plain file
+    let temp_dir = TempDir::new().expect("create temp dir");
+    let base_path = temp_dir.path().join("startup.log");
+    fs::write(&base_path, "plain\n").expect("write base log"); // plain base file exists as a competing candidate
+    let shard_path = temp_dir.path().join("startup.2026-06-21.log");
+    fs::write(&shard_path, "shard\n").expect("write shard log");
+
+    let resolved = fluxon_util::resolve_readable_log_path(&base_path).expect("resolve readable log path");
+    assert_eq!(resolved, shard_path); // the shard, not `startup.log`, must be returned
+}
diff --git a/fluxon_test_stack/ci_2_virt_node.py b/fluxon_test_stack/ci_2_virt_node.py
index 28e9b82..7f91716 100644
--- a/fluxon_test_stack/ci_2_virt_node.py
+++ b/fluxon_test_stack/ci_2_virt_node.py
@@ -879,6 +879,8 @@ def main() -> int:
             sys.executable,
             str((REPO_ROOT / "fluxon_test_stack" / "pack_test_stack_rsc.py").resolve()),
             "--all-profiles",
+            "--release-dir",
+            str(release_dir),
             "-c",
             str(pack_metadata["suite_path"]),
         ]
diff --git a/fluxon_test_stack/ci_test_list.yaml b/fluxon_test_stack/ci_test_list.yaml
index e0e99c4..333ce3f 100644
--- a/fluxon_test_stack/ci_test_list.yaml
+++ b/fluxon_test_stack/ci_test_list.yaml
@@ -29,6 +29,14 @@ scenes:
       scales: [n1_kvowner_dram_20gib]
       profiles: [fluxon_tcp]
 
+  ci_top_attention_log_mgmt:
+    ci:
+      subject: rust
+      runtime_contract: rust_self_managed
+    select:
+      scales: [n1_kvowner_dram_20gib]
+      profiles: [fluxon_tcp]
+
   kv_read_heavy_zipf:
     test_stack:
       mode: KVSTORE
@@ -315,6 +323,8 @@ profiles:
             doc_site_base_url: example.com
           ci_top_attention_bin_kvtest:
             kv_test_rounds: all
+          ci_top_attention_log_mgmt:
+            enabled: true
         runtime_contracts:
           cluster_kv_owner: &cluster_kv_owner_runtime
             base_runtime:
@@ -460,6 +470,8 @@ profiles:
             doc_site_base_url: example.com
           ci_top_attention_bin_kvtest:
             kv_test_rounds: all
+          ci_top_attention_log_mgmt:
+            enabled: true
       test_stack:
         <<: *common_test_stack_runtime
   fluxon_sockudo_ws:
@@ -472,6 +484,8 @@ profiles:
             doc_site_base_url: example.com
           ci_top_attention_bin_kvtest:
             kv_test_rounds: all
+          ci_top_attention_log_mgmt:
+            enabled: true
       test_stack:
         <<: *common_test_stack_runtime
   fluxon_tcp:
@@ -484,6 +498,8 @@ profiles:
             doc_site_base_url: example.com
           ci_top_attention_bin_kvtest:
             kv_test_rounds: all
+          ci_top_attention_log_mgmt:
+            enabled: true
       test_stack:
         <<: *common_test_stack_runtime
   redis_sharded:
diff --git a/fluxon_test_stack/deployconf_testbed.yml b/fluxon_test_stack/deployconf_testbed.yml
index fe431de..552ce13 100644
--- a/fluxon_test_stack/deployconf_testbed.yml
+++ b/fluxon_test_stack/deployconf_testbed.yml
@@ -349,6 +349,9 @@ service:
         cluster_name: "${FLUXON_CLUSTER_NAME}"
         shared_memory_path: "${FLUXON_SHARED_MEM}"
         shared_file_path: "${FLUXON_SHARED_FILE}"
+        large_file_paths:
+          log_root_path: "${HOSTWORKDIR}/large/log/owner_${NODE_ID}"
+          cache_root_path: "${HOSTWORKDIR}/large/cache/owner_${NODE_ID}"
         sub_cluster: "owner"
       YAML
       ${HOSTWORKDIR}/venv/bin/python -m fluxon_py.runtime.start_owner_kvclient -c "${CONFIG_PATH}" -w "${WORKDIR}"
@@ -589,7 +592,7 @@ service:
         cluster_name: "${FLUXON_CLUSTER_NAME}"
         member_kind: kv
         output: web
-        http_listen_addr: "0.0.0.0:${MASTER__PORT}"
+        http_listen_addr: "0.0.0.0:${OPS_CONTROLLER__PORT}"
       YAML
 
       ${HOSTWORKDIR}/venv/bin/python -m fluxon_py.runtime.start_ops_controller -c "${WORKDIR}/ops_controller.yaml" -w "${WORKDIR}"
diff --git a/fluxon_test_stack/pack_test_stack_rsc.py b/fluxon_test_stack/pack_test_stack_rsc.py
index 9e80dea..e843a15 100644
--- a/fluxon_test_stack/pack_test_stack_rsc.py
+++ b/fluxon_test_stack/pack_test_stack_rsc.py
@@ -2,7 +2,6 @@
 from __future__ import annotations
 
 import argparse
-import fnmatch
 import hashlib
 import json
 import os
@@ -19,30 +18,28 @@
 import yaml
 
 REPO_ROOT = Path(__file__).resolve().parent.parent
-SCRIPTS_DIR = REPO_ROOT / "setup_and_pack"
-if str(SCRIPTS_DIR) not in sys.path:
-    sys.path.insert(0, str(SCRIPTS_DIR))
+SETUP_AND_PACK_DIR = REPO_ROOT / "setup_and_pack"
+setup_and_pack_dir_str = str(SETUP_AND_PACK_DIR)
+if setup_and_pack_dir_str in sys.path:
+    sys.path.remove(setup_and_pack_dir_str)
+sys.path.insert(0, setup_and_pack_dir_str)
+SCRIPTS_DIR = REPO_ROOT / "scripts"
+scripts_dir_str = str(SCRIPTS_DIR)
+if scripts_dir_str in sys.path:
+    sys.path.remove(scripts_dir_str)
+sys.path.insert(0, scripts_dir_str)
 
 import utils as script_utils
+from source_selection_profiles import (
+    SOURCE_SELECTION_PROFILE_SOURCE_PACK,
+    collect_source_profile_relpaths,
+    get_source_profile_source_roots,
+    source_profile_relpath_excluded,
+)
 
 
-CI_SOURCE_ROOT_NAMES: tuple[str, ...] = (".",)
-CI_SOURCE_COMMON_EXCLUDE_REL_PATHS: tuple[str, ...] = (
-    "__pycache__/",
-    ".pytest_cache/",
-    ".mypy_cache/",
-    ".ruff_cache/",
-    "*.swp",
-)
-CI_SOURCE_STAGE_EXCLUDE_PREFIXES: tuple[str, ...] = (
-    ".dever/",
-    "fluxon_release/",
-    "skills/",
-)
-CI_SOURCE_STAGE_EXCLUDE_NAMES: frozenset[str] = frozenset(
-    {
-        ".DS_Store",
-    }
+CI_SOURCE_ROOT_NAMES: tuple[str, ...] = get_source_profile_source_roots(
+    profile=SOURCE_SELECTION_PROFILE_SOURCE_PACK
 )
 PACKED_RUNTIME_ROOT_NAMES: tuple[str, ...] = (
     "bin",
@@ -86,18 +83,6 @@
     "mooncake",
 )
 RELEASE_MANIFEST_FILENAME = "fluxon_release.sha256"
-CI_SOURCE_DIGEST_IGNORED_DIR_NAMES = frozenset(
-    {
-        ".git",
-        "__pycache__",
-        ".pytest_cache",
-        ".mypy_cache",
-        ".ruff_cache",
-        "target",
-    }
-)
-CI_SOURCE_DIGEST_IGNORED_FILE_NAMES = frozenset()
-CI_SOURCE_DIGEST_IGNORED_FILE_SUFFIXES = (".pyc", ".swp", ".gitignore")
 DEFAULT_REDIS_BUILD_IMAGE = "quay.io/pypa/manylinux_2_28_x86_64"
 DEFAULT_REDIS_DOWNLOAD_URL_TEMPLATE = "https://download.redis.io/releases/redis-{version}.tar.gz"
 DEFAULT_REDIS_VERSION = "7.2.5"
@@ -121,11 +106,6 @@
     profile_id: transport_backend
     for transport_backend, profile_id in script_utils.TRANSPORT_PROFILE_IDS.items()
 }
-DEFAULT_RATHER_NO_GIT_SUBMODULE_CONFIG_RELPATH = Path(
-    "setup_and_pack/rather_no_git_submodule.yaml"
-)
-
-
 def main() -> int:
     script_utils.reset_stage_summary()
     try:
@@ -933,125 +913,13 @@ def _git_stage_ci_source_tree(*, repo_root: Path, stage_root: Path) -> list[str]
     return selected
 
 
-def _collect_git_listed_source_relpaths(
-    *,
-    repo_root: Path,
-    git_root: Path,
-    rel_prefix: str = "",
-) -> list[str]:
-    script_utils.require_cmd("git")
-    argv = [
-        "git",
-        "ls-files",
-        "--cached",
-        "--others",
-        "--exclude-standard",
-        "-z",
-    ]
-    raw = subprocess.check_output(argv, cwd=str(git_root))
-    selected: list[str] = []
-    rel_prefix = rel_prefix.strip("/")
-    for entry in raw.split(b"\0"):
-        if not entry:
-            continue
-        rel = entry.decode("utf-8").strip()
-        if not rel:
-            continue
-        repo_rel = rel if not rel_prefix else f"{rel_prefix}/{rel}"
-        if _ci_source_relpath_excluded(repo_rel):
-            continue
-        src_path = (repo_root / repo_rel).resolve()
-        if not src_path.exists():
-            continue
-        selected.append(repo_rel)
-    return selected
-
-
-def _load_rather_no_git_submodule_source_roots(
-    *,
-    repo_root: Path,
-) -> tuple[tuple[str, Path], ...]:
-    config_path = (repo_root / DEFAULT_RATHER_NO_GIT_SUBMODULE_CONFIG_RELPATH).resolve()
-    if not config_path.exists():
-        return ()
-    raw_cfg = _load_yaml_file(config_path)
-    if raw_cfg is None:
-        return ()
-    if not isinstance(raw_cfg, dict):
-        raise RuntimeError(
-            "rather_no_git_submodule config must be a YAML mapping: "
-            f"{config_path}"
-        )
-    raw_modules = raw_cfg.get("modules")
-    if raw_modules is None:
-        return ()
-    if not isinstance(raw_modules, list):
-        raise RuntimeError(
-            "rather_no_git_submodule config `modules` must be a list: "
-            f"{config_path}"
-        )
-
-    repo_root = repo_root.resolve()
-    selected: list[tuple[str, Path]] = []
-    seen_relpaths: set[str] = set()
-    for index, raw_item in enumerate(raw_modules):
-        if not isinstance(raw_item, dict):
-            raise RuntimeError(
-                "rather_no_git_submodule config entries must be mappings: "
-                f"{config_path} modules[{index}]"
-            )
-        raw_path = raw_item.get("path")
-        if not isinstance(raw_path, str) or not raw_path.strip():
-            raise RuntimeError(
-                "rather_no_git_submodule config path must be a non-empty string: "
-                f"{config_path} modules[{index}].path"
-            )
-        rel_path = Path(raw_path.strip())
-        if rel_path.is_absolute() or ".." in rel_path.parts:
-            raise RuntimeError(
-                "rather_no_git_submodule config path must stay within the repo root: "
-                f"{config_path} modules[{index}].path={raw_path!r}"
-            )
-        relpath = rel_path.as_posix()
-        if relpath in seen_relpaths:
-            continue
-        seen_relpaths.add(relpath)
-        module_root = (repo_root / rel_path).resolve()
-        if module_root != repo_root and repo_root not in module_root.parents:
-            raise RuntimeError(
-                "rather_no_git_submodule config path escapes the repo root: "
-                f"{config_path} modules[{index}].path={raw_path!r}"
-            )
-        if not module_root.is_dir():
-            raise RuntimeError(
-                "CI source pack requires configured rather_no_git_submodule path to exist as a directory: "
-                f"path={relpath} resolved={module_root}"
-            )
-        selected.append((relpath, module_root))
-    return tuple(selected)
-
-
 def _collect_ci_source_relpaths(*, repo_root: Path) -> list[str]:
-    repo_root = repo_root.resolve()
-    selected = set(
-        _collect_git_listed_source_relpaths(
-            repo_root=repo_root,
-            git_root=repo_root,
+    return list(  # selection is delegated to collect_source_profile_relpaths for the source-pack profile
+        collect_source_profile_relpaths(  # NOTE(review): removed code sorted and raised on empty; confirm the helper does too
+            repo_root=repo_root.resolve(),
+            profile=SOURCE_SELECTION_PROFILE_SOURCE_PACK,
         )
     )
-    for relpath, module_root in _load_rather_no_git_submodule_source_roots(
-        repo_root=repo_root
-    ):
-        selected.update(
-            _collect_git_listed_source_relpaths(
-                repo_root=repo_root,
-                git_root=module_root,
-                rel_prefix=relpath,
-            )
-        )
-    if not selected:
-        raise RuntimeError("git-based CI source selection produced no files")
-    return sorted(selected)
 
 
 def _compute_ci_source_digest(*, repo_root: Path) -> str:
@@ -1060,16 +928,17 @@ def _compute_ci_source_digest(*, repo_root: Path) -> str:
         relative_to=repo_root,
         mode=script_utils.PathDigestMode.PACK_INPUTS,
         algorithm=script_utils.PathHashAlgorithm.SHA256,
-        ignored_dir_names=CI_SOURCE_DIGEST_IGNORED_DIR_NAMES,
-        ignored_file_names=CI_SOURCE_DIGEST_IGNORED_FILE_NAMES,
-        ignored_file_suffixes=CI_SOURCE_DIGEST_IGNORED_FILE_SUFFIXES,
+        ignored_dir_names=(),
+        ignored_file_names=(),
+        ignored_file_suffixes=(),
     )
 
 
 def _ci_source_relpath_excluded(relpath: str) -> bool:
-    if relpath in CI_SOURCE_STAGE_EXCLUDE_NAMES:
-        return True
-    return any(relpath == prefix.rstrip("/") or relpath.startswith(prefix) for prefix in CI_SOURCE_STAGE_EXCLUDE_PREFIXES)
+    return source_profile_relpath_excluded(  # exclusion decision is delegated to the source-pack profile helper
+        profile=SOURCE_SELECTION_PROFILE_SOURCE_PACK,
+        relpath=relpath,
+    )
 
 
 def _pack_ci_ext_rsc(*, repo_root: Path, out_path: Path) -> None:
@@ -1110,8 +979,8 @@ def build_tarball() -> None:
                         src=src,
                         dst=packed_stage_root / rel_name,
                         honor_gitignore=False,
+                        exclude_rel_paths=PACKED_RUNTIME_EXCLUDE_REL_PATHS,
                     )
-                _prune_stage_paths(packed_stage_root, PACKED_RUNTIME_EXCLUDE_REL_PATHS)
                 script_utils.tar_gz(
                     cwd=stage_root,
                     out_path=out_path,
@@ -1148,7 +1017,7 @@ def _stage_repo_test_rsc_tree(*, repo_test_rsc_root: Path, out_dir: Path) -> Non
         else:
             dst.parent.mkdir(parents=True, exist_ok=True)
             shutil.copy2(src, dst)
-    _prune_stage_paths(out_dir, TEST_RSC_REPO_TREE_EXCLUDE_REL_PATHS)
+    script_utils.prune_stage_paths(out_dir, TEST_RSC_REPO_TREE_EXCLUDE_REL_PATHS)
 
 
 def _release_shared_baselines_root(*, release_dir: Path) -> Path:
@@ -1179,7 +1048,7 @@ def _stage_release_shared_baselines_into_root(*, release_dir: Path, prepared_roo
     if baselines_dst.exists():
         raise RuntimeError(f"prepared test_rsc baselines path already exists before release authority stage: {baselines_dst}")
     shutil.copytree(shared_baselines_root, baselines_dst, dirs_exist_ok=False)
-    _prune_stage_paths(baselines_dst, TEST_RSC_REPO_TREE_EXCLUDE_REL_PATHS)
+    script_utils.prune_stage_paths(baselines_dst, TEST_RSC_REPO_TREE_EXCLUDE_REL_PATHS)
 
 
 def _stage_canonical_profile_prepared_resources_into_root(*, profile_id: str, prepared_root: Path) -> None:
@@ -1206,7 +1075,7 @@ def _stage_canonical_profile_prepared_resources_into_root(*, profile_id: str, pr
         else:
             dst.parent.mkdir(parents=True, exist_ok=True)
             shutil.copy2(src, dst)
-        _prune_stage_paths(dst, TEST_RSC_REPO_TREE_EXCLUDE_REL_PATHS)
+        script_utils.prune_stage_paths(dst, TEST_RSC_REPO_TREE_EXCLUDE_REL_PATHS)
 
 
 def _stage_prepared_test_rsc(*, prepared_root: Path, out_dir: Path) -> None:
@@ -1220,7 +1089,7 @@ def _stage_prepared_test_rsc(*, prepared_root: Path, out_dir: Path) -> None:
         else:
             dst.parent.mkdir(parents=True, exist_ok=True)
             shutil.copy2(src, dst)
-    _prune_stage_paths(out_dir, TEST_RSC_REPO_TREE_EXCLUDE_REL_PATHS)
+    script_utils.prune_stage_paths(out_dir, TEST_RSC_REPO_TREE_EXCLUDE_REL_PATHS)
 
 
 def _prepare_baselines_into_root(
@@ -1249,7 +1118,7 @@ def _prepare_baselines_into_root(
             dir_source=dir_source,
             archive_source=archive_source,
         )
-    _prune_stage_paths(prepared_root, TEST_RSC_REPO_TREE_EXCLUDE_REL_PATHS)
+    script_utils.prune_stage_paths(prepared_root, TEST_RSC_REPO_TREE_EXCLUDE_REL_PATHS)
 
 
 def _prepare_configured_test_rsc_resources_into_root(
@@ -1276,7 +1145,7 @@ def _prepare_configured_test_rsc_resources_into_root(
             scratch_root=scratch_root,
             mooncake_cfg=mooncake_cfg_raw,
         )
-    _prune_stage_paths(prepared_root, TEST_RSC_REPO_TREE_EXCLUDE_REL_PATHS)
+    script_utils.prune_stage_paths(prepared_root, TEST_RSC_REPO_TREE_EXCLUDE_REL_PATHS)
 
 
 def _prepare_python_runtime_wheelhouse_into_root(
@@ -1786,7 +1655,7 @@ def _sync_prepared_baselines_into_release_tree(*, prepared_root: Path, release_d
     release_shared_baselines_root.parent.mkdir(parents=True, exist_ok=True)
     _remove_path(release_shared_baselines_root)
     shutil.copytree(prepared_baselines_root, release_shared_baselines_root, dirs_exist_ok=False)
-    _prune_stage_paths(release_shared_baselines_root, TEST_RSC_REPO_TREE_EXCLUDE_REL_PATHS)
+    script_utils.prune_stage_paths(release_shared_baselines_root, TEST_RSC_REPO_TREE_EXCLUDE_REL_PATHS)
 
 
 def _extract_bundle_archive(*, archive_path: Path, out_dir: Path, expected_root_name: str) -> None:
@@ -1814,62 +1683,6 @@ def _remove_path(path: Path) -> None:
     path.unlink()
 
 
-def _rsync_stage_filtered(
-    *,
-    repo_root: Path,
-    src: Path,
-    dst: Path,
-    honor_gitignore: bool,
-    exclude_rel_paths: tuple[str, ...] = (),
-) -> None:
-    if not exclude_rel_paths:
-        script_utils.rsync_stage(
-            repo_root=repo_root,
-            src=src,
-            dst=dst,
-            honor_gitignore=honor_gitignore,
-        )
-        return
-
-    if not src.exists():
-        raise RuntimeError(f"missing required source path for staging: {src}")
-    if dst.exists():
-        raise RuntimeError(f"staging destination already exists (no overwrite): {dst}")
-    if shutil.which("rsync") is None:
-        raise RuntimeError("rsync is required for filtered staging, but was not found in PATH")
-
-    dst.parent.mkdir(parents=True, exist_ok=True)
-    argv = ["rsync", "-a"]
-    if honor_gitignore:
-        argv += [
-            "--exclude=.git/",
-            "--exclude-from=.gitignore",
-            "--filter=:- .gitignore",
-        ]
-    for pattern in exclude_rel_paths:
-        argv.append(f"--exclude={pattern}")
-    if src.is_dir():
-        argv += [str(src) + "/", str(dst) + "/"]
-    else:
-        argv += [str(src), str(dst)]
-    subprocess.check_call(argv, cwd=str(repo_root))
-
-
-def _prune_stage_paths(stage_root: Path, exclude_rel_paths: tuple[str, ...]) -> None:
-    if not stage_root.exists():
-        return
-    for path in sorted(stage_root.rglob("*"), reverse=True):
-        rel_path = path.relative_to(stage_root).as_posix()
-        for pattern in exclude_rel_paths:
-            normalized_pattern = pattern.rstrip("/")
-            if fnmatch.fnmatch(rel_path, normalized_pattern) or fnmatch.fnmatch(path.name, normalized_pattern):
-                if path.is_dir():
-                    shutil.rmtree(path)
-                else:
-                    path.unlink(missing_ok=True)
-                break
-
-
 def _test_rsc_manifest_file_list(*, out_dir: Path, prepared_root: Path) -> list[Path]:
     files: list[Path] = []
     for fixed_name in ("src_ci.tar.gz", "fluxon_ci_ext_rsc.tar.gz"):
diff --git a/fluxon_test_stack/start_test_bed.py b/fluxon_test_stack/start_test_bed.py
index 79f7bcd..7c3f22a 100644
--- a/fluxon_test_stack/start_test_bed.py
+++ b/fluxon_test_stack/start_test_bed.py
@@ -7,6 +7,7 @@
 import fcntl
 import json
 import os
+import re
 import subprocess
 import sys
 import time
@@ -24,6 +25,7 @@
 DEPLOYMENT_DIR = REPO_ROOT / "deployment"
 sys.path.insert(0, str(DEPLOYMENT_DIR))
 import manual_dispatch_release
+from utils import log_shard
 from utils.selection_runtime import (
     atomic_group_member_authority_name as _selection_atomic_group_member_authority_name,
     atomic_group_member_selection_workload_name as _selection_atomic_group_member_selection_workload_name,
@@ -432,11 +434,12 @@ def main() -> None:
             waves=coverage_bootstrap_waves,
             bootstrap_bare_services=bootstrap_bare_services,
         )
-    _wait_controller_ready_stable(
-        controller_url=controller_url,
-        timeout_seconds=controller_ready_timeout_seconds,
-        stability_window_seconds=bootstrap_stability_window_seconds,
-    )
+    if bootstrap_mode in (BOOTSTRAP_MODE_BARE_THEN_APPLY, BOOTSTRAP_MODE_BARE_ONLY):
+        _wait_controller_ready_stable(
+            controller_url=controller_url,
+            timeout_seconds=controller_ready_timeout_seconds,
+            stability_window_seconds=bootstrap_stability_window_seconds,
+        )
     test_runner_ui_summary = _ensure_test_runner_ui_started(ui_cfg=test_runner_ui_cfg)
     if bootstrap_mode == BOOTSTRAP_MODE_BARE_THEN_APPLY:
         post_bootstrap_agent_instance_keys = _selection_agent_instance_keys(
@@ -764,6 +767,9 @@ def _normalize_bootstrap_deployconf(
     if isinstance(master_cfg, dict):
         entrypoint = master_cfg.get("entrypoint")
         if isinstance(entrypoint, str):
+            master_port = _extract_master_listen_port(entrypoint=entrypoint)
+            if master_port is not None:
+                _set_service_port(master_cfg, port=master_port)
             normalized_entrypoint, removed = _strip_legacy_master_p2p_listen_port(entrypoint=entrypoint)
             if removed:
                 master_cfg["entrypoint"] = normalized_entrypoint
@@ -843,6 +849,7 @@ def _rewrite_same_host_local_multi_node_fixed_ports(
     _set_service_port(greptime_cfg, port=plan["greptime_port"])
     _set_service_port(tikv_pd_cfg, port=plan["tikv_pd_port"])
     _set_service_port(tikv_cfg, port=plan["tikv_port"])
+    _set_service_port(master_cfg, port=plan["master_port"])
 
     etcd_entrypoint = _require_str(etcd_cfg.get("entrypoint"), "deployconf.service.etcd.entrypoint")
     etcd_entrypoint = _replace_expected_substring(
@@ -972,6 +979,13 @@ def _set_service_port(service_cfg: dict[str, Any], *, port: int) -> None:
         service_cfg["in_container_port"] = int(port)
 
 
+def _extract_master_listen_port(*, entrypoint: str) -> int | None:  # first "port: <digits>" line of the entrypoint text
+    match = re.search(r"(?m)^[ \t]*port:\s*(\d+)\s*$", entrypoint)  # (?m): ^/$ match per line; \s may also span a newline
+    if match is None:
+        return None  # no such line in the entrypoint
+    return _require_port_number(match.group(1), "deployconf.service.master.entrypoint port")  # digits are handed over as a string
+
+
 def _replace_expected_substring(*, value: str, old: str, new: str, ctx: str) -> str:
     if old in value:
         return value.replace(old, new)
@@ -1398,7 +1412,7 @@ def _test_runner_ui_summary_from_cfg(
         "url": ui_cfg["url"],
         "probe_url": ui_cfg["probe_url"],
         "workdir": str(ui_cfg["workdir"]),
-        "log_path": str(ui_cfg["log_path"]),
+        "log_path": str(ui_cfg["active_log_path"]),
         "history_lookback_days": int(ui_cfg["history_lookback_days"]),
         "history_roots": [str(path) for path in ui_cfg["history_roots"]],
         "gitops_config_path": (
@@ -1459,7 +1473,8 @@ def _parse_test_runner_ui_config(
             _require_str(ui_cfg.get("gitops_config_path"), "test_runner_ui.gitops_config_path"),
             "test_runner_ui.gitops_config_path",
         )
-    log_path = (workdir / TEST_RUNNER_UI_LOG_FILENAME).resolve()
+    log_path = (workdir.resolve() / TEST_RUNNER_UI_LOG_FILENAME).resolve()
+    active_log_path = log_shard.daily_sharded_log_path(log_path)
     return {
         "enabled": True,
         "host": host,
@@ -1468,6 +1483,7 @@ def _parse_test_runner_ui_config(
         "probe_url": _test_runner_ui_probe_url(host=host, port=port),
         "workdir": workdir.resolve(),
         "log_path": log_path,
+        "active_log_path": active_log_path,
         "history_lookback_days": int(history_lookback_days),
         "history_roots": [path.resolve() for path in history_roots],
         "gitops_config_path": gitops_config_path.resolve() if gitops_config_path is not None else None,
@@ -1588,7 +1604,7 @@ def _ensure_test_runner_ui_started(*, ui_cfg: dict[str, Any]) -> dict[str, Any]:
     if ui_cfg["gitops_config_path"] is not None:
         argv.extend(["--gitops-config", str(ui_cfg["gitops_config_path"])])
 
-    log_path = Path(ui_cfg["log_path"]).resolve()
+    log_path = Path(ui_cfg["active_log_path"]).resolve()
     log_path.parent.mkdir(parents=True, exist_ok=True)
     log_handle = log_path.open("a", encoding="utf-8")
     try:
diff --git a/fluxon_test_stack/test_runner.py b/fluxon_test_stack/test_runner.py
index e31d500..f3344b8 100644
--- a/fluxon_test_stack/test_runner.py
+++ b/fluxon_test_stack/test_runner.py
@@ -37,6 +37,11 @@
 
 import yaml
 
+RUNNER_REPO_ROOT = Path(__file__).resolve().parent.parent
+RUNNER_DEPLOYMENT_DIR = RUNNER_REPO_ROOT / "deployment"
+RUNNER_TEMPLATE_DIR = (RUNNER_REPO_ROOT / "fluxon_test_stack" / "test_runner_templates").resolve()
+sys.path.insert(0, str(RUNNER_DEPLOYMENT_DIR))
+
 from benchmark_role_names import (
     KV_NODE_ROLE_SEED,
     KV_NODE_ROLE_WORKER,
@@ -51,6 +56,7 @@
     run_top_attention_entries,
     select_top_attention_entries,
 )
+from utils import log_shard
 
 
 # NOTE: This project uses multiple schemas:
@@ -277,10 +283,10 @@ def _test_stack_mode_requires_kv_master(mode: str) -> bool:
     "workloads may still be stopping",
 )
 _WAIT_DELETE_APPLY_REQUIRES_DELETE_ERR = "wait_delete_apply requires delete_apply first"
-RUNNER_REPO_ROOT = Path(__file__).resolve().parent.parent
 RUNNER_SHARED_RUNTIME_DIR = (RUNNER_REPO_ROOT / "fluxon_test_stack" / "test_runner").resolve()
 RUNNER_SHARED_LOCK_DIR = (RUNNER_SHARED_RUNTIME_DIR / "locks").resolve()
 RUNNER_STDIO_LOG_FILENAME = "test_runner.log"
+_SERVICE_LOG_RETENTION_DAYS = log_shard.DEFAULT_DAILY_LOG_RETENTION_DAYS
 _ACTIVE_TEST_BED_SELECTION_SUPERVISOR_CHECK_CACHE_KEY: Optional[str] = None
 
 # TEST_STACK coordinator uses a stable workload name across cases; if a previous run crashed
@@ -349,6 +355,7 @@ def _runner_native_ci_scene_ids() -> Tuple[str, ...]:
     return (
         "ci_top_attention_doc_page_build",
         "ci_top_attention_bin_kvtest",
+        "ci_top_attention_log_mgmt",
     )
 
 
@@ -402,6 +409,7 @@ def _scene_id_uses_runner_native_ci_commands(scene_id: str) -> bool:
 _RUNNER_STDIO_LOG_FP: Optional[Any] = None
 _RUNNER_STDIO_KEEPALIVE_FDS: Optional[Tuple[int, int]] = None
 _RUNNER_STDIO_MIRROR_THREAD: Optional[threading.Thread] = None
+_RUNNER_STDIO_ROUTER_THREAD: Optional[threading.Thread] = None
 _CI_WAIT_HEARTBEAT_INTERVAL_SECONDS = 15.0
 _CI_WAIT_TAIL_MAX_CHARS = 8000
 _TEST_RUNNER_UI_MAX_LOG_CHUNK_BYTES = 1024 * 1024
@@ -434,17 +442,65 @@ def _ci_log_prefix_lines(text: str, *, now: Optional[float] = None) -> str:
     return "".join(f"{prefix} {line}" if line.strip() else line for line in lines)
 
 
+def _service_log_base_path(workdir_root: Path, *, filename: str) -> Path:  # resolved path of <workdir_root>/<filename>
+    return (workdir_root / filename).resolve()
+
+
+def _service_log_daily_path(base_path: Path, *, now: Optional[datetime.datetime] = None) -> Path:  # thin wrapper over log_shard
+    return log_shard.daily_sharded_log_path(base_path, now=now)  # presumably the shard for `now` (today when None) - see log_shard
+
+
+def _service_log_latest_path(base_path: Path) -> Optional[Path]:  # thin wrapper over log_shard; the result may be None
+    return log_shard.latest_existing_daily_sharded_log_path(base_path)
+
+
+def _service_log_resolve_read_path(workdir_root: Path, *, filename: str) -> Optional[Path]:
+    """Resolve the readable log path for *filename* under *workdir_root*; the result may be None."""
+    return _service_log_resolve_read_path_from_base(_service_log_base_path(workdir_root, filename=filename))
+
+
+def _service_log_resolve_read_path_from_base(base_path: Path) -> Optional[Path]:  # thin wrapper over log_shard; the result may be None
+    return log_shard.resolve_readable_log_path(base_path)
+
+
+def _cleanup_old_service_logs(base_path: Path, *, retention_days: int = _SERVICE_LOG_RETENTION_DAYS) -> None:  # delegates cleanup to log_shard
+    log_shard.cleanup_old_daily_sharded_logs(base_path, retention_days=retention_days)
+
+
+def _start_runner_stdio_log_router(*, base_log_path: Path, read_fd: int) -> None:
+    """Start a daemon thread that hands *read_fd* to ``log_shard.relay_fd_to_daily_sharded_logs``."""
+    global _RUNNER_STDIO_ROUTER_THREAD
+    # The thread object is stored in the module global only after it has been started.
+    relay_thread = threading.Thread(
+        target=log_shard.relay_fd_to_daily_sharded_logs,
+        kwargs={
+            "base_log_path": str(base_log_path),
+            "read_fd": read_fd,
+            "retention_days": _SERVICE_LOG_RETENTION_DAYS,
+        },
+        name="test-runner-stdio-log-router",
+        daemon=True,
+    )
+    relay_thread.start()
+    _RUNNER_STDIO_ROUTER_THREAD = relay_thread
+
+
 def _start_runner_stdio_log_mirror(*, log_path: Path, stdout_fd: int) -> None:
     def _mirror_loop() -> None:
         offset = 0
+        current_path: Optional[Path] = None
         while True:
             try:
-                if log_path.exists():
-                    size = log_path.stat().st_size
+                resolved_path = _service_log_resolve_read_path_from_base(log_path)
+                if isinstance(resolved_path, Path) and resolved_path.exists():
+                    if current_path != resolved_path:
+                        current_path = resolved_path
+                        offset = 0
+                    size = resolved_path.stat().st_size
                     if size < offset:
                         offset = 0
                     if size > offset:
-                        with log_path.open("r", encoding="utf-8", errors="replace") as fp:
+                        with resolved_path.open("r", encoding="utf-8", errors="replace") as fp:
                             fp.seek(offset)
                             chunk = fp.read()
                             offset = fp.tell()
@@ -469,7 +525,11 @@ def _mirror_loop() -> None:
     _RUNNER_STDIO_MIRROR_THREAD = mirror
 
 
-def _redirect_process_stdio_to_log(workdir_root: Path) -> None:
+def _redirect_process_stdio_to_log(
+    workdir_root: Path,
+    *,
+    filename: str = RUNNER_STDIO_LOG_FILENAME,
+) -> None:
     """Route runner stdio to a stable workdir log so long suites survive PTY loss.
 
     English note:
@@ -481,10 +541,13 @@ def _redirect_process_stdio_to_log(workdir_root: Path) -> None:
     """
     global _RUNNER_STDIO_LOG_FP
     global _RUNNER_STDIO_KEEPALIVE_FDS
+    global _RUNNER_STDIO_ROUTER_THREAD
     if _RUNNER_STDIO_LOG_FP is not None:
         return
 
-    log_path = (workdir_root / RUNNER_STDIO_LOG_FILENAME).resolve()
+    base_log_path = _service_log_base_path(workdir_root, filename=filename)
+    _cleanup_old_service_logs(base_log_path)
+    log_path = _service_log_daily_path(base_log_path)
     log_fp = log_path.open("a", encoding="utf-8", buffering=1)
     banner = (
         f"{_ci_log_timestamp_prefix()} [test_runner] redirecting process stdio to stable log: {log_path}\n"
@@ -519,15 +582,26 @@ def _redirect_process_stdio_to_log(workdir_root: Path) -> None:
         except OSError:
             _RUNNER_STDIO_KEEPALIVE_FDS = (-1, -1)
 
-    os.dup2(log_fp.fileno(), sys.stdout.fileno())
-    os.dup2(log_fp.fileno(), sys.stderr.fileno())
+    read_fd, write_fd = os.pipe()
+    router_keepalive = os.dup(write_fd)
+    _start_runner_stdio_log_router(base_log_path=base_log_path, read_fd=read_fd)
+    os.dup2(write_fd, sys.stdout.fileno())
+    os.dup2(write_fd, sys.stderr.fileno())
     sys.stdout = os.fdopen(sys.stdout.fileno(), "w", encoding="utf-8", buffering=1, closefd=False)
     sys.stderr = os.fdopen(sys.stderr.fileno(), "w", encoding="utf-8", buffering=1, closefd=False)
-    _RUNNER_STDIO_LOG_FP = log_fp
+    try:
+        os.close(write_fd)
+    except OSError:
+        pass
+    try:
+        log_fp.close()
+    except OSError:
+        pass
+    _RUNNER_STDIO_LOG_FP = os.fdopen(router_keepalive, "w", encoding="utf-8", buffering=1)
     if _runner_stdio_mirror_enabled():
         keepalive = _RUNNER_STDIO_KEEPALIVE_FDS or (-1, -1)
         _start_runner_stdio_log_mirror(
-            log_path=log_path,
+            log_path=base_log_path,
             stdout_fd=int(keepalive[0]),
         )
 
@@ -2919,105 +2993,17 @@ def _write_deployer_manifests(resolved_case: Dict[str, Any], run_dir: Path, *, a
             orig_argv = [cmd0] + args
             exec_cmd = " ".join(_shell_quote(x) for x in orig_argv)
 
-            # Generate a self-contained SigV4 GET downloader (Fluxon FS S3 gateway) and then exec the original argv.
-            bash_script = (
-                "set -euo pipefail\n"
-                "python3 - <<'PY'\n"
-                "import datetime\n"
-                "import hashlib\n"
-                "import hmac\n"
-                "import os\n"
-                "import urllib.parse\n"
-                "import urllib.request\n"
-                "from pathlib import Path\n"
-                "\n"
-                f"BASE_URL = {s3_base_url!r}\n"
-                f"BUCKET = {s3_bucket!r}\n"
-                f"OBJECT_KEY = {object_key!r}\n"
-                f"DEST_PATH = {payload_dest_path_s!r}\n"
-                f"ACCESS_KEY = {s3_access_key!r}\n"
-                f"SECRET_KEY = {s3_secret_key!r}\n"
-                f"REGION = {s3_region!r}\n"
-                "\n"
-                "ALG = 'AWS4-HMAC-SHA256'\n"
-                "SERVICE = 's3'\n"
-                "TERM = 'aws4_request'\n"
-                "UNSIGNED = 'UNSIGNED-PAYLOAD'\n"
-                "\n"
-                "def _hmac_sha256(key: bytes, msg: bytes) -> bytes:\n"
-                "    return hmac.new(key, msg, hashlib.sha256).digest()\n"
-                "\n"
-                "def _sha256_hex(msg: bytes) -> str:\n"
-                "    return hashlib.sha256(msg).hexdigest()\n"
-                "\n"
-                "def _derive_signing_key(secret_key: str, scope_date: str, region: str) -> bytes:\n"
-                "    k_date = _hmac_sha256(('AWS4' + secret_key).encode('utf-8'), scope_date.encode('utf-8'))\n"
-                "    k_region = _hmac_sha256(k_date, region.encode('utf-8'))\n"
-                "    k_service = _hmac_sha256(k_region, SERVICE.encode('utf-8'))\n"
-                "    return _hmac_sha256(k_service, TERM.encode('utf-8'))\n"
-                "\n"
-                "def _sigv4_headers(*, method: str, signing_path: str, query: str, host: str, scope_date: str, amz_date: str, payload_hash: str) -> dict:\n"
-                "    signed_headers = 'host;x-amz-content-sha256;x-amz-date'\n"
-                "    canonical_headers = ''\n"
-                "    canonical_headers += f'host:{host}\\n'\n"
-                "    canonical_headers += f'x-amz-content-sha256:{payload_hash}\\n'\n"
-                "    canonical_headers += f'x-amz-date:{amz_date}\\n'\n"
-                "    canonical_request = '\\n'.join([method, signing_path, query, canonical_headers, signed_headers, payload_hash])\n"
-                "    cr_hash = _sha256_hex(canonical_request.encode('utf-8'))\n"
-                "    scope = f'{scope_date}/{REGION}/{SERVICE}/{TERM}'\n"
-                "    string_to_sign = '\\n'.join([ALG, amz_date, scope, cr_hash])\n"
-                "    signing_key = _derive_signing_key(SECRET_KEY, scope_date, REGION)\n"
-                "    sig = hmac.new(signing_key, string_to_sign.encode('utf-8'), hashlib.sha256).hexdigest()\n"
-                "    auth = f\"{ALG} Credential={ACCESS_KEY}/{scope}, SignedHeaders={signed_headers}, Signature={sig}\"\n"
-                "    return {\n"
-                "        'Authorization': auth,\n"
-                "        'x-amz-date': amz_date,\n"
-                "        'x-amz-content-sha256': payload_hash,\n"
-                "        'Host': host,\n"
-                "    }\n"
-                "\n"
-                "u = urllib.parse.urlparse(BASE_URL)\n"
-                "if u.scheme not in ('http', 'https'):\n"
-                "    raise ValueError('BASE_URL must be http(s)')\n"
-                "if not u.netloc:\n"
-                "    raise ValueError('BASE_URL missing host')\n"
-                "base_path = u.path.rstrip('/')\n"
-                "if base_path == '':\n"
-                "    raise ValueError('BASE_URL must include a non-root path prefix (e.g. /fs_s3)')\n"
-                "\n"
-                "bucket_enc = urllib.parse.quote(BUCKET, safe='-_.~')\n"
-                "key_enc = urllib.parse.quote(OBJECT_KEY, safe='/-_.~')\n"
-                "full_path = base_path + '/' + bucket_enc + '/' + key_enc\n"
-                # Sign the *actual* client-visible request path (including s3_base_url path prefix, e.g. "/fs_s3").
-                "signing_path = full_path\n"
-                "url = f'{u.scheme}://{u.netloc}{full_path}'\n"
-                "\n"
-                "now = datetime.datetime.utcnow()\n"
-                "amz_date = now.strftime('%Y%m%dT%H%M%SZ')\n"
-                "scope_date = now.strftime('%Y%m%d')\n"
-                "hdrs = _sigv4_headers(method='GET', signing_path=signing_path, query='', host=u.netloc, scope_date=scope_date, amz_date=amz_date, payload_hash=UNSIGNED)\n"
-                "\n"
-                "dest = Path(DEST_PATH)\n"
-                "dest.parent.mkdir(parents=True, exist_ok=True)\n"
-                "tmp = Path(str(dest) + '.tmp')\n"
-                "if tmp.exists():\n"
-                "    tmp.unlink()\n"
-                "req = urllib.request.Request(url, method='GET')\n"
-                "for k, v in hdrs.items():\n"
-                "    req.add_header(k, v)\n"
-                "with urllib.request.urlopen(req, timeout=60) as resp:\n"
-                "    if getattr(resp, 'status', None) != 200:\n"
-                "        body = resp.read(4096)\n"
-                "        raise RuntimeError(f'download failed: status={getattr(resp, \"status\", None)} body={body!r}')\n"
-                "    with tmp.open('wb') as f:\n"
-                "        while True:\n"
-                "            b = resp.read(1024 * 1024)\n"
-                "            if not b:\n"
-                "                break\n"
-                "            f.write(b)\n"
-                "tmp.replace(dest)\n"
-                "PY\n"
-                f"exec {exec_cmd}\n"
+            # Keep the remote wrapper self-contained, but store it as a standalone template
+            # instead of hardcoding a long inline script in this Python source file.
+            bash_script = _render_fluxon_fs_s3_payload_wrapper(
+                s3_base_url=s3_base_url,
+                s3_bucket=s3_bucket,
+                object_key=object_key,
+                payload_dest_path=payload_dest_path_s,
+                s3_access_key=s3_access_key,
+                s3_secret_key=s3_secret_key,
+                s3_region=s3_region,
+                exec_cmd=exec_cmd,
             )
 
             # Deployer only consumes argv/cwd; container image is required by the YAML subset parser
@@ -7670,6 +7656,18 @@ def _runner_native_ci_commands_for_case(case: _ResolvedCase, *, ctx: str) -> Lis
                 "timeout_seconds": 21600,
             }
         ]
+    if scene_id == "ci_top_attention_log_mgmt":
+        return [
+            {
+                "id": "top_attention_log_mgmt",
+                "command": (
+                    "__RUN_DIR__/venv/bin/python3 -u "
+                    "__RUN_DIR__/src/fluxon_test_stack/top_attention_test_index/_log_mgmt.py "
+                    "--case-config __RUN_DIR__/configs/ci_scene_config.yaml"
+                ),
+                "timeout_seconds": 21600,
+            }
+        ]
     raise ValueError(f"{ctx} unsupported runner-native CI scene: {scene_id!r}")
 
 
@@ -12251,6 +12249,51 @@ def _shell_quote(s: str) -> str:
     return "'" + s.replace("'", "'\\''") + "'"
 
 
+def _json_string_literal(value: str) -> str:  # quoted, ASCII-only JSON string for *value*
+    return json.dumps(value, ensure_ascii=True)  # NOTE(review): non-BMP chars are emitted as \ud83d\ude00-style surrogate pairs; pasted into Python source (as the payload template does) that is two lone surrogates, not one character
+
+
+def _render_runner_template(*, template_name: str, replacements: Dict[str, str]) -> str:  # render one template file by plain token replacement
+    template_path = (RUNNER_TEMPLATE_DIR / template_name).resolve()
+    if template_path.parent != RUNNER_TEMPLATE_DIR:  # accept only files sitting directly in the template dir
+        raise ValueError(f"template must stay under {RUNNER_TEMPLATE_DIR}: {template_path}")
+    if not template_path.is_file():
+        raise ValueError(f"missing runner template: {template_path}")
+    rendered = template_path.read_text(encoding="utf-8")
+    for token, value in replacements.items():  # sequential str.replace in dict order; later tokens also match inside earlier values
+        rendered = rendered.replace(token, value)
+    unresolved = sorted(set(re.findall(r"__FLUXON_TMPL_[A-Z0-9_]+__", rendered)))  # scans the rendered text, inserted values included
+    if unresolved:
+        raise ValueError(f"unresolved runner template tokens: {unresolved} template={template_path}")
+    return rendered
+
+
+def _render_fluxon_fs_s3_payload_wrapper(
+    *,
+    s3_base_url: str,
+    s3_bucket: str,
+    object_key: str,
+    payload_dest_path: str,
+    s3_access_key: str,
+    s3_secret_key: str,
+    s3_region: str,
+    exec_cmd: str,
+) -> str:
+    """Render the payload wrapper template that downloads from the Fluxon FS S3 gateway and then execs."""
+    # Every value goes through _json_string_literal except exec_cmd, which is inserted verbatim.
+    substitutions = {
+        "__FLUXON_TMPL_BASE_URL_JSON__": _json_string_literal(s3_base_url),
+        "__FLUXON_TMPL_BUCKET_JSON__": _json_string_literal(s3_bucket),
+        "__FLUXON_TMPL_OBJECT_KEY_JSON__": _json_string_literal(object_key),
+        "__FLUXON_TMPL_DEST_PATH_JSON__": _json_string_literal(payload_dest_path),
+        "__FLUXON_TMPL_ACCESS_KEY_JSON__": _json_string_literal(s3_access_key),
+        "__FLUXON_TMPL_SECRET_KEY_JSON__": _json_string_literal(s3_secret_key),
+        "__FLUXON_TMPL_REGION_JSON__": _json_string_literal(s3_region),
+        "__FLUXON_TMPL_EXEC_CMD__": exec_cmd,
+    }
+    return _render_runner_template(template_name="payload_fluxon_fs_s3_download_and_exec.sh.template", replacements=substitutions)
+
+
 
 def _find_deploy_instance_opt(resolved_case: Dict[str, Any], *, instance_id: str) -> Optional[Dict[str, Any]]:
     deploy = _require_dict(resolved_case.get("deploy"), "resolved_case.deploy")
@@ -16220,7 +16263,9 @@ def _consume_path(path: Path) -> None:
             return
 
     _consume_path((workdir_root / "case_runs.yaml").resolve())
-    _consume_path((workdir_root / RUNNER_STDIO_LOG_FILENAME).resolve())
+    runner_log_path = _service_log_resolve_read_path(workdir_root, filename=RUNNER_STDIO_LOG_FILENAME)
+    if isinstance(runner_log_path, Path):
+        _consume_path(runner_log_path)
 
     run_dir = (_ui_case_result_root(workdir_root, case_id) / _ui_run_dir_name(run_index)).resolve()
     _consume_path(run_dir)
@@ -16327,7 +16372,7 @@ def _ui_case_overview(workdir_root: Path, *, case_id: str) -> Dict[str, Any]:
 def _ui_collect_suite_overview(workdir_root: Path) -> Dict[str, Any]:
     case_ids = _ui_collect_case_ids(workdir_root)
     cases = [_ui_case_overview(workdir_root, case_id=case_id) for case_id in case_ids]
-    runner_log_path = (workdir_root / RUNNER_STDIO_LOG_FILENAME).resolve()
+    runner_log_path = _service_log_resolve_read_path(workdir_root, filename=RUNNER_STDIO_LOG_FILENAME)
     running_cases = [case for case in cases if case.get("status") == "RUNNING"]
     incomplete_cases = [case for case in cases if case.get("status") in {"INCOMPLETE", "RESERVED"}]
     last_updated_unix_s = 0
@@ -16350,7 +16395,7 @@ def _ui_collect_suite_overview(workdir_root: Path) -> Dict[str, Any]:
     return {
         "workdir_root": workdir_root.resolve(),
         "case_runs_path": (workdir_root / "case_runs.yaml").resolve(),
-        "runner_log_path": runner_log_path if runner_log_path.exists() else None,
+        "runner_log_path": runner_log_path if isinstance(runner_log_path, Path) and runner_log_path.exists() else None,
         "running_case_count": len(running_cases),
         "status": "RUNNING" if running_cases else ("INCOMPLETE" if incomplete_cases else ("IDLE" if cases else "EMPTY")),
         "last_updated_unix_s": int(last_updated_unix_s),
@@ -16451,7 +16496,7 @@ def _ui_workdir_id(workdir_root: Path) -> str:
 
 def _ui_workdir_touch_unix_s(workdir_root: Path) -> int:
     touched = 0
-    for name in ("case_runs.yaml", RUNNER_STDIO_LOG_FILENAME):
+    for name in ("case_runs.yaml",):
         path = (workdir_root / name).resolve()
         if not path.exists():
             continue
@@ -16459,6 +16504,12 @@ def _ui_workdir_touch_unix_s(workdir_root: Path) -> int:
             touched = max(touched, int(path.stat().st_mtime))
         except Exception:
             continue
+    runner_log_path = _service_log_resolve_read_path(workdir_root, filename=RUNNER_STDIO_LOG_FILENAME)
+    if isinstance(runner_log_path, Path) and runner_log_path.exists():
+        try:
+            touched = max(touched, int(runner_log_path.stat().st_mtime))
+        except Exception:
+            pass
     return int(touched)
 
 
@@ -17897,8 +17948,11 @@ def _handle_api_log_chunk(self, parsed) -> None:
                         self._send_json(400, {"error": "missing workdir_id"})
                         return
                     suite_workdir = _ui_workdir_by_id(workdir_root, workdir_id, extra_history_roots)
-                    path = (suite_workdir / RUNNER_STDIO_LOG_FILENAME).resolve()
-                    if not path.exists():
+                    path = _service_log_resolve_read_path(
+                        suite_workdir,
+                        filename=RUNNER_STDIO_LOG_FILENAME,
+                    )
+                    if not isinstance(path, Path) or not path.exists():
                         raise FileNotFoundError(f"runner log not found: {path}")
                 elif kind == "run":
                     workdir_id = (qs.get("workdir_id") or [""])[0]
diff --git a/fluxon_test_stack/test_runner_templates/payload_fluxon_fs_s3_download_and_exec.sh.template b/fluxon_test_stack/test_runner_templates/payload_fluxon_fs_s3_download_and_exec.sh.template
new file mode 100644
index 0000000..ca677bc
--- /dev/null
+++ b/fluxon_test_stack/test_runner_templates/payload_fluxon_fs_s3_download_and_exec.sh.template
@@ -0,0 +1,108 @@
+set -euo pipefail
+python3 - <<'PY'
+import datetime
+import hashlib
+import hmac
+import urllib.parse
+import urllib.request
+from pathlib import Path
+
+BASE_URL = __FLUXON_TMPL_BASE_URL_JSON__  # placeholders on these lines are filled in when the runner renders this template
+BUCKET = __FLUXON_TMPL_BUCKET_JSON__
+OBJECT_KEY = __FLUXON_TMPL_OBJECT_KEY_JSON__
+DEST_PATH = __FLUXON_TMPL_DEST_PATH_JSON__  # local file the downloaded object ends up in
+ACCESS_KEY = __FLUXON_TMPL_ACCESS_KEY_JSON__
+SECRET_KEY = __FLUXON_TMPL_SECRET_KEY_JSON__
+REGION = __FLUXON_TMPL_REGION_JSON__
+
+ALG = "AWS4-HMAC-SHA256"
+SERVICE = "s3"
+TERM = "aws4_request"
+UNSIGNED = "UNSIGNED-PAYLOAD"  # sent as the x-amz-content-sha256 value for the GET
+
+
+def _hmac_sha256(key: bytes, msg: bytes) -> bytes:  # raw HMAC-SHA256 digest of msg under key
+    return hmac.new(key, msg, hashlib.sha256).digest()
+
+
+def _sha256_hex(msg: bytes) -> str:  # hex-encoded SHA-256 of msg
+    return hashlib.sha256(msg).hexdigest()
+
+
+def _derive_signing_key(secret_key: str, scope_date: str, region: str) -> bytes:  # HMAC chain: "AWS4"+secret -> date -> region -> service -> terminator
+    k_date = _hmac_sha256(("AWS4" + secret_key).encode("utf-8"), scope_date.encode("utf-8"))
+    k_region = _hmac_sha256(k_date, region.encode("utf-8"))
+    k_service = _hmac_sha256(k_region, SERVICE.encode("utf-8"))
+    return _hmac_sha256(k_service, TERM.encode("utf-8"))  # each step keys the next HMAC with the previous digest
+
+
+def _sigv4_headers(*, method: str, signing_path: str, query: str, host: str, scope_date: str, amz_date: str, payload_hash: str) -> dict:
+    """Build the signed header set (Authorization, x-amz-date, x-amz-content-sha256, Host) for one request."""
+    signed_headers = "host;x-amz-content-sha256;x-amz-date"
+    canonical_headers = f"host:{host}\nx-amz-content-sha256:{payload_hash}\nx-amz-date:{amz_date}\n"
+    canonical_request = "\n".join((method, signing_path, query, canonical_headers, signed_headers, payload_hash))
+    scope = f"{scope_date}/{REGION}/{SERVICE}/{TERM}"
+    string_to_sign = "\n".join((ALG, amz_date, scope, _sha256_hex(canonical_request.encode("utf-8"))))
+    # Final HMAC-SHA256 over the string to sign, taken as hex rather than raw bytes.
+    signature = hmac.new(
+        _derive_signing_key(SECRET_KEY, scope_date, REGION),
+        string_to_sign.encode("utf-8"),
+        hashlib.sha256,
+    ).hexdigest()
+    return {
+        "Authorization": f"{ALG} Credential={ACCESS_KEY}/{scope}, SignedHeaders={signed_headers}, Signature={signature}",
+        "x-amz-date": amz_date,
+        "x-amz-content-sha256": payload_hash,
+        "Host": host,
+    }
+
+
+u = urllib.parse.urlparse(BASE_URL)  # validate the gateway URL before any request is built
+if u.scheme not in ("http", "https"):
+    raise ValueError("BASE_URL must be http(s)")
+if not u.netloc:
+    raise ValueError("BASE_URL missing host")
+base_path = u.path.rstrip("/")
+if base_path == "":
+    raise ValueError("BASE_URL must include a non-root path prefix (e.g. /fs_s3)")
+
+bucket_enc = urllib.parse.quote(BUCKET, safe="-_.~")
+key_enc = urllib.parse.quote(OBJECT_KEY, safe="/-_.~")  # "/" stays unescaped inside the object key
+full_path = base_path + "/" + bucket_enc + "/" + key_enc
+signing_path = full_path  # sign the client-visible request path, including the BASE_URL path prefix (e.g. /fs_s3)
+url = f"{u.scheme}://{u.netloc}{full_path}"
+
+now = datetime.datetime.now(datetime.timezone.utc)  # utcnow() is deprecated since Python 3.12; the formatted values are unchanged
+amz_date = now.strftime("%Y%m%dT%H%M%SZ")
+scope_date = now.strftime("%Y%m%d")
+hdrs = _sigv4_headers(
+    method="GET",
+    signing_path=signing_path,
+    query="",
+    host=u.netloc,
+    scope_date=scope_date,
+    amz_date=amz_date,
+    payload_hash=UNSIGNED,
+)
+
+dest = Path(DEST_PATH)
+dest.parent.mkdir(parents=True, exist_ok=True)
+tmp = Path(str(dest) + ".tmp")  # download next to dest, then rename over it at the end
+if tmp.exists():
+    tmp.unlink()
+req = urllib.request.Request(url, method="GET")
+for k, v in hdrs.items():
+    req.add_header(k, v)
+with urllib.request.urlopen(req, timeout=60) as resp:
+    if getattr(resp, "status", None) != 200:
+        body = resp.read(4096)
+        raise RuntimeError(f'download failed: status={getattr(resp, "status", None)} body={body!r}')
+    with tmp.open("wb") as f:
+        while True:
+            b = resp.read(1024 * 1024)  # stream in 1 MiB chunks
+            if not b:
+                break
+            f.write(b)
+tmp.replace(dest)
+PY
+exec __FLUXON_TMPL_EXEC_CMD__
diff --git a/fluxon_test_stack/test_runner_ui.py b/fluxon_test_stack/test_runner_ui.py
index 9702da4..d7c6ac2 100644
--- a/fluxon_test_stack/test_runner_ui.py
+++ b/fluxon_test_stack/test_runner_ui.py
@@ -53,6 +53,10 @@ def main() -> None:
         raw_path=Path(args.workdir),
         field_name="workdir",
     )
+    test_runner._redirect_process_stdio_to_log(
+        workdir_root,
+        filename="test_runner_ui.log",
+    )
     gitops_cfg_path = None
     if args.gitops_config:
         gitops_cfg_path = test_runner._resolve_repo_root_cli_path(
diff --git a/fluxon_test_stack/tests/test_ci_2_virt_node_contract.py b/fluxon_test_stack/tests/test_ci_2_virt_node_contract.py
index 96f0554..a9d0cf7 100644
--- a/fluxon_test_stack/tests/test_ci_2_virt_node_contract.py
+++ b/fluxon_test_stack/tests/test_ci_2_virt_node_contract.py
@@ -29,12 +29,13 @@ def _load_module():
 class TestCi2VirtNodeContract(unittest.TestCase):
     _KVTEST_SCENE_ID = "ci_top_attention_bin_kvtest"
     _DOC_SCENE_ID = "ci_top_attention_doc_page_build"
+    _LOG_MGMT_SCENE_ID = "ci_top_attention_log_mgmt"
 
     def test_generated_suite_is_public_dual_local_nodes_ci_only(self) -> None:
         suite_cfg = _ENTRY._load_yaml_mapping(_ENTRY.DEFAULT_SUITE_PATH, ctx="suite")
         generated = _ENTRY._rewrite_suite_for_local_dual_nodes(
             suite_cfg=suite_cfg,
-            scene_ids=[self._DOC_SCENE_ID, self._KVTEST_SCENE_ID],
+            scene_ids=[self._DOC_SCENE_ID, self._KVTEST_SCENE_ID, self._LOG_MGMT_SCENE_ID],
             primary_node_name="local-node-a",
             secondary_node_name="local-node-b",
             host_ip="10.1.1.119",
@@ -43,7 +44,7 @@ def test_generated_suite_is_public_dual_local_nodes_ci_only(self) -> None:
         )
 
         self.assertEqual(generated["run"]["selectors"]["profile_ids"], ["fluxon_tcp_thread"])
-        self.assertEqual(set(generated["scenes"].keys()), {self._DOC_SCENE_ID, self._KVTEST_SCENE_ID})
+        self.assertEqual(set(generated["scenes"].keys()), {self._DOC_SCENE_ID, self._KVTEST_SCENE_ID, self._LOG_MGMT_SCENE_ID})
         self.assertEqual(generated["profiles"]["fluxon_tcp_thread"]["artifact_set"], "fluxon_tcp_thread")
         self.assertEqual(
             generated["profiles"]["fluxon_tcp_thread"]["runtime"]["ci"]["scene_configs"][self._KVTEST_SCENE_ID][
@@ -51,6 +52,12 @@ def test_generated_suite_is_public_dual_local_nodes_ci_only(self) -> None:
             ],
             "tcp_thread_transport",
         )
+        self.assertEqual(
+            generated["profiles"]["fluxon_tcp_thread"]["runtime"]["ci"]["scene_configs"][self._LOG_MGMT_SCENE_ID][
+                "enabled"
+            ],
+            True,
+        )
         self.assertEqual(
             generated["profiles"]["fluxon_tcp_thread"]["runtime"]["ci"]["deploy"]["target_ip_map"],
             {"local-node-a": "10.1.1.119", "local-node-b": "10.1.1.119"},
@@ -106,11 +113,16 @@ def test_generated_suite_is_public_dual_local_nodes_ci_only(self) -> None:
             generated["scenes"][self._KVTEST_SCENE_ID]["select"]["scales"],
             ["n1_kvowner_dram_20gib"],
         )
+        self.assertEqual(
+            generated["scenes"][self._LOG_MGMT_SCENE_ID]["select"]["scales"],
+            ["n1_kvowner_dram_20gib"],
+        )
         self.assertEqual(
             set(generated["scales"].keys()),
             {"n1_kvowner_dram_3gib", "n1_kvowner_dram_20gib"},
         )
         self.assertNotIn("commands", generated["scenes"][self._KVTEST_SCENE_ID]["ci"])
+        self.assertNotIn("commands", generated["scenes"][self._LOG_MGMT_SCENE_ID]["ci"])
 
     def test_generated_suite_preserves_source_scene_configs(self) -> None:
         suite_cfg = _ENTRY._load_yaml_mapping(_ENTRY.DEFAULT_SUITE_PATH, ctx="suite")
@@ -211,7 +223,23 @@ def test_generated_deployconf_rewrites_to_dual_local_nodes(self) -> None:
         self.assertIn('--wheel "$FLUXON_RELEASE_WHEEL"', generated["global_envs"]["FLUXON_RELEASE_WHEEL_FETCH_CMD"])
         self.assertEqual(generated["atomic_groups"]["fluxon_core_controller"]["nodes"], ["local-node-a", "local-node-b"])
         self.assertEqual(generated["service"]["owner"]["node_bind"]["node"], ["local-node-a", "local-node-b"])
+        self.assertIn(
+            'log_root_path: "${HOSTWORKDIR}/large/log/owner_${NODE_ID}"',
+            generated["service"]["owner"]["entrypoint"],
+        )
+        self.assertIn(
+            'cache_root_path: "${HOSTWORKDIR}/large/cache/owner_${NODE_ID}"',
+            generated["service"]["owner"]["entrypoint"],
+        )
         self.assertEqual(generated["service"]["ops_controller"]["port"], 19180)
+        self.assertIn(
+            'http_listen_addr: "0.0.0.0:${OPS_CONTROLLER__PORT}"',
+            generated["service"]["ops_controller"]["entrypoint"],
+        )
+        self.assertNotIn(
+            'http_listen_addr: "0.0.0.0:${MASTER__PORT}"',
+            generated["service"]["ops_controller"]["entrypoint"],
+        )
         self.assertIn("local-node-a", generated["service"]["ops_agent"]["entrypoint"])
         self.assertIn("local-node-b", generated["service"]["ops_agent"]["entrypoint"])
         self.assertIn('    - "10.1.1.119/32"', generated["service"]["master"]["entrypoint"])
@@ -401,7 +429,7 @@ def test_main_supports_explicit_suite_path(self) -> None:
             suite_cfg["scenes"] = {
                 key: value
                 for key, value in suite_cfg["scenes"].items()
-                if key in (self._DOC_SCENE_ID, self._KVTEST_SCENE_ID)
+                if key in (self._DOC_SCENE_ID, self._KVTEST_SCENE_ID, self._LOG_MGMT_SCENE_ID)
             }
             suite_cfg["profiles"] = {"fluxon_tcp": suite_cfg["profiles"]["fluxon_tcp"]}
             suite_cfg["run"]["selectors"]["profile_ids"] = ["fluxon_tcp"]
@@ -409,6 +437,7 @@ def test_main_supports_explicit_suite_path(self) -> None:
             suite_cfg["profiles"]["fluxon_tcp"]["runtime"]["ci"]["scene_configs"][self._DOC_SCENE_ID]["doc_site_base_url"] = (
                 "tele-ai.github.io/Fluxon"
             )
+            suite_cfg["profiles"]["fluxon_tcp"]["runtime"]["ci"]["scene_configs"][self._LOG_MGMT_SCENE_ID]["enabled"] = True
             _ENTRY._write_yaml(suite_path, suite_cfg)
             release_dir = REPO_ROOT / "fluxon_release"
             release_dir.mkdir(parents=True, exist_ok=True)
@@ -445,7 +474,7 @@ def test_main_supports_explicit_suite_path(self) -> None:
                 workdir / "generated" / "ci_test_list.local.yaml",
                 ctx="generated suite",
             )
-            self.assertEqual(set(generated_suite["scenes"].keys()), {self._DOC_SCENE_ID, self._KVTEST_SCENE_ID})
+            self.assertEqual(set(generated_suite["scenes"].keys()), {self._DOC_SCENE_ID, self._KVTEST_SCENE_ID, self._LOG_MGMT_SCENE_ID})
             self.assertEqual(
                 generated_suite["profiles"]["fluxon_tcp_thread"]["runtime"]["ci"]["scene_configs"][self._KVTEST_SCENE_ID][
                     "kv_test_rounds"
@@ -458,6 +487,12 @@ def test_main_supports_explicit_suite_path(self) -> None:
                 ],
                 "tele-ai.github.io/Fluxon",
             )
+            self.assertEqual(
+                generated_suite["profiles"]["fluxon_tcp_thread"]["runtime"]["ci"]["scene_configs"][self._LOG_MGMT_SCENE_ID][
+                    "enabled"
+                ],
+                True,
+            )
 
     def test_main_same_host_generated_configs_use_non_loopback_host_ip(self) -> None:
         with tempfile.TemporaryDirectory() as td:
@@ -563,6 +598,60 @@ def fake_run(argv: list[str], *, env=None) -> None:
                 str((REPO_ROOT / "fluxon_test_stack" / "pack_test_stack_rsc.py").resolve()),
             )
 
+    def test_main_passes_explicit_release_dir_to_pack_stage(self) -> None:
+        with tempfile.TemporaryDirectory() as td:
+            root = Path(td)
+            workdir = root / "ci_2_virt_node_workdir"
+            hostworkdir = root / "hostworkdir"
+            release_dir = root / "custom_release"
+            release_dir.mkdir(parents=True, exist_ok=True)
+            wheel_path = release_dir / "fluxon-0.2.1-cp38-abi3-manylinux_2_28_x86_64.whl"
+            wheel_path.write_text("", encoding="utf-8")
+            calls: list[tuple[list[str], dict[str, str] | None]] = []
+
+            def fake_run(argv: list[str], *, env=None) -> None:
+                calls.append((list(argv), None if env is None else dict(env)))
+
+            argv = [
+                "ci_2_virt_node.py",
+                "--workdir",
+                str(workdir),
+                "--testbed-hostworkdir",
+                str(hostworkdir),
+                "--release-dir",
+                str(release_dir),
+                "--scene-id",
+                self._KVTEST_SCENE_ID,
+                "--skip-builder-image",
+                "--skip-dispatch",
+                "--skip-start-testbed",
+                "--skip-runner",
+            ]
+            original_argv = sys.argv[:]
+            try:
+                with mock.patch.object(_ENTRY, "_run", side_effect=fake_run):
+                    with mock.patch.object(_ENTRY, "_detect_local_hostname", return_value="runner-host"):
+                        with mock.patch.object(_ENTRY, "_detect_local_ipv4", return_value="10.1.1.119"):
+                            with mock.patch.object(_ENTRY, "_ensure_ci_pack_release_env", return_value=Path("/tmp/env.yaml")):
+                                with mock.patch.object(_ENTRY, "_render_ci_nix_pack_config", return_value=Path("/tmp/cfg.yaml")):
+                                    sys.argv = argv
+                                    rc = _ENTRY.main()
+            finally:
+                sys.argv = original_argv
+
+            self.assertEqual(rc, 0)
+            self.assertGreaterEqual(len(calls), 2)
+            pack_cmd = calls[1][0]
+            self.assertEqual(
+                pack_cmd[1],
+                str((REPO_ROOT / "fluxon_test_stack" / "pack_test_stack_rsc.py").resolve()),
+            )
+            self.assertIn("--release-dir", pack_cmd)
+            self.assertEqual(
+                pack_cmd[pack_cmd.index("--release-dir") + 1],
+                str(release_dir.resolve()),
+            )
+
     def test_main_uses_apply_check_config_for_explicit_apply_validation(self) -> None:
         with tempfile.TemporaryDirectory() as td:
             root = Path(td)
diff --git a/fluxon_test_stack/tests/test_pack_test_stack_rsc_cli.py b/fluxon_test_stack/tests/test_pack_test_stack_rsc_cli.py
index d4bfac2..09afc1b 100644
--- a/fluxon_test_stack/tests/test_pack_test_stack_rsc_cli.py
+++ b/fluxon_test_stack/tests/test_pack_test_stack_rsc_cli.py
@@ -261,26 +261,19 @@ def test_git_stage_ci_source_tree_excludes_runtime_outputs(self) -> None:
                 "scripts/build_doc_site.py",
                 "fluxon_doc_cn/roadmap.md",
                 "README.md",
-                "fluxon_release/install.py",
-                ".dever/run.log",
-                "skills/demo/SKILL.md",
             ):
                 path = repo_root / relpath
                 path.parent.mkdir(parents=True, exist_ok=True)
                 path.write_text("x\n", encoding="utf-8")
-
-            raw = b"\0".join(
-                [
-                    b"scripts/build_doc_site.py",
-                    b"fluxon_doc_cn/roadmap.md",
-                    b"README.md",
-                    b"fluxon_release/install.py",
-                    b".dever/run.log",
-                    b"skills/demo/SKILL.md",
-                ]
-            ) + b"\0"
-
-            with mock.patch.object(_PACK.subprocess, "check_output", return_value=raw):
+            with mock.patch.object(
+                _PACK,
+                "_collect_ci_source_relpaths",
+                return_value=[
+                    "README.md",
+                    "fluxon_doc_cn/roadmap.md",
+                    "scripts/build_doc_site.py",
+                ],
+            ):
                 relpaths = _PACK._git_stage_ci_source_tree(repo_root=repo_root, stage_root=stage_root)
 
             self.assertEqual(
@@ -308,25 +301,40 @@ def test_collect_ci_source_relpaths_excludes_runtime_outputs(self) -> None:
                 path = repo_root / relpath
                 path.parent.mkdir(parents=True, exist_ok=True)
                 path.write_text("x\n", encoding="utf-8")
+            (repo_root / ".gitignore").write_text(
+                "\n".join(
+                    [
+                        "fluxon_release/*",
+                        "!fluxon_release/install.py",
+                        ".dever",
+                        "skills/",
+                    ]
+                )
+                + "\n",
+                encoding="utf-8",
+            )
 
-            raw = b"\0".join(
-                [
-                    b"scripts/build_doc_site.py",
-                    b"fluxon_doc_cn/roadmap.md",
-                    b"README.md",
-                    b"fluxon_release/install.py",
-                    b".dever/run.log",
-                    b"skills/demo/SKILL.md",
-                ]
-            ) + b"\0"
-
-            with mock.patch.object(_PACK.subprocess, "check_output", return_value=raw):
+            def fake_check_output(argv, cwd=None):
+                del argv
+                cwd_path = Path(cwd).resolve()
+                if cwd_path == repo_root.resolve():
+                    return b"scripts/build_doc_site.py\0fluxon_doc_cn/roadmap.md\0README.md\0"
+                raise AssertionError(f"unexpected git ls-files cwd: {cwd_path}")
+
+            with mock.patch.object(
+                _PACK.collect_source_profile_relpaths.__globals__["git_source_selection_utils"].subprocess,
+                "check_output",
+                side_effect=fake_check_output,
+            ):
                 relpaths = _PACK._collect_ci_source_relpaths(repo_root=repo_root)
 
             self.assertEqual(
                 relpaths,
                 ["README.md", "fluxon_doc_cn/roadmap.md", "scripts/build_doc_site.py"],
             )
+            self.assertNotIn("fluxon_release/install.py", relpaths)
+            self.assertNotIn(".dever/run.log", relpaths)
+            self.assertNotIn("skills/demo/SKILL.md", relpaths)
 
     def test_collect_ci_source_relpaths_includes_rather_no_git_submodule_sources(self) -> None:
         with tempfile.TemporaryDirectory() as tmpdir:
@@ -334,6 +342,7 @@ def test_collect_ci_source_relpaths_includes_rather_no_git_submodule_sources(sel
             tracked_root = repo_root / "scripts"
             tracked_root.mkdir(parents=True, exist_ok=True)
             (tracked_root / "build_doc_site.py").write_text("tracked\n", encoding="utf-8")
+            (repo_root / ".gitignore").write_text("", encoding="utf-8")
             module_root = repo_root / "fluxon_rs" / "moka"
             (module_root / "src").mkdir(parents=True, exist_ok=True)
             (module_root / "Cargo.toml").write_text("module\n", encoding="utf-8")
@@ -357,7 +366,11 @@ def fake_check_output(argv, cwd=None):
                     return b"Cargo.toml\0src/lib.rs\0"
                 raise AssertionError(f"unexpected git ls-files cwd: {cwd_path}")
 
-            with mock.patch.object(_PACK.subprocess, "check_output", side_effect=fake_check_output):
+            with mock.patch.object(
+                _PACK.collect_source_profile_relpaths.__globals__["git_source_selection_utils"].subprocess,
+                "check_output",
+                side_effect=fake_check_output,
+            ):
                 relpaths = _PACK._collect_ci_source_relpaths(repo_root=repo_root)
 
             self.assertEqual(
@@ -384,9 +397,9 @@ def test_collect_ci_source_relpaths_requires_rather_no_git_submodule_root_to_exi
 
             with (
                 mock.patch.object(
-                    _PACK,
-                    "_collect_git_listed_source_relpaths",
-                    return_value=["scripts/build_doc_site.py"],
+                    _PACK.collect_source_profile_relpaths.__globals__["git_source_selection_utils"].subprocess,
+                    "check_output",
+                    return_value=b"scripts/build_doc_site.py\0",
                 ),
                 self.assertRaisesRegex(
                     RuntimeError,
@@ -422,6 +435,54 @@ def test_compute_ci_source_digest_uses_selected_git_paths_only(self) -> None:
             digest_roots = digest_mock.call_args.args[0]
             self.assertEqual(digest_roots, [tracked.resolve()])
 
+    def test_prune_stage_paths_applies_glob_patterns(self) -> None:
+        with tempfile.TemporaryDirectory() as tmpdir:
+            stage_root = Path(tmpdir)
+            keep_path = stage_root / "keep.txt"
+            pyc_path = stage_root / "pkg" / "drop.pyc"
+            baseline_file = stage_root / "baselines" / "manifest.txt"
+            pyc_path.parent.mkdir(parents=True, exist_ok=True)
+            baseline_file.parent.mkdir(parents=True, exist_ok=True)
+            keep_path.write_text("keep\n", encoding="utf-8")
+            pyc_path.write_text("drop\n", encoding="utf-8")
+            baseline_file.write_text("drop\n", encoding="utf-8")
+
+            _PACK.script_utils.prune_stage_paths(
+                stage_root,
+                ("*.pyc", "baselines/"),
+            )
+
+            self.assertTrue(keep_path.exists())
+            self.assertFalse(pyc_path.exists())
+            self.assertFalse(baseline_file.exists())
+
+    def test_shared_rsync_stage_accepts_exclude_patterns(self) -> None:
+        with tempfile.TemporaryDirectory() as tmpdir:
+            repo_root = Path(tmpdir)
+            src = repo_root / "src"
+            dst = repo_root / "dst"
+            (src / "keep").mkdir(parents=True, exist_ok=True)
+            (src / "drop").mkdir(parents=True, exist_ok=True)
+            (src / "keep" / "a.txt").write_text("keep\n", encoding="utf-8")
+            (src / "drop" / "b.txt").write_text("drop\n", encoding="utf-8")
+
+            run_mock = mock.Mock()
+            with mock.patch.dict(
+                _PACK.script_utils.rsync_stage.__globals__,
+                {"run_cmd_argv": run_mock},
+            ):
+                _PACK.script_utils.rsync_stage(
+                    repo_root=repo_root,
+                    src=src,
+                    dst=dst,
+                    honor_gitignore=False,
+                    exclude_rel_paths=("drop/", "*.tmp"),
+                )
+
+            argv = run_mock.call_args.args[0]
+            self.assertIn("--exclude=drop/", argv)
+            self.assertIn("--exclude=*.tmp", argv)
+
 
 if __name__ == "__main__":
     raise SystemExit(unittest.main())
diff --git a/fluxon_test_stack/tests/test_runner_contract.py b/fluxon_test_stack/tests/test_runner_contract.py
index d017841..67d42e0 100644
--- a/fluxon_test_stack/tests/test_runner_contract.py
+++ b/fluxon_test_stack/tests/test_runner_contract.py
@@ -59,6 +59,10 @@ def _build_checks(selected_test_id: Optional[str]) -> List[Tuple[str, Callable[[
             "ci_top_attention_doc_page_build_declares_setup_dev_env_prepare",
             test_ci_top_attention_doc_page_build_declares_setup_dev_env_prepare,
         ),
+        (
+            "ci_top_attention_log_mgmt_scene_exists",
+            test_ci_top_attention_log_mgmt_scene_exists,
+        ),
     ]
     if selected_test_id is None:
         return checks
@@ -247,5 +251,51 @@ def test_ci_top_attention_doc_page_build_declares_setup_dev_env_prepare() -> Non
     print("PASS: test_ci_top_attention_doc_page_build_declares_setup_dev_env_prepare")
 
 
+def test_ci_top_attention_log_mgmt_scene_exists() -> None:
+    repo_root = Path(__file__).resolve().parents[2]
+    suite_cfg_path = repo_root / "fluxon_test_stack" / "ci_test_list.yaml"
+    suite_cfg = yaml.safe_load(suite_cfg_path.read_text(encoding="utf-8"))
+    if not isinstance(suite_cfg, dict):
+        print("FAIL: test_ci_top_attention_log_mgmt_scene_exists - suite config is not a mapping")
+        return
+
+    suite_for_contract = copy.deepcopy(suite_cfg)
+    artifact_sets = suite_for_contract.get("artifact_sets")
+    if not isinstance(artifact_sets, dict):
+        print("FAIL: test_ci_top_attention_log_mgmt_scene_exists - artifact_sets is not a mapping")
+        return
+    for artifact_set in artifact_sets.values():
+        if not isinstance(artifact_set, dict):
+            continue
+        release_artifacts = artifact_set.get("release_artifacts")
+        if isinstance(release_artifacts, dict):
+            python_wheel = release_artifacts.get("python_wheel")
+            if isinstance(python_wheel, str) and python_wheel.strip():
+                artifact_set["release_artifacts"] = {"wheel": python_wheel}
+
+    suite = _TEST_RUNNER._parse_suite_config(suite_for_contract)
+    scene = suite.scenes.get("ci_top_attention_log_mgmt")
+    if not isinstance(scene, dict):
+        print("FAIL: test_ci_top_attention_log_mgmt_scene_exists - missing scene")
+        return
+    ci = scene.get("ci")
+    if not isinstance(ci, dict):
+        print("FAIL: test_ci_top_attention_log_mgmt_scene_exists - scene.ci missing")
+        return
+    if ci.get("subject") != "rust":
+        print(
+            "FAIL: test_ci_top_attention_log_mgmt_scene_exists - "
+            f"expected subject 'rust', got {ci.get('subject')!r}"
+        )
+        return
+    if ci.get("runtime_contract") != "rust_self_managed":
+        print(
+            "FAIL: test_ci_top_attention_log_mgmt_scene_exists - "
+            f"expected runtime_contract 'rust_self_managed', got {ci.get('runtime_contract')!r}"
+        )
+        return
+    print("PASS: test_ci_top_attention_log_mgmt_scene_exists")
+
+
 if __name__ == "__main__":
     raise SystemExit(main())
diff --git a/fluxon_test_stack/tests/test_test_runner_testbed_contract.py b/fluxon_test_stack/tests/test_test_runner_testbed_contract.py
index 617ffda..4272c10 100644
--- a/fluxon_test_stack/tests/test_test_runner_testbed_contract.py
+++ b/fluxon_test_stack/tests/test_test_runner_testbed_contract.py
@@ -103,6 +103,30 @@ def test_top_attention_ci_execution_plan_is_runner_native(self) -> None:
         self.assertEqual(planned[0].ci_commands[0]["id"], "top_attention_bin_kvtest")
         self.assertIn("--case-config __RUN_DIR__/configs/ci_scene_config.yaml", planned[0].ci_commands[0]["command"])
 
+    def test_top_attention_log_mgmt_ci_execution_plan_is_runner_native(self) -> None:
+        suite_cfg = yaml.safe_load((_RUNNER.RUNNER_REPO_ROOT / "fluxon_test_stack" / "ci_test_list.yaml").read_text(encoding="utf-8"))
+        artifact_sets = suite_cfg.get("artifact_sets")
+        if isinstance(artifact_sets, dict):
+            for artifact_set in artifact_sets.values():
+                if not isinstance(artifact_set, dict):
+                    continue
+                release_artifacts = artifact_set.get("release_artifacts")
+                if isinstance(release_artifacts, dict):
+                    python_wheel = release_artifacts.get("python_wheel")
+                    if isinstance(python_wheel, str) and python_wheel.strip():
+                        artifact_set["release_artifacts"] = {"wheel": python_wheel}
+        suite = _RUNNER._parse_suite_config(suite_cfg)
+        cases = _RUNNER._expand_cases(suite)
+        case = next(item for item in cases if item.scene_id == "ci_top_attention_log_mgmt" and item.profile_id == "fluxon_tcp")
+        planned = _RUNNER._build_ci_execution_plan(case, suite)
+        self.assertEqual(len(planned), 1)
+        self.assertEqual(planned[0].ci_commands[0]["id"], "top_attention_log_mgmt")
+        self.assertIn(
+            "__RUN_DIR__/src/fluxon_test_stack/top_attention_test_index/_log_mgmt.py",
+            planned[0].ci_commands[0]["command"],
+        )
+        self.assertIn("--case-config __RUN_DIR__/configs/ci_scene_config.yaml", planned[0].ci_commands[0]["command"])
+
     def test_ci_prepare_run_inputs_rebuilds_release_view_without_reusing_source_test_rsc(self) -> None:
         with tempfile.TemporaryDirectory() as td:
             root = Path(td)
@@ -520,6 +544,81 @@ def test_ci_base_runtime_service_target_ip_uses_loopback_for_same_host_local_nod
                     "127.0.0.1",
                 )
 
+    def test_write_deployer_manifests_renders_payload_wrapper_from_template(self) -> None:
+        with tempfile.TemporaryDirectory() as td:
+            run_dir = Path(td)
+            resolved_case = {
+                "case": {
+                    "case_id": "bench_case",
+                    "profile_id": "bench_profile",
+                },
+                "scene": {
+                    "bench": {
+                        "subject": "kv",
+                    }
+                },
+                "deploy": {
+                    "instances": [
+                        {
+                            "id": "worker_0",
+                            "k8s_ref": "deployment/test-worker",
+                            "lifecycle": "service",
+                            "deployer": {
+                                "target": "logic-a",
+                                "payload_file": "wheelhouse/pkg.whl",
+                                "payload_dest_path": "/tmp/run/pkg.whl",
+                                "command": ["/bin/sh", "-lc", "python3 /tmp/run/pkg.whl"],
+                            },
+                        }
+                    ],
+                    "payload_delivery": {
+                        "kind": _RUNNER.PAYLOAD_DELIVERY_KIND_FLUXON_FS_S3,
+                        "s3_base_url": "http://127.0.0.1:19080/fs_s3",
+                        "bucket": "bench-bucket",
+                        "access_key": "bench-ak",
+                        "secret_key": "bench-sk",
+                        "region": "bench-region",
+                        "key_prefix": "case-prefix",
+                    },
+                },
+                "runtime": {
+                    "workdir_root": str(run_dir.parent),
+                    "run_dir": str(run_dir),
+                    "stack_identity": {
+                        "cluster_name": "fluxon_testbed",
+                        "controller_url": "http://127.0.0.1:19080/r/ops/fluxon_testbed",
+                        "shared_memory_path": "/tmp/shm",
+                        "shared_file_path": "/tmp/share",
+                    },
+                },
+                "artifact_set": {
+                    "release_root": str(run_dir / "fluxon_release"),
+                    "test_rsc_root": str(run_dir / "test_rsc"),
+                },
+            }
+
+            template_path = (
+                _RUNNER.RUNNER_TEMPLATE_DIR / "payload_fluxon_fs_s3_download_and_exec.sh.template"
+            ).resolve()
+            self.assertTrue(template_path.is_file())
+
+            _RUNNER._write_deployer_manifests(resolved_case, run_dir, allow_overwrite=False)
+
+            manifest_docs = list(
+                yaml.safe_load_all((run_dir / "deployer_deploy.yaml").read_text(encoding="utf-8"))
+            )
+            self.assertEqual(len(manifest_docs), 1)
+            container = manifest_docs[0]["spec"]["template"]["spec"]["containers"][0]
+            self.assertEqual(container["command"], ["/bin/bash", "-lc"])
+            self.assertEqual(len(container["args"]), 1)
+            script_text = container["args"][0]
+            self.assertIn("python3 - <<'PY'", script_text)
+            self.assertIn('BASE_URL = "http://127.0.0.1:19080/fs_s3"', script_text)
+            self.assertIn('OBJECT_KEY = "case-prefix/wheelhouse/pkg.whl"', script_text)
+            self.assertIn('DEST_PATH = "/tmp/run/pkg.whl"', script_text)
+            self.assertIn('exec /bin/sh -lc', script_text)
+            self.assertNotIn("__FLUXON_TMPL_", script_text)
+
 
 if __name__ == "__main__":
     raise SystemExit(unittest.main())
diff --git a/fluxon_test_stack/tests/test_test_runner_ui_contract.py b/fluxon_test_stack/tests/test_test_runner_ui_contract.py
index ff407e2..2abc4ec 100644
--- a/fluxon_test_stack/tests/test_test_runner_ui_contract.py
+++ b/fluxon_test_stack/tests/test_test_runner_ui_contract.py
@@ -119,6 +119,8 @@ def test_redirect_process_stdio_starts_mirror_on_github_actions(self) -> None:
             workdir = Path(td)
             original_log_fp = _RUNNER._RUNNER_STDIO_LOG_FP
             original_keepalive = _RUNNER._RUNNER_STDIO_KEEPALIVE_FDS
+            saved_stdout = sys.stdout
+            saved_stderr = sys.stderr
             with mock.patch.dict(os.environ, {"GITHUB_ACTIONS": "true"}, clear=False):
                 _RUNNER._RUNNER_STDIO_LOG_FP = None
                 _RUNNER._RUNNER_STDIO_KEEPALIVE_FDS = (11, 12)
@@ -129,10 +131,18 @@ def test_redirect_process_stdio_starts_mirror_on_github_actions(self) -> None:
             self.assertEqual(dup2_mock.call_count, 2)
             start_mirror.assert_called_once()
             kwargs = start_mirror.call_args.kwargs
-            self.assertEqual(kwargs["log_path"], (workdir / _RUNNER.RUNNER_STDIO_LOG_FILENAME).resolve())
+            expected_log_path = _RUNNER._service_log_base_path(
+                workdir, filename=_RUNNER.RUNNER_STDIO_LOG_FILENAME
+            )
+            self.assertEqual(kwargs["log_path"], expected_log_path)
             self.assertEqual(kwargs["stdout_fd"], 11)
             self.assertNotIn("stderr_fd", kwargs)
-            if _RUNNER._RUNNER_STDIO_LOG_FP is not None:
+            sys.stdout = saved_stdout
+            sys.stderr = saved_stderr
+            if _RUNNER._RUNNER_STDIO_LOG_FP is not None and _RUNNER._RUNNER_STDIO_LOG_FP not in (
+                sys.__stdout__,
+                sys.__stderr__,
+            ):
                 _RUNNER._RUNNER_STDIO_LOG_FP.close()
             _RUNNER._RUNNER_STDIO_LOG_FP = original_log_fp
             _RUNNER._RUNNER_STDIO_KEEPALIVE_FDS = original_keepalive
@@ -142,6 +152,8 @@ def test_redirect_process_stdio_skips_mirror_outside_github_actions(self) -> Non
             workdir = Path(td)
             original_log_fp = _RUNNER._RUNNER_STDIO_LOG_FP
             original_keepalive = _RUNNER._RUNNER_STDIO_KEEPALIVE_FDS
+            saved_stdout = sys.stdout
+            saved_stderr = sys.stderr
             with mock.patch.dict(os.environ, {}, clear=True):
                 _RUNNER._RUNNER_STDIO_LOG_FP = None
                 _RUNNER._RUNNER_STDIO_KEEPALIVE_FDS = (11, 12)
@@ -151,7 +163,12 @@ def test_redirect_process_stdio_skips_mirror_outside_github_actions(self) -> Non
                             _RUNNER._redirect_process_stdio_to_log(workdir)
             self.assertEqual(dup2_mock.call_count, 2)
             start_mirror.assert_not_called()
-            if _RUNNER._RUNNER_STDIO_LOG_FP is not None:
+            sys.stdout = saved_stdout
+            sys.stderr = saved_stderr
+            if _RUNNER._RUNNER_STDIO_LOG_FP is not None and _RUNNER._RUNNER_STDIO_LOG_FP not in (
+                sys.__stdout__,
+                sys.__stderr__,
+            ):
                 _RUNNER._RUNNER_STDIO_LOG_FP.close()
             _RUNNER._RUNNER_STDIO_LOG_FP = original_log_fp
             _RUNNER._RUNNER_STDIO_KEEPALIVE_FDS = original_keepalive
@@ -225,6 +242,20 @@ def test_log_chunk_tail_and_before_window(self) -> None:
             self.assertEqual(older["text"], "2345")
             self.assertEqual(older["start"], 2)
 
+    def test_service_log_resolve_read_path_prefers_latest_daily_shard(self) -> None:
+        with tempfile.TemporaryDirectory() as td:
+            workdir = Path(td)
+            (workdir / "test_runner.2026-06-19.log").write_text("old\n", encoding="utf-8")
+            (workdir / "test_runner.2026-06-20.log").write_text("new\n", encoding="utf-8")
+            resolved = _RUNNER._service_log_resolve_read_path(
+                workdir,
+                filename=_RUNNER.RUNNER_STDIO_LOG_FILENAME,
+            )
+            self.assertEqual(
+                resolved,
+                (workdir / "test_runner.2026-06-20.log").resolve(),
+            )
+
     def test_ops_logs_base_url_derives_from_controller_proxy(self) -> None:
         url = _RUNNER._ui_ops_logs_base_url("http://127.0.0.1:19080/r/ops/fluxon_testbed")
         self.assertEqual(url, "http://127.0.0.1:19080/logs")
diff --git a/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py b/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py
new file mode 100644
index 0000000..c06c033
--- /dev/null
+++ b/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py
@@ -0,0 +1,112 @@
+#!/usr/bin/env python3
+
+from __future__ import annotations
+
+import importlib.util
+import sys
+import tempfile
+import unittest
+from pathlib import Path
+from unittest import mock
+
+import yaml
+
+
+REPO_ROOT = Path(__file__).resolve().parents[2]
+MODULE_PATH = REPO_ROOT / "fluxon_test_stack" / "top_attention_test_index" / "_log_mgmt.py"
+
+
+def _load_module():
+    module_dir = MODULE_PATH.parent
+    sys.path.insert(0, str(module_dir))
+    try:
+        spec = importlib.util.spec_from_file_location("fluxon_test_stack_top_attention_log_mgmt_contract", MODULE_PATH)
+        assert spec is not None and spec.loader is not None
+        mod = importlib.util.module_from_spec(spec)
+        sys.modules[spec.name] = mod
+        spec.loader.exec_module(mod)
+        return mod
+    finally:
+        if sys.path and sys.path[0] == str(module_dir):
+            sys.path.pop(0)
+
+
+_ENTRY = _load_module()
+
+
+class TestTopAttentionLogMgmtContract(unittest.TestCase):
+    def test_main_accepts_case_config_and_runs_canonical_tests(self) -> None:
+        with tempfile.TemporaryDirectory() as td:
+            run_dir = Path(td)
+            cfg_dir = run_dir / "configs"
+            cfg_dir.mkdir(parents=True)
+            case_cfg = cfg_dir / "ci_scene_config.yaml"
+            case_cfg.write_text(
+                yaml.safe_dump(
+                    {
+                        "case": {
+                            "scene_id": "ci_top_attention_log_mgmt",
+                            "scale_id": "n1_kvowner_dram_20gib",
+                            "profile_id": "fluxon_tcp_thread",
+                            "case_id": "ci_top_attention_log_mgmt__n1_kvowner_dram_20gib__fluxon_tcp_thread",
+                        },
+                        "scene_config": {
+                            "enabled": True,
+                        },
+                        "scene_runtime": {
+                            "etcd": {"ip": "127.0.0.1", "port": 19180},
+                            "greptime": {"ip": "127.0.0.1", "port": 19190},
+                        },
+                    },
+                    sort_keys=False,
+                ),
+                encoding="utf-8",
+            )
+
+            python_calls: list[tuple[str, tuple[str, ...]]] = []
+
+            def fake_run_python_file(description: str, path: str, extra_args=()):
+                del description
+                python_calls.append((path, tuple(extra_args)))
+                return 0
+
+            with mock.patch.object(_ENTRY, "run_python_file", side_effect=fake_run_python_file):
+                with mock.patch.object(_ENTRY, "run_cargo", return_value=0) as run_cargo:
+                    with mock.patch.object(
+                        sys,
+                        "argv",
+                        [str(MODULE_PATH), "--case-config", str(case_cfg), "--", "--nocapture"],
+                    ):
+                        rc = _ENTRY.main()
+
+            self.assertEqual(rc, 0)
+            self.assertEqual(
+                python_calls,
+                [
+                    ("deployment/tests/test_log_shard.py", ("--", "--nocapture")),
+                    (
+                        "deployment/tests/test_selection_supervisor_codegen.py",
+                        ("--test-id", "runtime_log_path_uses_daily_shard_files", "--", "--nocapture"),
+                    ),
+                    (
+                        "deployment/tests/test_selection_supervisor_codegen.py",
+                        ("--test-id", "runtime_log_shards_roll_and_preserve_content_boundaries", "--", "--nocapture"),
+                    ),
+                ],
+            )
+            self.assertEqual(
+                run_cargo.call_args.args[0],
+                [
+                    "test",
+                    "--manifest-path",
+                    str(REPO_ROOT / "fluxon_rs" / "fluxon_util" / "Cargo.toml"),
+                    "--test",
+                    "log_mgmt",
+                    "--",
+                    "--nocapture",
+                ],
+            )
+
+
+if __name__ == "__main__":
+    raise SystemExit(unittest.main())
diff --git a/fluxon_test_stack/top_attention_test_index/README.md b/fluxon_test_stack/top_attention_test_index/README.md
index d81c346..2894ddf 100644
--- a/fluxon_test_stack/top_attention_test_index/README.md
+++ b/fluxon_test_stack/top_attention_test_index/README.md
@@ -47,6 +47,7 @@ Entries:
 - `_fs_remote_mount.py`: heavier Fluxon FS remote mount integration coverage
 - `_test_stack_contract.py`: test-stack runner contract coverage
 - `_deployment_codegen.py`: deployment code generation coverage
+- `_log_mgmt.py`: shared-supervisor ops log rolling plus Rust KV log sharding coverage. `ci_test_list.yaml` exposes this wrapper as the formal `ci_top_attention_log_mgmt` scene, and `test_runner.py` dispatches to it through the runner-native `top_attention` CI execution model.
 - `_script_tools.py`: script utility coverage
 - `_cargo_fs_core.py`: cargo tests for the Rust FS core crate
 - `_cargo_util.py`: cargo tests for the Rust util crate
diff --git a/fluxon_test_stack/top_attention_test_index/_log_mgmt.py b/fluxon_test_stack/top_attention_test_index/_log_mgmt.py
new file mode 100644
index 0000000..e3547ab
--- /dev/null
+++ b/fluxon_test_stack/top_attention_test_index/_log_mgmt.py
@@ -0,0 +1,54 @@
+#!/usr/bin/env python3
+from __future__ import annotations
+
+import argparse
+
+from _common import REPO_ROOT, load_case_config, run_cargo, run_python_file
+
+
+TEST_REQUIREMENTS = ["cargo", "etcd", "ops", "submodules"]
+SCENE_ID = "ci_top_attention_log_mgmt"
+
+
+def main() -> int:
+    parser = argparse.ArgumentParser(
+        description="Flat index entry for shared-supervisor ops log rolling and Rust KV log sharding coverage."
+    )
+    parser.add_argument(
+        "--case-config",
+        help="Canonical CI case config YAML emitted by test_runner.",
+    )
+    args, passthrough = parser.parse_known_args()
+    if args.case_config:
+        _ = load_case_config(args.case_config, expected_scene_id=SCENE_ID)
+
+    rc = run_python_file(
+        "Flat index entry for ops/shared-supervisor log shard helper coverage.",
+        "deployment/tests/test_log_shard.py",
+        extra_args=tuple(passthrough),
+    )
+    if rc != 0:
+        return rc
+    for test_id in (
+        "runtime_log_path_uses_daily_shard_files",
+        "runtime_log_shards_roll_and_preserve_content_boundaries",
+    ):
+        rc = run_python_file(
+            "Flat index entry for ops/shared-supervisor log routing coverage.",
+            "deployment/tests/test_selection_supervisor_codegen.py",
+            extra_args=("--test-id", test_id, *passthrough),
+        )
+        if rc != 0:
+            return rc
+    return run_cargo([
+        "test",
+        "--manifest-path",
+        str(REPO_ROOT / "fluxon_rs" / "fluxon_util" / "Cargo.toml"),
+        "--test",
+        "log_mgmt",
+        *passthrough,
+    ])
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/scripts/git_source_selection.py b/scripts/git_source_selection.py
new file mode 100644
index 0000000..491a0c1
--- /dev/null
+++ b/scripts/git_source_selection.py
@@ -0,0 +1,163 @@
+from __future__ import annotations
+
+import subprocess
+from pathlib import Path
+from typing import Callable
+
+import yaml
+
+
+DEFAULT_RATHER_NO_GIT_SUBMODULE_CONFIG_RELPATH = Path(
+    "setup_and_pack/rather_no_git_submodule.yaml"
+)
+
+
+def collect_git_listed_source_relpaths(
+    *,
+    repo_root: Path,
+    git_root: Path,
+    rel_prefix: str = "",
+    is_excluded: Callable[[str], bool],
+) -> list[str]:
+    """List git-known files under *git_root* as repo-relative POSIX paths.
+
+    Runs ``git ls-files`` in *git_root* for tracked plus untracked,
+    non-ignored entries. Each entry is prefixed with *rel_prefix*, then
+    dropped when *is_excluded* returns True or when it no longer exists
+    under *repo_root* (e.g. deleted but still indexed).
+
+    Raises subprocess.CalledProcessError when git exits non-zero.
+    """
+    listing = subprocess.check_output(
+        ["git", "ls-files", "--cached", "--others", "--exclude-standard", "-z"],
+        cwd=str(git_root),
+    )
+    prefix = rel_prefix.strip("/")
+    kept: list[str] = []
+    # -z yields NUL-terminated, unquoted names: use them verbatim, because
+    # trimming whitespace would corrupt names that begin or end with a space.
+    for name in filter(None, listing.decode("utf-8").split("\0")):
+        repo_rel = f"{prefix}/{name}" if prefix else name
+        if is_excluded(repo_rel):
+            continue
+        if not (repo_root / repo_rel).resolve().exists():
+            continue
+        kept.append(repo_rel)
+    return kept
+
+
+def load_rather_no_git_submodule_source_roots(
+    *,
+    repo_root: Path,
+    context_name: str,
+) -> tuple[tuple[str, Path], ...]:
+    """Read the rather_no_git_submodule config and resolve its module roots.
+
+    Returns ``(relpath, resolved_dir)`` pairs in config order, duplicates
+    dropped. A missing or empty config, or one without ``modules``, yields
+    ``()``. Raises RuntimeError for malformed config, for paths leaving the
+    repo root, and for configured paths that are not directories
+    (*context_name* is used in that last message).
+    """
+    config_path = (repo_root / DEFAULT_RATHER_NO_GIT_SUBMODULE_CONFIG_RELPATH).resolve()
+    if not config_path.exists():
+        return ()
+    raw_cfg = yaml.safe_load(config_path.read_text(encoding="utf-8"))
+    if raw_cfg is None:
+        return ()
+    if not isinstance(raw_cfg, dict):
+        raise RuntimeError(f"rather_no_git_submodule config must be a YAML mapping: {config_path}")
+    raw_modules = raw_cfg.get("modules")
+    if raw_modules is None:
+        return ()
+    if not isinstance(raw_modules, list):
+        raise RuntimeError(f"rather_no_git_submodule config `modules` must be a list: {config_path}")
+
+    resolved_repo_root = repo_root.resolve()
+    roots_by_relpath: dict[str, Path] = {}
+    for position, entry in enumerate(raw_modules):
+        where = f"{config_path} modules[{position}]"
+        if not isinstance(entry, dict):
+            raise RuntimeError(f"rather_no_git_submodule config entries must be mappings: {where}")
+        configured = entry.get("path")
+        if not (isinstance(configured, str) and configured.strip()):
+            raise RuntimeError(
+                f"rather_no_git_submodule config path must be a non-empty string: {where}.path"
+            )
+        candidate = Path(configured.strip())
+        # Lexical check first: reject absolute paths and any ".." component.
+        if candidate.is_absolute() or ".." in candidate.parts:
+            raise RuntimeError(
+                "rather_no_git_submodule config path must stay within the repo root: "
+                f"{where}.path={configured!r}"
+            )
+        relpath = candidate.as_posix()
+        # Repeated entries for the same path are ignored.
+        if relpath in roots_by_relpath:
+            continue
+        # Then re-check after resolution, which also follows symlinks.
+        module_root = (resolved_repo_root / candidate).resolve()
+        inside_repo = module_root == resolved_repo_root or resolved_repo_root in module_root.parents
+        if not inside_repo:
+            raise RuntimeError(
+                f"rather_no_git_submodule config path escapes the repo root: {where}.path={configured!r}"
+            )
+        if not module_root.is_dir():
+            raise RuntimeError(
+                f"{context_name} requires configured rather_no_git_submodule path "
+                f"to exist as a directory: path={relpath} resolved={module_root}"
+            )
+        roots_by_relpath[relpath] = module_root
+    return tuple(roots_by_relpath.items())
+
+
+def collect_source_relpaths_with_rather_no_git_submodule(
+    *,
+    repo_root: Path,
+    source_roots: tuple[str, ...],
+    is_excluded: Callable[[str], bool],
+    empty_selection_error: str,
+    rather_no_git_submodule_context_name: str,
+) -> list[str]:
+    """Return the sorted, de-duplicated relpaths selected for a source profile.
+
+    Source roots that are files are taken as-is (unless excluded), directory
+    roots are expanded through ``git ls-files``, and missing roots are
+    skipped. Directories named in the rather_no_git_submodule config are
+    expanded the same way. Raises RuntimeError(empty_selection_error) when
+    nothing was selected.
+    """
+    base = repo_root.resolve()
+    found: set[str] = set()
+
+    def add_git_listing(git_root: Path, prefix: str) -> None:
+        found.update(
+            collect_git_listed_source_relpaths(
+                repo_root=base, git_root=git_root, rel_prefix=prefix, is_excluded=is_excluded
+            )
+        )
+
+    for root in source_roots:
+        root_path = (base / root).resolve()
+        if root_path.is_file():
+            file_relpath = Path(root).as_posix()
+            if not is_excluded(file_relpath):
+                found.add(file_relpath)
+        elif root_path.exists():
+            add_git_listing(root_path, "" if root == "." else root)
+    module_roots = load_rather_no_git_submodule_source_roots(
+        repo_root=base, context_name=rather_no_git_submodule_context_name
+    )
+    for module_relpath, module_root in module_roots:
+        add_git_listing(module_root, module_relpath)
+    if not found:
+        raise RuntimeError(empty_selection_error)
+    return sorted(found)
+
+
+__all__ = [
+    "DEFAULT_RATHER_NO_GIT_SUBMODULE_CONFIG_RELPATH",
+    "collect_git_listed_source_relpaths",
+    "collect_source_relpaths_with_rather_no_git_submodule",
+    "load_rather_no_git_submodule_source_roots",
+]
diff --git a/scripts/source_selection_profiles.py b/scripts/source_selection_profiles.py
new file mode 100644
index 0000000..6c7493c
--- /dev/null
+++ b/scripts/source_selection_profiles.py
@@ -0,0 +1,134 @@
+from __future__ import annotations
+
+from dataclasses import dataclass, field
+from pathlib import Path
+import sys
+
+SCRIPT_DIR = Path(__file__).resolve().parent
+script_dir_str = str(SCRIPT_DIR)
+if script_dir_str in sys.path:  # drop an existing entry before re-inserting it at the front
+    sys.path.remove(script_dir_str)
+sys.path.insert(0, script_dir_str)  # first on sys.path so the sibling import below resolves to this directory
+
+import git_source_selection as git_source_selection_utils
+
+
+SOURCE_SELECTION_PROFILE_BUILD_SEED = "build_seed"
+SOURCE_SELECTION_PROFILE_SOURCE_PACK = "source_pack"
+SOURCE_SELECTION_PROFILES = (
+    SOURCE_SELECTION_PROFILE_BUILD_SEED,
+    SOURCE_SELECTION_PROFILE_SOURCE_PACK,
+)
+
+BUILD_SEED_SOURCE_ROOTS: tuple[str, ...] = (
+    "README.md",
+    "setup.py",
+    "deployment",
+    "fluxon_py",
+    "fluxon_release/closed_sdk",
+    "fluxon_rs",
+    "scripts/git_source_selection.py",
+    "scripts/source_selection_profiles.py",
+    "setup_and_pack",
+)
+SOURCE_PACK_SOURCE_ROOTS: tuple[str, ...] = (".",)
+
+BUILD_SEED_INCLUDED_RELPATHS: frozenset[str] = frozenset(
+    {
+        "fluxon_release/closed_sdk/manifest.json",
+        "setup_and_pack/pub_prepare_build.yaml",
+    }
+)
+SOURCE_PACK_EXCLUDED_RELPATH_PREFIXES: tuple[str, ...] = (
+    ".dever/",
+    "fluxon_release/",
+    "skills/",
+)
+SOURCE_PACK_EXCLUDED_RELPATH_NAMES: frozenset[str] = frozenset(
+    {
+        ".DS_Store",
+    }
+)
+
+
+@dataclass(frozen=True)
+class SourceSelectionProfileSpec:  # immutable per-profile settings for source selection
+    source_roots: tuple[str, ...]  # repo-relative files/directories the selection starts from
+    empty_selection_error: str  # RuntimeError text used when nothing is selected
+    rather_no_git_submodule_context_name: str  # label used in the missing-module-directory error
+    include_relpaths: frozenset[str] = field(default_factory=frozenset)  # relpaths that are never excluded
+
+
+BUILD_SEED_PROFILE_SPEC = SourceSelectionProfileSpec(
+    source_roots=BUILD_SEED_SOURCE_ROOTS,
+    empty_selection_error="public workspace source selection produced no files",
+    rather_no_git_submodule_context_name="public workspace source selection",
+    include_relpaths=BUILD_SEED_INCLUDED_RELPATHS,
+)
+SOURCE_PACK_PROFILE_SPEC = SourceSelectionProfileSpec(
+    source_roots=SOURCE_PACK_SOURCE_ROOTS,
+    empty_selection_error="git-based CI source selection produced no files",
+    rather_no_git_submodule_context_name="CI source pack",
+)
+
+
+def get_source_profile_spec(*, profile: str) -> SourceSelectionProfileSpec:
+    """Return the spec registered for *profile*; raise ValueError if unknown."""
+    if profile == SOURCE_SELECTION_PROFILE_SOURCE_PACK:
+        return SOURCE_PACK_PROFILE_SPEC
+    if profile != SOURCE_SELECTION_PROFILE_BUILD_SEED:
+        detail = f"unsupported source selection profile: {profile!r}; expected one of {SOURCE_SELECTION_PROFILES}"
+        raise ValueError(detail)
+    return BUILD_SEED_PROFILE_SPEC
+
+
+def get_source_profile_source_roots(*, profile: str) -> tuple[str, ...]:
+    return get_source_profile_spec(profile=profile).source_roots  # thin accessor; unknown profiles raise ValueError in the lookup
+
+
+def source_profile_relpath_excluded(*, profile: str, relpath: str) -> bool:
+    """Return True when *relpath* must be left out of *profile*'s selection.
+
+    include_relpaths always win; only source_pack excludes: by file name at any depth or by path prefix.
+    """
+    spec = get_source_profile_spec(profile=profile)
+    normalized = relpath.strip("/")
+    if not normalized:
+        return True
+    if normalized in spec.include_relpaths or profile != SOURCE_SELECTION_PROFILE_SOURCE_PACK:
+        return False
+    if normalized.rpartition("/")[2] in SOURCE_PACK_EXCLUDED_RELPATH_NAMES:  # basename, so nested .DS_Store match too
+        return True
+    prefixes = SOURCE_PACK_EXCLUDED_RELPATH_PREFIXES
+    return any(normalized == p.rstrip("/") or normalized.startswith(p) for p in prefixes)
+
+
+def collect_source_profile_relpaths(*, repo_root: Path, profile: str) -> tuple[str, ...]:
+    """Collect the sorted relpaths that *profile* selects under *repo_root*, as a tuple."""
+    spec = get_source_profile_spec(profile=profile)
+    def is_excluded(relpath: str) -> bool:
+        return source_profile_relpath_excluded(profile=profile, relpath=relpath)
+
+    relpaths = git_source_selection_utils.collect_source_relpaths_with_rather_no_git_submodule(
+        repo_root=repo_root,
+        source_roots=spec.source_roots,
+        is_excluded=is_excluded,
+        empty_selection_error=spec.empty_selection_error,
+        rather_no_git_submodule_context_name=spec.rather_no_git_submodule_context_name,
+    )
+    return tuple(relpaths)
+
+
+__all__ = [
+    "BUILD_SEED_SOURCE_ROOTS",
+    "SOURCE_PACK_SOURCE_ROOTS",
+    "SOURCE_PACK_EXCLUDED_RELPATH_NAMES",
+    "SOURCE_PACK_EXCLUDED_RELPATH_PREFIXES",
+    "SOURCE_SELECTION_PROFILE_BUILD_SEED",
+    "SOURCE_SELECTION_PROFILE_SOURCE_PACK",
+    "SOURCE_SELECTION_PROFILES",
+    "collect_source_profile_relpaths",
+    "get_source_profile_source_roots",
+    "get_source_profile_spec",
+    "source_profile_relpath_excluded",
+]
diff --git a/setup_and_pack/nix/lib_layout.py b/setup_and_pack/nix/lib_layout.py
index 05ac4b0..8322a55 100644
--- a/setup_and_pack/nix/lib_layout.py
+++ b/setup_and_pack/nix/lib_layout.py
@@ -10,7 +10,7 @@
 import yaml
 
 from setup_and_pack.public_workspace_contract import (
-    PUBLIC_WORKSPACE_INPUT_RELATIVE_PATHS,
+    collect_public_workspace_input_relative_paths,
     _copy_public_workspace_input_path,
     _sanitize_public_workspace_input,
 )
@@ -48,35 +48,6 @@
     ("manylinux", "cargo_registry_dir"): "manylinux-cache/cargo-registry",
     ("manylinux", "cargo_git_dir"): "manylinux-cache/cargo-git",
 }
-BRIDGE_PREBUILT_WORKSPACE_SEED_EXTRA_RELATIVE_PATHS = (
-    "setup_and_pack/nix",
-    "setup_and_pack/lib_tool.py",
-    "setup_and_pack/pyscript_util.py",
-    "setup_and_pack/closed_sdk_contract.py",
-    "setup_and_pack/public_workspace_contract.py",
-    "setup_and_pack/pub_prepare_build.py",
-    "setup_and_pack/pub_prepare_build.yaml",
-    "setup_and_pack/utils/wheel_runtime_helper.py",
-    "setup_and_pack/utils",
-    "deployment/utils/placeholder_utils.py",
-    "deployment/utils/proc_lifecycle_codegen.py",
-    "deployment/utils/selection_supervisor_codegen.py",
-    "fluxon_release/closed_sdk",
-    "fluxon_rs/fluxon_commu_contract",
-    "fluxon_rs/fluxon_commu",
-    "fluxon_rs/fluxon_commu_closed_sdk_consumer",
-    "fluxon_rs/Cargo.lock",
-)
-BRIDGE_PREBUILT_WORKSPACE_SEED_RELATIVE_PATHS = tuple(
-    dict.fromkeys(
-        (
-            *PUBLIC_WORKSPACE_INPUT_RELATIVE_PATHS,
-            *BRIDGE_PREBUILT_WORKSPACE_SEED_EXTRA_RELATIVE_PATHS,
-        )
-    )
-)
-
-
 @dataclass(frozen=True)
 class AssemblyRefs:
     baseline_path: str
@@ -757,7 +728,9 @@ def _materialize_bridge_prebuilt_workspace_seed(*, source_root: Path, target_roo
     _remove_stale_derived_entry(path=target_root)
     target_root.mkdir(parents=True, exist_ok=True)
     target_root.chmod(0o777)
-    for relative_path in BRIDGE_PREBUILT_WORKSPACE_SEED_RELATIVE_PATHS:
+    for relative_path in collect_public_workspace_input_relative_paths(
+        repo_root=source_root
+    ):
         source_path = source_root / relative_path
         if not source_path.exists():
             raise RuntimeError(
diff --git a/setup_and_pack/nix/pack_fluxonkv_pylib.py b/setup_and_pack/nix/pack_fluxonkv_pylib.py
index c44df13..e12f8fe 100644
--- a/setup_and_pack/nix/pack_fluxonkv_pylib.py
+++ b/setup_and_pack/nix/pack_fluxonkv_pylib.py
@@ -43,6 +43,9 @@
     CLOSED_SDK_CONSUMER_BOUNDARY_MODE,
     rewrite_fluxon_native_export_bundle,
 )
+from setup_and_pack.public_workspace_contract import (
+    collect_public_workspace_input_relative_paths,
+)
 from utils.sudo_prefix_utils import host_sudo_prefix
 import utils as script_utils
 ABI3_SMOKE_TEST_INTERPRETERS = (
@@ -142,11 +145,6 @@
     )
 )
 SUPPORTED_TARGET_CACHE_GENERATOR_KINDS = frozenset()
-REQUIRED_DEPLOYMENT_UTIL_FILES_FOR_PYO3_BUILD = (
-    "placeholder_utils.py",
-    "proc_lifecycle_codegen.py",
-    "selection_supervisor_codegen.py",
-)
 TEMP_WORKSPACE_MOUNT_DIRS: list[Path] = []
 
 
@@ -160,54 +158,6 @@ def _cleanup_temp_workspace_mount_dirs() -> None:
 
 
 atexit.register(_cleanup_temp_workspace_mount_dirs)
-REQUIRED_DEPLOYMENT_UTIL_RELATIVE_PATHS_FOR_PYO3_BUILD = tuple(
-    f"deployment/utils/{name}" for name in REQUIRED_DEPLOYMENT_UTIL_FILES_FOR_PYO3_BUILD
-)
-PYO3_WORKSPACE_HELPER_RELATIVE_PATHS = (
-    "fluxon_rs/rust-toolchain.toml",
-    "setup_and_pack/lib_tool.py",
-    "setup_and_pack/pyscript_util.py",
-    "setup_and_pack/closed_sdk_contract.py",
-    "setup_and_pack/public_workspace_contract.py",
-    "setup_and_pack/pub_prepare_build.py",
-    "setup_and_pack/pub_prepare_build.yaml",
-    "setup_and_pack/nix/pack_release_in_container.py",
-    "setup_and_pack/utils/wheel_runtime_helper.py",
-    "setup_and_pack/nix/lib_layout.py",
-)
-PYO3_INPUT_RELATIVE_PATHS_COMMON = (
-    "fluxon_rs/Cargo.toml",
-    "fluxon_rs/Cargo.lock",
-    "fluxon_rs/.cargo",
-    "fluxon_rs/rust-toolchain.toml",
-    "fluxon_rs/fluxon_commu_contract",
-    "fluxon_rs/fluxon_commu_closed_sdk_consumer",
-    "fluxon_rs/fluxon_pyo3",
-    "fluxon_rs/limit_thirdparty",
-    "fluxon_rs/fluxon_commu",
-    "fluxon_rs/fluxon_kv",
-    "fluxon_rs/fluxon_framework",
-    "fluxon_rs/fluxon_framework_compiled",
-    "fluxon_rs/fluxon_util",
-    "fluxon_rs/fluxon_mq",
-    "fluxon_rs/fluxon_cli",
-    "fluxon_rs/fluxon_ops",
-    "fluxon_rs/fluxon_proxy_proto",
-    "fluxon_rs/fluxon_proxy",
-    "fluxon_rs/fluxon_fs",
-    "fluxon_rs/fluxon_fs_core",
-    "fluxon_rs/fluxon_fs_s3_gateway",
-    "fluxon_rs/fluxon_observability",
-    "fluxon_rs/moka",
-    "fluxon_py",
-    "fluxon_release/closed_sdk",
-    "setup_and_pack/nix/lib_layout.py",
-    "setup_and_pack/closed_sdk_contract.py",
-    "setup_and_pack/public_workspace_contract.py",
-    "setup_and_pack/lib_tool.py",
-    "setup_and_pack/pyscript_util.py",
-    *REQUIRED_DEPLOYMENT_UTIL_RELATIVE_PATHS_FOR_PYO3_BUILD,
-)
 PYO3_INPUT_RELATIVE_PATHS_BY_TRANSPORT_BACKEND = {
     "fastws": (),
     "tquic": (),
@@ -218,15 +168,6 @@ def _cleanup_temp_workspace_mount_dirs() -> None:
 PYO3_INPUT_RELATIVE_PATHS_BY_RDMA_BACKEND = {
     "closed_sdk": ("fluxon_release/closed_sdk",),
 }
-PYO3_WORKSPACE_COPY_RELATIVE_PATHS_PUBLIC_NATIVE = ()
-PYO3_WORKSPACE_COPY_RELATIVE_PATHS_COMMON = tuple(
-    relative_path
-    for relative_path in (
-        *PYO3_INPUT_RELATIVE_PATHS_COMMON,
-        *PYO3_WORKSPACE_COPY_RELATIVE_PATHS_PUBLIC_NATIVE,
-        *PYO3_WORKSPACE_HELPER_RELATIVE_PATHS,
-    )
-)
 TRANSPORT_BACKEND_FEATURES = {
     "fastws": ["fastws_transport"],
     "tquic": ["tquic_transport"],
@@ -257,90 +198,6 @@ def _cleanup_temp_workspace_mount_dirs() -> None:
     "libstdc++.so.6",
     "libgomp.so.1",
 )
-IGNORED_FILE_SUFFIXES = (
-    ".gitignore",
-    ".pkl",
-    ".pyc",
-    ".md",
-    ".rst",
-    ".html",
-    ".htm",
-    ".xml",
-    ".css",
-    ".js",
-    ".map",
-    ".png",
-    ".jpg",
-    ".jpeg",
-    ".gif",
-    ".bmp",
-    ".svg",
-    ".ico",
-    ".pdf",
-    ".ppt",
-    ".pptx",
-    ".doc",
-    ".docx",
-    ".pem",
-    ".crt",
-    ".crl",
-    ".key",
-    ".csr",
-    ".p12",
-    ".der",
-    ".serial",
-    ".old",
-    ".orig",
-    ".rej",
-    ".tar",
-    ".tar.gz",
-    ".tgz",
-    ".tar.xz",
-    ".txz",
-    ".tar.bz2",
-    ".tbz2",
-    ".zip",
-    ".7z",
-    ".xz",
-    ".bz2",
-    ".gz",
-)
-IGNORED_DIR_NAMES = {
-    ".git",
-    "__pycache__",
-    "target",
-    "wheels",
-    "docs",
-    "doc",
-    "doxygen",
-    "examples",
-    "example",
-    "tests",
-    "test",
-    "testdata",
-    "bench",
-    "benches",
-    "benchmark",
-    "benchmarks",
-    "fuzz",
-    "fuzzers",
-    "packagecache",
-    "wycheproof_testvectors",
-    "tfprof",
-}
-IGNORED_FILE_NAMES = (
-    PYO3_CHECKSUM_FILE_NAME,
-    "configure~",
-)
-
-
-def _pyo3_input_relative_paths(transport_backend: str, rdma_backend: str) -> tuple[str, ...]:
-    return (
-        PYO3_INPUT_RELATIVE_PATHS_COMMON
-        + PYO3_INPUT_RELATIVE_PATHS_BY_TRANSPORT_BACKEND[transport_backend]
-        + PYO3_INPUT_RELATIVE_PATHS_BY_RDMA_BACKEND[rdma_backend]
-    )
-
 
 def _dedupe_relative_paths(relative_paths: tuple[str, ...]) -> tuple[str, ...]:
     ordered_relative_paths: list[str] = []
@@ -354,11 +211,13 @@ def _dedupe_relative_paths(relative_paths: tuple[str, ...]) -> tuple[str, ...]:
 
 
 def pyo3_workspace_copy_relative_paths(transport_backend: str, rdma_backend: str) -> tuple[str, ...]:
-    return _dedupe_relative_paths(
-        PYO3_WORKSPACE_COPY_RELATIVE_PATHS_COMMON
-        + PYO3_INPUT_RELATIVE_PATHS_BY_TRANSPORT_BACKEND[transport_backend]
-        + PYO3_INPUT_RELATIVE_PATHS_BY_RDMA_BACKEND[rdma_backend]
-    )
+    del transport_backend  # accepted but unused: the selection below does not depend on the backends
+    del rdma_backend
+    return collect_public_workspace_input_relative_paths(repo_root=REPO_ROOT)  # build_seed profile relpaths for this checkout
+
+
+def _pyo3_input_relative_paths(transport_backend: str, rdma_backend: str) -> tuple[str, ...]:
+    return pyo3_workspace_copy_relative_paths(transport_backend, rdma_backend)  # digest inputs are the same list as the workspace copy list
 
 
 def _wheel_variant_key(transport_backend: str, rdma_backend: str) -> str:
@@ -435,9 +294,9 @@ def _compute_inputs_digest(repo_root: Path, relative_paths: tuple[str, ...]) ->
         relative_to=repo_root,
         mode=script_utils.PathDigestMode.CONTENTS_ONLY,
         algorithm=script_utils.PathHashAlgorithm.MD5,
-        ignored_dir_names=IGNORED_DIR_NAMES,
-        ignored_file_names=IGNORED_FILE_NAMES,
-        ignored_file_suffixes=IGNORED_FILE_SUFFIXES,
+        ignored_dir_names=(),
+        ignored_file_names=(),
+        ignored_file_suffixes=(),
     )
 
 
@@ -593,33 +452,6 @@ def current_checksum(self) -> str:
             _pyo3_input_relative_paths(self.transport_backend, self.rdma_backend),
         ) + f"|transport_backend={self.transport_backend}|rdma_backend={self.rdma_backend}"
 
-    def _legacy_checksum_map(self) -> dict[str, str]:
-        file_hash: dict[str, str] = {}
-        for current_root, dirnames, filenames in os.walk(self.rs_root, topdown=True):
-            current_root_path = Path(current_root)
-            root_rel = current_root_path.relative_to(self.rs_root).as_posix()
-            root_text = current_root_path.as_posix()
-            if root_rel == "target" or root_rel.startswith("target/"):
-                dirnames[:] = []
-                continue
-            if root_rel == "wheels" or root_rel.startswith("wheels/"):
-                dirnames[:] = []
-                continue
-            if "/.git/" in root_text or root_text.endswith("/.git"):
-                dirnames[:] = []
-                continue
-            dirnames[:] = sorted(dir_name for dir_name in dirnames if dir_name != ".git")
-            for file_name in sorted(filenames):
-                if file_name in IGNORED_FILE_NAMES or file_name.endswith(IGNORED_FILE_SUFFIXES):
-                    continue
-                file_path = current_root_path / file_name
-                hash_md5 = hashlib.md5()
-                with open(file_path, "rb") as f:
-                    for chunk in iter(lambda: f.read(4096), b""):
-                        hash_md5.update(chunk)
-                file_hash[file_path.relative_to(self.rs_root).as_posix()] = hash_md5.hexdigest()
-        return file_hash
-
     def find_cached_wheel(self) -> Path | None:
         if not self.target_wheels_dir.exists():
             return None
@@ -2976,12 +2808,15 @@ def _build_published_profile_manifest(
     selected_backend_plan: dict,
     native_build_authority: dict | None,
 ) -> dict:
-    workspace_seed_digest = _compute_inputs_digest(
-        workspace_seed_dir,
-        _public_workspace_seed_relative_paths(
-            transport_backend,
-            rdma_backend=selected_backend_plan["rdma_backend"],
-        ),
+    del transport_backend
+    workspace_seed_digest = script_utils.compute_paths_digest(
+        [workspace_seed_dir],
+        relative_to=workspace_seed_dir,
+        mode=script_utils.PathDigestMode.CONTENTS_ONLY,
+        algorithm=script_utils.PathHashAlgorithm.MD5,
+        ignored_dir_names=(),
+        ignored_file_names=(),
+        ignored_file_suffixes=(),
     )
     manifest = {
         "object_kind": "FluxonManylinuxPublishedProfile",
@@ -3137,18 +2972,19 @@ def _copy_workspace_seed_subset(
     transport_backend: str,
     rdma_backend: str,
 ) -> None:
+    del transport_backend
+    del rdma_backend
     target_workspace_seed_dir.mkdir(parents=True, exist_ok=True)
     target_workspace_seed_dir.chmod(0o777)
-    for relative_path in _public_workspace_seed_relative_paths(
-        transport_backend,
-        rdma_backend=rdma_backend,
-    ):
-        source_path = source_workspace_seed_dir / relative_path
-        if not source_path.exists():
-            raise RuntimeError(
-                f"workspace seed path is missing required publish input: {source_path}"
-            )
+    for source_path in sorted(source_workspace_seed_dir.rglob("*")):
+        if source_path == source_workspace_seed_dir:
+            continue
+        relative_path = source_path.relative_to(source_workspace_seed_dir)
         target_path = target_workspace_seed_dir / relative_path
+        if source_path.is_dir() and not source_path.is_symlink():
+            target_path.mkdir(parents=True, exist_ok=True)
+            target_path.chmod(0o777)
+            continue
         target_path.parent.mkdir(parents=True, exist_ok=True)
         target_path.parent.chmod(0o777)
         _sudo_copy_path(source_path=source_path, target_path=target_path)
@@ -3248,10 +3084,6 @@ def _run_with_tee_log(*, argv: list[str], log_path: Path) -> None:
 
     if return_code != 0:
         raise RuntimeError(f"docker run failed with exit code {return_code}, log={log_path}")
-def _public_workspace_seed_relative_paths(transport_backend: str, *, rdma_backend: str) -> tuple[str, ...]:
-    return pyo3_workspace_copy_relative_paths(transport_backend, rdma_backend)
-
-
 def _require_workspace_seed_fluxon_commu_source_dir(*, workspace_seed_dir: Path, field_name: str) -> Path:
     source_dir = workspace_seed_dir / FLUXON_COMMU_AUTHORITY_RELATIVE_PATH
     cargo_toml_path = source_dir / "Cargo.toml"
diff --git a/setup_and_pack/public_workspace_contract.py b/setup_and_pack/public_workspace_contract.py
index 5cd6b50..cb1574e 100644
--- a/setup_and_pack/public_workspace_contract.py
+++ b/setup_and_pack/public_workspace_contract.py
@@ -1,47 +1,46 @@
 from __future__ import annotations
 
+import os
 import shutil
+import sys
 from pathlib import Path
 
+REPO_ROOT = Path(__file__).resolve().parent.parent
+SCRIPTS_DIR = REPO_ROOT / "scripts"
+scripts_dir_str = str(SCRIPTS_DIR)
+if scripts_dir_str in sys.path:
+    sys.path.remove(scripts_dir_str)
+sys.path.insert(0, scripts_dir_str)
 
-PUBLIC_WORKSPACE_INPUT_RELATIVE_PATHS = (
-    "setup.py",
-    "fluxon_py",
-    "fluxon_release/closed_sdk",
-    "fluxon_rs/Cargo.toml",
-    "fluxon_rs/Cargo.lock",
-    "fluxon_rs/.cargo",
-    "fluxon_rs/rust-toolchain.toml",
-    "fluxon_rs/fluxon_commu_contract",
-    "fluxon_rs/fluxon_commu_closed_sdk_consumer",
-    "fluxon_rs/fluxon_commu",
-    "fluxon_rs/fluxon_pyo3",
-    "fluxon_rs/limit_thirdparty",
-    "fluxon_rs/fluxon_kv",
-    "fluxon_rs/fluxon_framework",
-    "fluxon_rs/fluxon_framework_compiled",
-    "fluxon_rs/fluxon_util",
-    "fluxon_rs/fluxon_mq",
-    "fluxon_rs/fluxon_cli",
-    "fluxon_rs/fluxon_ops",
-    "fluxon_rs/fluxon_proxy_proto",
-    "fluxon_rs/fluxon_proxy",
-    "fluxon_rs/fluxon_fs",
-    "fluxon_rs/fluxon_fs_core",
-    "fluxon_rs/fluxon_fs_s3_gateway",
-    "fluxon_rs/fluxon_observability",
-    "fluxon_rs/moka",
+from source_selection_profiles import (
+    SOURCE_SELECTION_PROFILE_BUILD_SEED,
+    collect_source_profile_relpaths,
 )
 
 
 def _copy_public_workspace_input_path(source_path: Path, target_path: Path) -> None:
     target_path.parent.mkdir(parents=True, exist_ok=True)
+    if source_path.is_symlink():  # recreate the link itself rather than copying what it points to
+        if target_path.exists() or target_path.is_symlink():  # is_symlink() also catches a dangling link at the target
+            if target_path.is_dir() and not target_path.is_symlink():  # a real directory needs a recursive delete
+                shutil.rmtree(target_path)
+            else:
+                target_path.unlink()
+        os.symlink(os.readlink(source_path), target_path)  # same link text as the source, not a resolved path
+        return
     if source_path.is_dir():
         shutil.copytree(source_path, target_path, symlinks=True, dirs_exist_ok=True)
         return
     shutil.copy2(source_path, target_path)
 
 
+def collect_public_workspace_input_relative_paths(*, repo_root: Path) -> tuple[str, ...]:
+    """Return the repo-relative paths selected by the build_seed source profile."""
+    return collect_source_profile_relpaths(
+        profile=SOURCE_SELECTION_PROFILE_BUILD_SEED, repo_root=repo_root
+    )
+
+
 def _sanitize_public_workspace_input(*, workspace_root: Path) -> None:
     for pycache_dir in workspace_root.rglob("__pycache__"):
         shutil.rmtree(pycache_dir, ignore_errors=True)
@@ -51,9 +50,8 @@ def _sanitize_public_workspace_input(*, workspace_root: Path) -> None:
         except FileNotFoundError:
             pass
 
-
 __all__ = [
-    "PUBLIC_WORKSPACE_INPUT_RELATIVE_PATHS",
+    "collect_public_workspace_input_relative_paths",
     "_copy_public_workspace_input_path",
     "_sanitize_public_workspace_input",
 ]
diff --git a/setup_and_pack/tests/test_git_source_selection_utils.py b/setup_and_pack/tests/test_git_source_selection_utils.py
new file mode 100644
index 0000000..b28d64d
--- /dev/null
+++ b/setup_and_pack/tests/test_git_source_selection_utils.py
@@ -0,0 +1,182 @@
+from __future__ import annotations
+
+import importlib.util
+import sys
+import tempfile
+import unittest
+from pathlib import Path
+from unittest import mock
+
+
+REPO_ROOT = Path(__file__).resolve().parents[2]
+MODULE_PATH = REPO_ROOT / "scripts" / "git_source_selection.py"
+PROFILE_MODULE_PATH = REPO_ROOT / "scripts" / "source_selection_profiles.py"
+
+
+def _load_module():
+    """Import scripts/git_source_selection.py under a test-only module name."""
+    module_name = "scripts_git_source_selection_test"
+    spec = importlib.util.spec_from_file_location(module_name, MODULE_PATH)
+    assert spec is not None and spec.loader is not None
+    module = importlib.util.module_from_spec(spec)
+    # Registered in sys.modules before the module body is executed.
+    sys.modules[spec.name] = module
+    spec.loader.exec_module(module)
+    return module
+
+
+_MOD = _load_module()
+
+
+def _load_profile_module():
+    """Import scripts/source_selection_profiles.py with scripts/ first on sys.path."""
+    scripts_dir = str(REPO_ROOT / "scripts")
+    # Move scripts/ to the front of sys.path before the module is executed.
+    if scripts_dir in sys.path:
+        sys.path.remove(scripts_dir)
+    sys.path.insert(0, scripts_dir)
+    module_name = "scripts_source_selection_profiles_test"
+    spec = importlib.util.spec_from_file_location(module_name, PROFILE_MODULE_PATH)
+    assert spec is not None and spec.loader is not None
+    module = importlib.util.module_from_spec(spec)
+    sys.modules[spec.name] = module
+    spec.loader.exec_module(module)
+    return module
+
+
+_PROFILE_MOD = _load_profile_module()
+
+
+class GitSourceSelectionUtilsTest(unittest.TestCase):  # covers the two scripts/ modules loaded into _MOD and _PROFILE_MOD
+    def test_collect_source_relpaths_with_rather_no_git_submodule_merges_module_sources(self) -> None:
+        with tempfile.TemporaryDirectory() as tmpdir:
+            repo_root = Path(tmpdir)
+            (repo_root / "README.md").write_text("repo\n", encoding="utf-8")
+            module_root = repo_root / "fluxon_rs" / "moka"
+            (module_root / "src").mkdir(parents=True, exist_ok=True)
+            (module_root / "Cargo.toml").write_text("module\n", encoding="utf-8")
+            (module_root / "src" / "lib.rs").write_text("pub fn x() {}\n", encoding="utf-8")
+            cfg_path = repo_root / "setup_and_pack" / "rather_no_git_submodule.yaml"
+            cfg_path.parent.mkdir(parents=True, exist_ok=True)
+            cfg_path.write_text(
+                "modules:\n"
+                "  - path: fluxon_rs/moka\n"
+                "    repo: https://example.com/moka.git\n"
+                "    checkout: main\n",
+                encoding="utf-8",
+            )
+
+            def fake_check_output(argv, cwd=None):  # stands in for git ls-files; the answer depends only on cwd
+                del argv
+                cwd_path = Path(cwd).resolve()
+                if cwd_path == repo_root.resolve():
+                    return b"README.md\0"
+                if cwd_path == module_root.resolve():
+                    return b"Cargo.toml\0src/lib.rs\0"
+                raise AssertionError(f"unexpected git ls-files cwd: {cwd_path}")
+
+            with mock.patch.object(_MOD.subprocess, "check_output", side_effect=fake_check_output):
+                relpaths = _MOD.collect_source_relpaths_with_rather_no_git_submodule(
+                    repo_root=repo_root,
+                    source_roots=("README.md",),  # a file root: selected directly, no git listing involved
+                    is_excluded=lambda _relpath: False,
+                    empty_selection_error="no files",
+                    rather_no_git_submodule_context_name="test source selection",
+                )
+
+            self.assertEqual(
+                relpaths,
+                [
+                    "README.md",
+                    "fluxon_rs/moka/Cargo.toml",
+                    "fluxon_rs/moka/src/lib.rs",
+                ],
+            )
+
+    def test_load_rather_no_git_submodule_source_roots_uses_context_name_in_missing_dir_error(self) -> None:
+        with tempfile.TemporaryDirectory() as tmpdir:
+            repo_root = Path(tmpdir)
+            cfg_path = repo_root / "setup_and_pack" / "rather_no_git_submodule.yaml"
+            cfg_path.parent.mkdir(parents=True, exist_ok=True)
+            cfg_path.write_text(
+                "modules:\n"
+                "  - path: fluxon_rs/moka\n"
+                "    repo: https://example.com/moka.git\n"
+                "    checkout: main\n",
+                encoding="utf-8",
+            )
+
+            with self.assertRaisesRegex(  # fluxon_rs/moka is never created, so the directory check must fail
+                RuntimeError,
+                "test source selection requires configured rather_no_git_submodule path to exist",
+            ):
+                _MOD.load_rather_no_git_submodule_source_roots(
+                    repo_root=repo_root,
+                    context_name="test source selection",
+                )
+
+    def test_source_profiles_only_add_inclusions_beyond_gitignore(self) -> None:  # source_pack excludes its prefixes; build_seed excludes none of these
+        self.assertTrue(
+            _PROFILE_MOD.source_profile_relpath_excluded(
+                profile=_PROFILE_MOD.SOURCE_SELECTION_PROFILE_SOURCE_PACK,
+                relpath=".dever/run.log",
+            )
+        )
+        self.assertTrue(
+            _PROFILE_MOD.source_profile_relpath_excluded(
+                profile=_PROFILE_MOD.SOURCE_SELECTION_PROFILE_SOURCE_PACK,
+                relpath="fluxon_release/install.py",
+            )
+        )
+        self.assertTrue(
+            _PROFILE_MOD.source_profile_relpath_excluded(
+                profile=_PROFILE_MOD.SOURCE_SELECTION_PROFILE_SOURCE_PACK,
+                relpath="skills/demo/SKILL.md",
+            )
+        )
+        self.assertFalse(
+            _PROFILE_MOD.source_profile_relpath_excluded(
+                profile=_PROFILE_MOD.SOURCE_SELECTION_PROFILE_BUILD_SEED,
+                relpath="fluxon_release/closed_sdk/manifest.json",
+            )
+        )
+        self.assertFalse(
+            _PROFILE_MOD.source_profile_relpath_excluded(
+                profile=_PROFILE_MOD.SOURCE_SELECTION_PROFILE_BUILD_SEED,
+                relpath="fluxon_doc_cn/roadmap.md",
+            )
+        )
+        self.assertFalse(
+            _PROFILE_MOD.source_profile_relpath_excluded(
+                profile=_PROFILE_MOD.SOURCE_SELECTION_PROFILE_BUILD_SEED,
+                relpath="deployment/utils/log_shard.py",
+            )
+        )
+        self.assertFalse(
+            _PROFILE_MOD.source_profile_relpath_excluded(
+                profile=_PROFILE_MOD.SOURCE_SELECTION_PROFILE_BUILD_SEED,
+                relpath="scripts/source_selection_profiles.py",
+            )
+        )
+        self.assertFalse(
+            _PROFILE_MOD.source_profile_relpath_excluded(
+                profile=_PROFILE_MOD.SOURCE_SELECTION_PROFILE_BUILD_SEED,
+                relpath="fluxon_rs/moka/examples/append_value_async.rs",
+            )
+        )
+        self.assertFalse(
+            _PROFILE_MOD.source_profile_relpath_excluded(
+                profile=_PROFILE_MOD.SOURCE_SELECTION_PROFILE_BUILD_SEED,
+                relpath="fluxon_rs/moka/tests/entry_api_sync.rs",
+            )
+        )
+        self.assertFalse(
+            _PROFILE_MOD.source_profile_relpath_excluded(
+                profile=_PROFILE_MOD.SOURCE_SELECTION_PROFILE_BUILD_SEED,
+                relpath="fluxon_rs/fluxon_cli/templates/landing.html",
+            )
+        )
+
+
+if __name__ == "__main__":
+    raise SystemExit(unittest.main())
diff --git a/setup_and_pack/tests/test_lib_layout.py b/setup_and_pack/tests/test_lib_layout.py
index dd19442..6d05d54 100644
--- a/setup_and_pack/tests/test_lib_layout.py
+++ b/setup_and_pack/tests/test_lib_layout.py
@@ -14,6 +14,10 @@
 
 
 def _load_lib_layout():
+    repo_root_str = str(REPO_ROOT)
+    if repo_root_str in sys.path:
+        sys.path.remove(repo_root_str)
+    sys.path.insert(0, repo_root_str)
     spec = importlib.util.spec_from_file_location("setup_and_pack_nix_lib_layout_test", LIB_LAYOUT_PATH)
     assert spec is not None and spec.loader is not None
     mod = importlib.util.module_from_spec(spec)
@@ -83,14 +87,17 @@ def test_bridge_prebuilt_materializes_workspace_seed(self) -> None:
             self.assertTrue(workspace_seed_dir.is_dir())
             self.assertTrue((workspace_seed_dir / "setup_and_pack/closed_sdk_contract.py").is_file())
             self.assertTrue((workspace_seed_dir / "setup_and_pack/public_workspace_contract.py").is_file())
+            self.assertTrue((workspace_seed_dir / "README.md").is_file())
             self.assertTrue((workspace_seed_dir / "fluxon_rs/fluxon_commu_contract/Cargo.toml").is_file())
             self.assertTrue((workspace_seed_dir / "fluxon_rs/fluxon_commu/Cargo.toml").is_file())
+            self.assertTrue((workspace_seed_dir / "fluxon_rs/fluxon_ops/build.rs").is_file())
             self.assertTrue((workspace_seed_dir / "fluxon_release/closed_sdk/manifest.json").is_file())
             self.assertTrue((workspace_seed_dir / "setup_and_pack/nix/pack_fluxonkv_pylib.py").is_file())
             self.assertTrue((workspace_seed_dir / "setup_and_pack/nix/pack_release_in_container.py").is_file())
             self.assertTrue((workspace_seed_dir / "setup_and_pack/utils/__init__.py").is_file())
             self.assertTrue((workspace_seed_dir / "setup_and_pack/utils/sudo_prefix_utils.py").is_file())
             self.assertTrue((workspace_seed_dir / "setup_and_pack/utils/wheel_runtime_helper.py").is_file())
+            self.assertTrue((workspace_seed_dir / "deployment/utils/log_shard.py").is_file())
             self.assertTrue((workspace_seed_dir / "fluxon_rs/fluxon_kv/Cargo.toml").is_file())
             self.assertTrue((workspace_seed_dir / "fluxon_rs/Cargo.lock").is_file())
             self.assertTrue((workspace_seed_dir / "fluxon_rs/moka/Cargo.toml").is_file())
diff --git a/setup_and_pack/tests/test_pack_fluxonkv_pylib_bridge_prebuilt.py b/setup_and_pack/tests/test_pack_fluxonkv_pylib_bridge_prebuilt.py
index db1bcd7..bae0e86 100644
--- a/setup_and_pack/tests/test_pack_fluxonkv_pylib_bridge_prebuilt.py
+++ b/setup_and_pack/tests/test_pack_fluxonkv_pylib_bridge_prebuilt.py
@@ -38,6 +38,39 @@ def _load_module():
 
 
 class BridgePrebuiltAuthorityMaterializationTest(unittest.TestCase):
+    def test_pyo3_workspace_inputs_follow_dynamic_public_workspace_selection(self) -> None:  # Checks membership of the relpaths returned for tcp_thread / closed_sdk.
+        relpaths = _PACKMOD.pyo3_workspace_copy_relative_paths(
+            transport_backend="tcp_thread",
+            rdma_backend="closed_sdk",
+        )
+
+        self.assertIn("README.md", relpaths)  # This and the next four paths must be part of the returned selection.
+        self.assertIn("deployment/utils/log_shard.py", relpaths)
+        self.assertIn("fluxon_rs/fluxon_ops/build.rs", relpaths)
+        self.assertIn("fluxon_rs/moka/examples/append_value_async.rs", relpaths)
+        self.assertIn("fluxon_rs/fluxon_cli/templates/landing.html", relpaths)
+        self.assertNotIn("skills/browser-helm/SKILL.md", relpaths)  # This and the next path must be absent from the selection.
+        self.assertNotIn("fluxon_doc_cn/roadmap.md", relpaths)
+
+    def test_pyo3_workspace_digest_tracks_selected_template_inputs(self) -> None:  # The inputs digest must differ after a listed file's content changes.
+        with tempfile.TemporaryDirectory() as tmpdir:
+            repo_root = Path(tmpdir)  # Throwaway root that holds only the template file created below.
+            landing_path = repo_root / "fluxon_rs" / "fluxon_cli" / "templates" / "landing.html"
+            landing_path.parent.mkdir(parents=True, exist_ok=True)
+            landing_path.write_text("v1\n", encoding="utf-8")
+
+            digest_before = _PACKMOD._compute_inputs_digest(
+                repo_root,
+                ("fluxon_rs/fluxon_cli/templates/landing.html",),
+            )
+            landing_path.write_text("v2\n", encoding="utf-8")  # Same relative path, different content.
+            digest_after = _PACKMOD._compute_inputs_digest(
+                repo_root,
+                ("fluxon_rs/fluxon_cli/templates/landing.html",),
+            )
+
+            self.assertNotEqual(digest_before, digest_after)  # Identical digests would mean the content change went unnoticed.
+
     def test_host_side_materialization_only_creates_placeholders(self) -> None:
         with tempfile.TemporaryDirectory() as tmpdir:
             build_root = Path(tmpdir)
diff --git a/setup_and_pack/utils/__init__.py b/setup_and_pack/utils/__init__.py
index df414f6..3921245 100644
--- a/setup_and_pack/utils/__init__.py
+++ b/setup_and_pack/utils/__init__.py
@@ -10,6 +10,7 @@
     _iter_digest_entries,
     build_cached_tarball,
     compute_paths_digest,
+    prune_stage_paths,
     rsync_stage,
     tar_gz,
     tarball_rule,
@@ -66,6 +67,7 @@
     "ArtifactRule",
     "tarball_rule",
     "build_cached_tarball",
+    "prune_stage_paths",
     "rsync_stage",
     "tar_gz",
     "_iter_digest_entries",
diff --git a/setup_and_pack/utils/artifact_cache_digest_utils.py b/setup_and_pack/utils/artifact_cache_digest_utils.py
index 11739ef..d3780e3 100644
--- a/setup_and_pack/utils/artifact_cache_digest_utils.py
+++ b/setup_and_pack/utils/artifact_cache_digest_utils.py
@@ -1,8 +1,10 @@
 from __future__ import annotations
 
 import enum
+import fnmatch
 import hashlib
 import os
+import shutil
 from dataclasses import dataclass
 from pathlib import Path
 from typing import Callable, Collection, Iterator, Sequence
@@ -19,6 +21,7 @@
     "ArtifactCheck",
     "ArtifactRule",
     "tarball_rule",
+    "prune_stage_paths",
     "build_cached_tarball",
     "rsync_stage",
     "tar_gz",
@@ -114,7 +117,14 @@ def build_cached_tarball(*, rule: ArtifactRule, out_path: Path, build_tarball: C
     rule.write_stamp(check.digest)
 
 
-def rsync_stage(*, repo_root: Path, src: Path, dst: Path, honor_gitignore: bool) -> None:
+def rsync_stage(
+    *,
+    repo_root: Path,
+    src: Path,
+    dst: Path,
+    honor_gitignore: bool,
+    exclude_rel_paths: tuple[str, ...] = (),
+) -> None:
     if not src.exists():
         print(f"Missing required source path for staging: {src}")
         raise SystemExit(1)
@@ -132,6 +142,8 @@ def rsync_stage(*, repo_root: Path, src: Path, dst: Path, honor_gitignore: bool)
             "--exclude-from=.gitignore",
             "--filter=:- .gitignore",
         ]
+    for pattern in exclude_rel_paths:
+        argv.append(f"--exclude={pattern}")
     if src.is_dir():
         argv += [str(src) + "/", str(dst) + "/"]
     else:
@@ -139,6 +151,21 @@ def rsync_stage(*, repo_root: Path, src: Path, dst: Path, honor_gitignore: bool)
     run_cmd_argv(argv, cwd=repo_root)
 
 
+def prune_stage_paths(stage_root: Path, exclude_rel_paths: tuple[str, ...]) -> None:  # Delete entries under stage_root whose relative path or basename matches an exclude pattern.
+    if not stage_root.exists():  # Nothing has been staged: no-op.
+        return
+    for path in sorted(stage_root.rglob("*"), reverse=True):  # Reverse-sorted snapshot; presumably so descendants are handled before their ancestors.
+        rel_path = path.relative_to(stage_root).as_posix()  # "/"-separated path relative to stage_root, used for matching.
+        for pattern in exclude_rel_paths:
+            normalized_pattern = pattern.rstrip("/")  # Drop trailing "/" so directory-style patterns can match.
+            if fnmatch.fnmatch(rel_path, normalized_pattern) or fnmatch.fnmatch(path.name, normalized_pattern):  # NOTE(review): fnmatch "*" also matches "/", unlike rsync --exclude in rsync_stage; confirm both treat these patterns as intended.
+                if path.is_dir() and not path.is_symlink():  # Real directories are removed recursively; symlinks fall through to unlink.
+                    shutil.rmtree(path)
+                else:
+                    path.unlink(missing_ok=True)  # missing_ok tolerates an entry that is already gone.
+                break  # One matching pattern is enough; continue with the next path.
+
+
 def tar_gz(
     *,
     cwd: Path,
diff --git a/skills/browser-helm/SKILL.md b/skills/browser-helm/SKILL.md
new file mode 100644
index 0000000..dbe1afd
--- /dev/null
+++ b/skills/browser-helm/SKILL.md
@@ -0,0 +1,232 @@
+---
+name: browser-helm
+description: Helm-only browser runtime workflow for operating Browser Helm managed tabs via `browser-helm`, with namespaced `browser` / `tab` / `page` / `picker` / `events` commands and namespaced `.tmp/browser-helm/` output conventions.
+allowed-tools: Bash(*)
+---
+
+# 用 `browser-helm` 操作 Browser Helm 受控标签页
+
+当用户想通过 **Helm-only runtime** 操作浏览器，而不是使用通用 `agent-browser` 时，使用这个 skill。
+
+适用场景：
+
+- 需要列出已连接浏览器 / managed tab
+- 需要创建 managed tab 并 attach debugger
+- 需要执行 `page navigate` / `page click` / `page eval` / `page wait` / `page type` / `page press` / `page summary` / `page snapshot` / `page screenshot`
+- 需要通过 picker 获取/清空最近一次选中元素的 metadata（无需用户粘贴 JSON）
+- 需要遵守 `browser-helm` 当前的输出与落盘约定
+
+不适用场景：
+
+- 用户明确要用通用 `agent-browser` / noVNC 工作流
+- 用户只是要解释代码，不需要运行 `browser-helm`
+
+## 默认工作流（新主路径）
+
+默认 Base URL：`http://127.0.0.1:5181`（不需要设置环境变量）。
+
+如需覆盖（可选）：在命令前追加 `--base-url http://127.0.0.1:5181`。
+
+如本机未全局安装 `browser-helm`，也可以用 `node browser-helm/dist/cli.js` 替代下方命令。
+
+## 多人/多 AI 会话（互信）约定（重要）
+
+当前产品定位下，daemon / Web UI / WS **默认不做鉴权**，更偏向“同一局域网多人互信”的协作模型。
+
+但为了避免 **同一台浏览器 + 多个 AI 对话** 时出现“串台/误操作”，推荐强制使用 `session` 做操作隔离：
+
+- 每个 AI 对话固定用一个 `--session <name>`（或设置环境变量 `BROWSER_HELM_SESSION=<name>`）
+- `session` 会隔离：
+  - CLI context 落盘：`.tmp/browser-helm/context.json`（default）或 `.tmp/browser-helm/sessions/<session>/context.json`
+  - CLI 输出落盘：`.tmp/browser-helm/<type>/...`（default）或 `.tmp/browser-helm/sessions/<session>/<type>/...`
+  - `tab create` 会自动加前缀：`[session:<session>] ...`（用于人类/AI 识别归属）
+- `tab list --mine` 只在非 default session 下可用（通过 note 前缀过滤“我这条会话创建的 tab”）
+
+注意：`session` 只是“操作习惯/隔离约定”，**不是安全边界**。知道 `managed-tab-id` 仍然能跨 session 操作；不要把端口暴露到不可信网络。
+
+### 前置（必须）：安装插件并配对
+
+`browser-helm` 的所有浏览器动作都依赖 **Chrome 插件已连接 daemon（WebSocket）**：
+
+- 创建 managed tab 时建议提供 `--note <text>`，用于描述这个 tab 的意图/用途。
+  - 若省略 `--note` 且提供 URL，CLI 会自动生成：`打开页面：<url>`
+
+- 若 `browser-helm browser list` 一直为空，优先判断是「插件未安装/未 Connect」而不是 CLI 出错。
+
+一次性配对步骤：
+
+1) 启动 daemon
+
+```bash
+browser-helm daemon ensure
+```
+
+（可选）如需重启：
+
+```bash
+browser-helm daemon restart
+```
+
+2) 用 Chrome 打开 Web UI（用“Chrome 能访问到的地址”打开）
+
+- Web UI：`http://127.0.0.1:5181`
+- 页面上会显示 `Pairing Code`（推荐）以及 `WS URL`/`Pairing Token`（Advanced）
+
+3) 安装扩展（Unpacked）
+
+- 在 Web UI 点击“下载插件 zip”，解压
+- 打开 `chrome://extensions`，开启开发者模式
+- 点击“加载已解压的扩展程序”，选择解压后的目录
+
+4) 插件配对（Connect）
+
+- 打开扩展弹窗
+- 粘贴 Web UI 中的 `Pairing Code`，点击 `Connect`
+- （可选）点一次 `Status` 确认连接 OK
+- Advanced：也可手填 `WS URL` + `Pairing Token`
+
+5) CLI 验证插件已连接
+
+```bash
+browser-helm browser list
+```
+
+### 默认动作流
+
+1. 确保 `Browser Helm daemon` 已启动（AI 可通过 CLI 直接启动/拉起）
+
+```bash
+browser-helm daemon ensure
+```
+
+注：`daemon ensure` 会启动内置的预编译 daemon（当前提供 `linux-x64`），不要求用户安装 `cargo`。
+
+2. 确认扩展已连接，并列出浏览器
+
+```bash
+browser-helm browser list
+```
+
+3. （推荐）Pin 默认 browser/tab（减少长对话遗忘成本）
+
+```bash
+browser-helm context use-browser <browser-id>
+browser-helm context use-tab <managed-tab-id>
+browser-helm context show
+```
+
+4. 列 tab；如无 tab，则创建新 tab
+
+```bash
+browser-helm browser list
+browser-helm tab list <browser-id>
+browser-helm tab create <browser-id> https://example.com --note "说明这个 tab 的用途"
+```
+
+5. （可选）显式 `tab attach` debugger
+
+`tab create` / `page navigate` 已会自动 ensure debugger attach（用于更早捕获 network/console）。如果你准备在浏览器里手动刷新/导航，也建议先 `tab attach`。
+
+```bash
+browser-helm tab attach <browser-id> <managed-tab-id>
+```
+
+6. 页面分析优先走返回值主路
+
+```bash
+browser-helm page summary <browser-id> <managed-tab-id>
+browser-helm page snapshot <browser-id> <managed-tab-id>
+```
+
+7. 只有在需要留档时才显式保存 `page summary` / `page snapshot`
+
+```bash
+browser-helm --save page summary <browser-id> <managed-tab-id>
+browser-helm --save page snapshot <browser-id> <managed-tab-id>
+```
+
+8. `page screenshot` 默认会落盘；`page click` 会走受控页遮罩下的程序化点击
+
+```bash
+browser-helm page click <browser-id> <managed-tab-id> '#selector'
+browser-helm page click <browser-id> <managed-tab-id> '#selector' --wait-text 'Finished working' --timeout-ms 15000
+browser-helm page eval <browser-id> <managed-tab-id> '1+1'
+browser-helm page wait <browser-id> <managed-tab-id> --until-text 'Finished working' --timeout-ms 15000
+browser-helm page type <browser-id> <managed-tab-id> 'div[aria-label="Composer"]' 'hello'
+browser-helm page press <browser-id> <managed-tab-id> 'Enter'
+browser-helm page screenshot <browser-id> <managed-tab-id>
+```
+
+9. 推荐先 `page snapshot` 生成 `@iN` refs，再用 ref 操作（类似 agent-browser 的 `@eN`）
+
+```bash
+browser-helm page snapshot <browser-id> <managed-tab-id>
+browser-helm page click @i1
+browser-helm page type @i2 'hello'
+```
+
+10. 如用户在 SidePanel 做了元素选择（Start Picking），AI 可直接从 daemon 拉取最近一次选择结果
+
+```bash
+browser-helm picker last
+browser-helm picker clear
+```
+
+### 交互录制（用户手动复现）
+
+当你需要「AI 先打开受控 tab，然后用户自己操作复现问题，再让 AI 回看」时，可以开启交互录制：
+
+```bash
+# 记录起始时间（ms）
+t0=$(date +%s%3N)
+
+# 开始录制（会注入监听脚本，并临时隐藏遮罩，允许用户点击/输入）
+browser-helm recorder start <browser-id> <managed-tab-id>
+
+# ...用户在该 tab 上手动复现...
+
+# 拉取复现阶段的交互/console/network 事件（按 since 过滤）
+browser-helm events interaction <browser-id> <managed-tab-id> --since $t0 --limit 2000
+browser-helm events console <browser-id> <managed-tab-id> --since $t0 --limit 2000
+browser-helm events network <browser-id> <managed-tab-id> --since $t0 --limit 2000
+
+# 停止录制（恢复遮罩）
+browser-helm recorder stop <browser-id> <managed-tab-id>
+```
+
+注意：交互录制会包含 input 的原始 value（不脱敏）。仅建议在互信/本地环境使用。
+
+## 输出与落盘约定
+
+- `page summary`：默认只打印；传 `output-path` 或 `--save` 时，写入 `.tmp/browser-helm/summaries/`
+- `page snapshot`：默认只打印；传 `output-path` 或 `--save` 时，写入 `.tmp/browser-helm/snapshots/`
+- `page screenshot`：默认写入 `.tmp/browser-helm/screenshots/`
+- 若使用 `--session <name>` / `BROWSER_HELM_SESSION=<name>`：上述目录会自动切换到 `.tmp/browser-helm/sessions/<session>/...`
+- 如用户显式提供路径，优先使用用户路径
+
+## 命令参考
+
+详细命令与示例见：[`browser-helm/skills/browser-helm/references/commands.md`]
+
+优先顺序建议：
+
+1. `browser list`
+2. `tab list`
+3. `tab create`（推荐写 `--note`；若省略且提供 URL，则自动生成 note）
+   - 或：`tab adopt-active`（接管当前活动 tab）
+4. `tab attach`
+5. `page navigate`
+6. `page summary` / `page snapshot`
+7. `page click` / `page screenshot`
+
+
+## 目录约定
+
+- 项目内 skill 源目录：[`browser-helm/skills/browser-helm/`]
+- 仓库根入口：[`skills/browser-helm/`]
+
+
+## 命令约定
+
+- 仅支持 namespaced 命令面：`browser list`、`tab create`、`page navigate`、`picker last` 等。
+- 默认文档路径改为 namespaced 形式：`browser list`、`tab create`、`page navigate`、`events console`、`picker last`。
diff --git a/skills/browser-helm/agents/openai.yaml b/skills/browser-helm/agents/openai.yaml
new file mode 100644
index 0000000..686f428
--- /dev/null
+++ b/skills/browser-helm/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: Browser Helm
+  short_description: 通过 browser-helm CLI 操作 Browser Helm 受控标签页的流程
+  default_prompt: Use $browser-helm to inspect and operate Browser Helm managed tabs.
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/browser-helm/references/commands.md b/skills/browser-helm/references/commands.md
new file mode 100644
index 0000000..d22d465
--- /dev/null
+++ b/skills/browser-helm/references/commands.md
@@ -0,0 +1,131 @@
+# `browser-helm` 命令参考
+
+## 前置（必须）：插件安装与配对
+
+CLI 能否操作浏览器，取决于 **Chrome 插件是否已连接 daemon（WebSocket）**。
+
+最小闭环步骤：
+
+```bash
+# 1) 启动/确保 daemon
+browser-helm daemon ensure
+browser-helm daemon status
+browser-helm daemon restart
+
+# 2) 在 Chrome 打开 Web UI（用 Chrome 能访问到的地址打开）
+#    http://127.0.0.1:5181
+#    从页面复制 Pairing Code（推荐；含多网卡候选地址）或 WS URL + Pairing Token（Advanced）
+#
+# 3) 安装扩展（Unpacked）
+#    - Web UI 下载插件 zip -> 解压
+#    - chrome://extensions 开启开发者模式 -> 加载已解压扩展
+#
+# 4) 插件弹窗填 Pairing Code -> Connect
+
+# 5) 验证浏览器已连接
+browser-helm browser list
+```
+
+## 基础命令（新主路径）
+
+```bash
+browser-helm daemon status
+browser-helm daemon ensure
+browser-helm daemon stop
+browser-helm daemon restart
+browser-helm status
+browser-helm browser list
+browser-helm tab list [browser-id] [--mine]
+browser-helm recorder start [browser-id] [managed-tab-id]
+browser-helm recorder stop [browser-id] [managed-tab-id]
+```
+
+## 受控 tab 生命周期
+
+```bash
+browser-helm tab create [browser-id] [url] [--note <text>]
+browser-helm tab adopt-active [browser-id] [--note <text>]
+browser-helm tab attach [browser-id] [managed-tab-id]
+browser-helm page navigate [browser-id] [managed-tab-id] <url>
+```
+
+## 交互与分析
+
+```bash
+browser-helm page click [browser-id] [managed-tab-id] <selector> [--wait-(selector|text|js) <value>] [--timeout-ms <n>] [--interval-ms <n>]
+browser-helm page eval [browser-id] [managed-tab-id] <expression>
+browser-helm page wait [browser-id] [managed-tab-id] --until-(selector|text|js) <value> [--timeout-ms <n>] [--interval-ms <n>]
+browser-helm page type [browser-id] [managed-tab-id] <selector> <text>
+browser-helm page press [browser-id] [managed-tab-id] <key>
+browser-helm page summary [browser-id] [managed-tab-id] [output-path]
+browser-helm page snapshot [browser-id] [managed-tab-id] [output-path]
+browser-helm page screenshot [browser-id] [managed-tab-id] [output-path]
+browser-helm events console [browser-id] [managed-tab-id] [--limit <n>] [--since <ms>]
+browser-helm events network [browser-id] [managed-tab-id] [--limit <n>] [--since <ms>]
+browser-helm events interaction [browser-id] [managed-tab-id] [--limit <n>] [--since <ms>]
+browser-helm picker last [browser-id] [managed-tab-id]
+browser-helm picker clear [browser-id] [managed-tab-id]
+```
+
+说明：
+
+- `page snapshot` 会生成可复用的 interactive refs：`@i1/@i2/...`（按 interactives 列表顺序）。
+- `page click @iN`、`page type @iN` 会把 ref 解析为 snapshot 中记录的 selector（落盘于 `.tmp/browser-helm/refs/<managed_tab_id>.json`，按 `--session` 隔离）。
+
+## Context（session-like，新主路径）
+
+长对话/长任务里，为了避免反复提供 `browser-id` / `managed-tab-id`，可以把默认对象写入本地 context：
+
+```bash
+browser-helm context use-browser <browser-id>
+browser-helm context use-tab <managed-tab-id>
+browser-helm context show
+browser-helm context clear
+```
+
+## 多 AI 对话隔离（推荐）
+
+为了避免“同一浏览器 + 多个 AI 对话”串台，建议为每条对话固定一个 `session`：
+
+```bash
+browser-helm --session chat-a browser list
+browser-helm --session chat-a tab list --mine
+browser-helm --session chat-a tab create <browser-id> https://example.com --note "这条对话的用途说明"
+```
+
+说明：
+
+- `tab create` 会自动加前缀：`[session:chat-a] ...`
+- `tab list --mine` 需要非 default session（否则会报错）
+
+## 输出约定
+
+- `page summary`
+  - 默认只打印
+  - `--save` 时默认落到 [`.tmp/browser-helm/summaries/`]
+- `page snapshot`
+  - 默认只打印
+  - `--save` 时默认落到 [`.tmp/browser-helm/snapshots/`]
+- `page screenshot`
+  - 默认落到 [`.tmp/browser-helm/screenshots/`]
+- 若使用 `--session <name>` / `BROWSER_HELM_SESSION=<name>`：上述目录会自动切换到 [`.tmp/browser-helm/sessions/<session>/...`]
+
+## 推荐示例
+
+```bash
+browser-helm browser list
+browser-helm tab create <browser-id> https://example.com --note "说明这个 tab 的用途"
+browser-helm tab attach <browser-id> <managed-tab-id>
+browser-helm page snapshot <browser-id> <managed-tab-id>
+browser-helm --save page summary <browser-id> <managed-tab-id>
+browser-helm page screenshot <browser-id> <managed-tab-id>
+```
+
+说明：
+
+- `tab create` 若省略 `--note` 且提供 URL，会自动生成：`打开页面：<url>`
+
+## 命令约定
+
+- 仅支持 namespaced 命令面：`browser list`、`tab create`、`tab attach`、`page navigate`、`picker last` 等。
+- 文档与 skill 后续默认都以 namespaced 命令作为主路径。
diff --git a/skills/canvas-dag_organizer-v1/SKILL.md b/skills/canvas-dag_organizer-v1/SKILL.md
new file mode 100644
index 0000000..db3dc0d
--- /dev/null
+++ b/skills/canvas-dag_organizer-v1/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "canvas-dag_organizer-v1"
+description: "Canvas DAG Organizer v1"
+metadata:
+  short-description: "Canvas DAG Organizer v1"
+---
+
+# Canvas DAG Organizer v1
+
+你是「Canvas DAG 可读性优化专家」(canvas_dag_organizer)。\n你的目标：基于当前 canvas 内容与 DAG（causal/timeline edges）结构，决定如何拆分/分组/调整空间布局，以最大化可读性。\n\n硬约束（必须遵守）：\n- 禁止要求用户手工编辑 `.canvas` / `.canvas.ext` JSON。\n- 你不能执行任何命令；你只能输出一个严格 JSON 对象（不要 markdown、不要 code fence、不要额外文本）。\n- 你输出的修改必须是“可复现/确定性”的（同一输入得到同一输出）。\n\n你会收到：\n- path + expectedCanvasSha256（并发保护）\n- scopeNodes / scopeEdges（允许你改动的子图范围）\n- 每个节点的 effective rect（考虑 ext.dx/dy/scale）\n\n你的输出 JSON schema（version=1）：\n{\n  "version": 1,\n  "kind": "canvas_dag_organize_apply_v1",\n  "path": "<same as input.path>",\n  "expectedCanvasSha256": "<same as input.expectedCanvasSha256>",\n  "summary": "一句话总结你做了什么（用于 UI 提示）",\n  "ops": [\n    // CanvasOpsRequestV1.ops: op=upsert_node|delete_node|upsert_edge|delete_edge\n  ]\n}\n\n重要规则：\n- 只允许改动 scope 内的 existing session nodes（移动/尺寸/文本等）与 existing edges。\n- 允许创建 group 节点用于分区（id 必须以 "group-" 开头；type="group"）。\n- 禁止删除任何 session 节点（dever_kind=session）。\n- 如果你删除 node，必须同时删除所有引用它的 edges（否则服务端会拒绝 apply）。\n- 优先做：分组 + 分层/泳道 + 对齐 + 留白；不要盲目网格化。
diff --git a/skills/canvas-dag_organizer-v1/agents/openai.yaml b/skills/canvas-dag_organizer-v1/agents/openai.yaml
new file mode 100644
index 0000000..f7ffc0e
--- /dev/null
+++ b/skills/canvas-dag_organizer-v1/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "Canvas DAG Organizer v1"
+  short_description: "Canvas DAG Organizer v1"
+  default_prompt: "Use $canvas-dag_organizer-v1."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/canvas-ops-v1/SKILL.md b/skills/canvas-ops-v1/SKILL.md
new file mode 100644
index 0000000..ffa8017
--- /dev/null
+++ b/skills/canvas-ops-v1/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "canvas-ops-v1"
+description: "Canvas Ops v1"
+metadata:
+  short-description: "Canvas Ops v1"
+---
+
+# Canvas Ops v1
+
+你是「Canvas 文件操作助手」(canvas_ops)。\n你的目标：对 `*.canvas` / `*.canvas.ext` 的任何修改，都必须通过项目内的脚本执行；禁止手工编辑 JSON。\n\n唯一允许的执行入口：\n- `.dever/tools/canvas_ops/canvas_ops.sh`\n- 配置：`.dever/tools/canvas_ops/config.json`\n\n硬约束：\n- 你只能生成 `apply` 需要的 request JSON（version=1），并给出一条可执行命令来调用脚本。\n- 禁止直接输出/粘贴完整 `.canvas` 内容作为“修改后的文件”。\n- 如果需要删除 node：必须同时显式删除所有依赖该 node 的 edges（否则脚本会拒绝执行）。\n\n你的输出格式（两段，且仅两段）：\n(1) request JSON（纯 JSON，不要 markdown，不要 code fence）\n(2) 一段 bash 命令（用 heredoc 把 JSON 送进脚本；命令内必须显式传 `-w` 与 `-c`）\n\n命令模板（把 <WORKDIR> 替换为项目根；一般是 `.`）：\n.dever/tools/canvas_ops/canvas_ops.sh apply -w <WORKDIR> -c .dever/tools/canvas_ops/config.json --request-stdin <<'JSON'\n{...}\nJSON\n\n建议（可选）：命令后再跑一次 validate，确认写盘结果可读且 ext sha 一致。
diff --git a/skills/canvas-ops-v1/agents/openai.yaml b/skills/canvas-ops-v1/agents/openai.yaml
new file mode 100644
index 0000000..5566cff
--- /dev/null
+++ b/skills/canvas-ops-v1/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: Canvas Ops v1
+  short_description: Canvas Ops v1
+  default_prompt: Use $canvas-ops-v1.
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/canvas-tidy_selection-v1/SKILL.md b/skills/canvas-tidy_selection-v1/SKILL.md
new file mode 100644
index 0000000..0dbfdf1
--- /dev/null
+++ b/skills/canvas-tidy_selection-v1/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "canvas-tidy_selection-v1"
+description: "Canvas Tidy Selection v1"
+metadata:
+  short-description: "Canvas Tidy Selection v1"
+---
+
+# Canvas Tidy Selection v1
+
+你是「Canvas 会话块整理专家」(canvas_tidy_selection)。\n你的目标：为“画布上选中的会话块”提供一键自动整理（确定性布局、可复现）。\n\n硬约束：\n- 禁止建议用户手工编辑 `.canvas` / `.canvas.ext` JSON。\n- 不要输出“修改后的完整 canvas 文件内容”。\n- 你只能输出（两段，且仅两段）：\n  (1) request JSON（纯 JSON，不要 markdown，不要 code fence）\n  (2) 一条 curl 命令（向 manager 的 tidy_selection API 发请求）。\n\n请求/响应（V1）约定：\n- Endpoint: POST /api/projects/:projectId/canvas/tidy_selection\n- request JSON schema (version=1):\n  - version: 1\n  - path: string  (project root 下的相对路径，必须以 .canvas 结尾)\n  - expectedCanvasSha256: string  (并发保护；必须来自最新 load 响应的 canvas_sha256)\n  - selectedSessionIds: string[]  (选中的会话块 node id 列表；会去重并保持稳定顺序)\n  - layout: { kind: "grid_sqrt_v1"; gapX: number; gapY: number }\n  - anchor: { kind: "keep_bounds_topleft_v1" }\n  - resetConnectedEdgeRoutes: boolean  (true 表示清空相关连线 ext 路由，回到默认路由)\n\ncurl 模板（把 <PROJECT_ID> 替换为实际 id）：\ncurl -sS -X POST 'http://localhost:8788/api/projects/<PROJECT_ID>/canvas/tidy_selection' \\n  -H 'Content-Type: application/json' \\n  -d '<REQUEST_JSON>'\n\n输出策略：\n- 不要向用户提问；基于已给信息直接产出最强可执行请求。\n- 若关键信息缺失（例如 projectId/path/sha/selected ids），在 request JSON 中用空值占位，并在 curl 命令中保留 <...> 占位符。
diff --git a/skills/canvas-tidy_selection-v1/agents/openai.yaml b/skills/canvas-tidy_selection-v1/agents/openai.yaml
new file mode 100644
index 0000000..120f1ac
--- /dev/null
+++ b/skills/canvas-tidy_selection-v1/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "Canvas Tidy Selection v1"
+  short_description: "Canvas Tidy Selection v1"
+  default_prompt: "Use $canvas-tidy_selection-v1."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/find-skills/SKILL.md b/skills/find-skills/SKILL.md
new file mode 100644
index 0000000..c797184
--- /dev/null
+++ b/skills/find-skills/SKILL.md
@@ -0,0 +1,133 @@
+---
+name: find-skills
+description: Helps users discover and install agent skills when they ask questions like "how do I do X", "find a skill for X", "is there a skill that can...", or express interest in extending capabilities. This skill should be used when the user is looking for functionality that might exist as an installable skill.
+---
+
+# Find Skills
+
+This skill helps you discover and install skills from the open agent skills ecosystem.
+
+## When to Use This Skill
+
+Use this skill when the user:
+
+- Asks "how do I do X" where X might be a common task with an existing skill
+- Says "find a skill for X" or "is there a skill for X"
+- Asks "can you do X" where X is a specialized capability
+- Expresses interest in extending agent capabilities
+- Wants to search for tools, templates, or workflows
+- Mentions they wish they had help with a specific domain (design, testing, deployment, etc.)
+
+## What is the Skills CLI?
+
+The Skills CLI (`npx skills`) is the package manager for the open agent skills ecosystem. Skills are modular packages that extend agent capabilities with specialized knowledge, workflows, and tools.
+
+**Key commands:**
+
+- `npx skills find [query]` - Search for skills interactively or by keyword
+- `npx skills add <package>` - Install a skill from GitHub or other sources
+- `npx skills check` - Check for skill updates
+- `npx skills update` - Update all installed skills
+
+**Browse skills at:** https://skills.sh/
+
+## How to Help Users Find Skills
+
+### Step 1: Understand What They Need
+
+When a user asks for help with something, identify:
+
+1. The domain (e.g., React, testing, design, deployment)
+2. The specific task (e.g., writing tests, creating animations, reviewing PRs)
+3. Whether this is a common enough task that a skill likely exists
+
+### Step 2: Search for Skills
+
+Run the find command with a relevant query:
+
+```bash
+npx skills find [query]
+```
+
+For example:
+
+- User asks "how do I make my React app faster?" → `npx skills find react performance`
+- User asks "can you help me with PR reviews?" → `npx skills find pr review`
+- User asks "I need to create a changelog" → `npx skills find changelog`
+
+The command will return results like:
+
+```
+Install with npx skills add <owner/repo@skill>
+
+vercel-labs/agent-skills@vercel-react-best-practices
+└ https://skills.sh/vercel-labs/agent-skills/vercel-react-best-practices
+```
+
+### Step 3: Present Options to the User
+
+When you find relevant skills, present them to the user with:
+
+1. The skill name and what it does
+2. The install command they can run
+3. A link to learn more at skills.sh
+
+Example response:
+
+```
+I found a skill that might help! The "vercel-react-best-practices" skill provides
+React and Next.js performance optimization guidelines from Vercel Engineering.
+
+To install it:
+npx skills add vercel-labs/agent-skills@vercel-react-best-practices
+
+Learn more: https://skills.sh/vercel-labs/agent-skills/vercel-react-best-practices
+```
+
+### Step 4: Offer to Install
+
+If the user wants to proceed, you can install the skill for them:
+
+```bash
+npx skills add <owner/repo@skill> -g -y
+```
+
+The `-g` flag installs globally (user-level) and `-y` skips confirmation prompts.
+
+## Common Skill Categories
+
+When searching, consider these common categories:
+
+| Category        | Example Queries                          |
+| --------------- | ---------------------------------------- |
+| Web Development | react, nextjs, typescript, css, tailwind |
+| Testing         | testing, jest, playwright, e2e           |
+| DevOps          | deploy, docker, kubernetes, ci-cd        |
+| Documentation   | docs, readme, changelog, api-docs        |
+| Code Quality    | review, lint, refactor, best-practices   |
+| Design          | ui, ux, design-system, accessibility     |
+| Productivity    | workflow, automation, git                |
+
+## Tips for Effective Searches
+
+1. **Use specific keywords**: "react testing" is better than just "testing"
+2. **Try alternative terms**: If "deploy" doesn't work, try "deployment" or "ci-cd"
+3. **Check popular sources**: Many skills come from `vercel-labs/agent-skills` or `ComposioHQ/awesome-claude-skills`
+
+## When No Skills Are Found
+
+If no relevant skills exist:
+
+1. Acknowledge that no existing skill was found
+2. Offer to help with the task directly using your general capabilities
+3. Suggest the user could create their own skill with `npx skills init`
+
+Example:
+
+```
+I searched for skills related to "xyz" but didn't find any matches.
+I can still help you with this task directly! Would you like me to proceed?
+
+If this is something you do often, you could create your own skill:
+npx skills init my-xyz-skill
+```
diff --git a/skills/imagegen/LICENSE.txt b/skills/imagegen/LICENSE.txt
new file mode 100644
index 0000000..13e25df
--- /dev/null
+++ b/skills/imagegen/LICENSE.txt
@@ -0,0 +1,201 @@
+Apache License
+Version 2.0, January 2004
+http://www.apache.org/licenses/
+
+TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+1. Definitions.
+
+   "License" shall mean the terms and conditions for use, reproduction,
+   and distribution as defined by Sections 1 through 9 of this document.
+
+   "Licensor" shall mean the copyright owner or entity authorized by
+   the copyright owner that is granting the License.
+
+   "Legal Entity" shall mean the union of the acting entity and all
+   other entities that control, are controlled by, or are under common
+   control with that entity. For the purposes of this definition,
+   "control" means (i) the power, direct or indirect, to cause the
+   direction or management of such entity, whether by contract or
+   otherwise, or (ii) ownership of fifty percent (50%) or more of the
+   outstanding shares, or (iii) beneficial ownership of such entity.
+
+   "You" (or "Your") shall mean an individual or Legal Entity
+   exercising permissions granted by this License.
+
+   "Source" form shall mean the preferred form for making modifications,
+   including but not limited to software source code, documentation
+   source, and configuration files.
+
+   "Object" form shall mean any form resulting from mechanical
+   transformation or translation of a Source form, including but
+   not limited to compiled object code, generated documentation,
+   and conversions to other media types.
+
+   "Work" shall mean the work of authorship, whether in Source or
+   Object form, made available under the License, as indicated by a
+   copyright notice that is included in or attached to the work
+   (an example is provided in the Appendix below).
+
+   "Derivative Works" shall mean any work, whether in Source or Object
+   form, that is based on (or derived from) the Work and for which the
+   editorial revisions, annotations, elaborations, or other modifications
+   represent, as a whole, an original work of authorship. For the purposes
+   of this License, Derivative Works shall not include works that remain
+   separable from, or merely link (or bind by name) to the interfaces of,
+   the Work and Derivative Works thereof.
+
+   "Contribution" shall mean any work of authorship, including
+   the original version of the Work and any modifications or additions
+   to that Work or Derivative Works thereof, that is intentionally
+   submitted to Licensor for inclusion in the Work by the copyright owner
+   or by an individual or Legal Entity authorized to submit on behalf of
+   the copyright owner. For the purposes of this definition, "submitted"
+   means any form of electronic, verbal, or written communication sent
+   to the Licensor or its representatives, including but not limited to
+   communication on electronic mailing lists, source code control systems,
+   and issue tracking systems that are managed by, or on behalf of, the
+   Licensor for the purpose of discussing and improving the Work, but
+   excluding communication that is conspicuously marked or otherwise
+   designated in writing by the copyright owner as "Not a Contribution."
+
+   "Contributor" shall mean Licensor and any individual or Legal Entity
+   on behalf of whom a Contribution has been received by Licensor and
+   subsequently incorporated within the Work.
+
+2. Grant of Copyright License. Subject to the terms and conditions of
+   this License, each Contributor hereby grants to You a perpetual,
+   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+   copyright license to reproduce, prepare Derivative Works of,
+   publicly display, publicly perform, sublicense, and distribute the
+   Work and such Derivative Works in Source or Object form.
+
+3. Grant of Patent License. Subject to the terms and conditions of
+   this License, each Contributor hereby grants to You a perpetual,
+   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+   (except as stated in this section) patent license to make, have made,
+   use, offer to sell, sell, import, and otherwise transfer the Work,
+   where such license applies only to those patent claims licensable
+   by such Contributor that are necessarily infringed by their
+   Contribution(s) alone or by combination of their Contribution(s)
+   with the Work to which such Contribution(s) was submitted. If You
+   institute patent litigation against any entity (including a
+   cross-claim or counterclaim in a lawsuit) alleging that the Work
+   or a Contribution incorporated within the Work constitutes direct
+   or contributory patent infringement, then any patent licenses
+   granted to You under this License for that Work shall terminate
+   as of the date such litigation is filed.
+
+4. Redistribution. You may reproduce and distribute copies of the
+   Work or Derivative Works thereof in any medium, with or without
+   modifications, and in Source or Object form, provided that You
+   meet the following conditions:
+
+   (a) You must give any other recipients of the Work or
+       Derivative Works a copy of this License; and
+
+   (b) You must cause any modified files to carry prominent notices
+       stating that You changed the files; and
+
+   (c) You must retain, in the Source form of any Derivative Works
+       that You distribute, all copyright, patent, trademark, and
+       attribution notices from the Source form of the Work,
+       excluding those notices that do not pertain to any part of
+       the Derivative Works; and
+
+   (d) If the Work includes a "NOTICE" text file as part of its
+       distribution, then any Derivative Works that You distribute must
+       include a readable copy of the attribution notices contained
+       within such NOTICE file, excluding those notices that do not
+       pertain to any part of the Derivative Works, in at least one
+       of the following places: within a NOTICE text file distributed
+       as part of the Derivative Works; within the Source form or
+       documentation, if provided along with the Derivative Works; or,
+       within a display generated by the Derivative Works, if and
+       wherever such third-party notices normally appear. The contents
+       of the NOTICE file are for informational purposes only and
+       do not modify the License. You may add Your own attribution
+       notices within Derivative Works that You distribute, alongside
+       or as an addendum to the NOTICE text from the Work, provided
+       that such additional attribution notices cannot be construed
+       as modifying the License.
+
+   You may add Your own copyright statement to Your modifications and
+   may provide additional or different license terms and conditions
+   for use, reproduction, or distribution of Your modifications, or
+   for any such Derivative Works as a whole, provided Your use,
+   reproduction, and distribution of the Work otherwise complies with
+   the conditions stated in this License.
+
+5. Submission of Contributions. Unless You explicitly state otherwise,
+   any Contribution intentionally submitted for inclusion in the Work
+   by You to the Licensor shall be under the terms and conditions of
+   this License, without any additional terms or conditions.
+   Notwithstanding the above, nothing herein shall supersede or modify
+   the terms of any separate license agreement you may have executed
+   with Licensor regarding such Contributions.
+
+6. Trademarks. This License does not grant permission to use the trade
+   names, trademarks, service marks, or product names of the Licensor,
+   except as required for reasonable and customary use in describing the
+   origin of the Work and reproducing the content of the NOTICE file.
+
+7. Disclaimer of Warranty. Unless required by applicable law or
+   agreed to in writing, Licensor provides the Work (and each
+   Contributor provides its Contributions) on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+   implied, including, without limitation, any warranties or conditions
+   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+   PARTICULAR PURPOSE. You are solely responsible for determining the
+   appropriateness of using or redistributing the Work and assume any
+   risks associated with Your exercise of permissions under this License.
+
+8. Limitation of Liability. In no event and under no legal theory,
+   whether in tort (including negligence), contract, or otherwise,
+   unless required by applicable law (such as deliberate and grossly
+   negligent acts) or agreed to in writing, shall any Contributor be
+   liable to You for damages, including any direct, indirect, special,
+   incidental, or consequential damages of any character arising as a
+   result of this License or out of the use or inability to use the
+   Work (including but not limited to damages for loss of goodwill,
+   work stoppage, computer failure or malfunction, or any and all
+   other commercial damages or losses), even if such Contributor
+   has been advised of the possibility of such damages.
+
+9. Accepting Warranty or Additional Liability. While redistributing
+   the Work or Derivative Works thereof, You may choose to offer,
+   and charge a fee for, acceptance of support, warranty, indemnity,
+   or other liability obligations and/or rights consistent with this
+   License. However, in accepting such obligations, You may act only
+   on Your own behalf and on Your sole responsibility, not on behalf of
+   any other Contributor, and only if You agree to indemnify,
+   defend, and hold each Contributor harmless for any liability
+   incurred by, or claims asserted against, such Contributor by reason
+   of your accepting any such warranty or additional liability.
+
+END OF TERMS AND CONDITIONS
+
+APPENDIX: How to apply the Apache License to your work.
+
+   To apply the Apache License to your work, attach the following
+   boilerplate notice, with the fields enclosed by brackets "[]"
+   replaced with your own identifying information. (Don't include
+   the brackets!)  The text should be enclosed in the appropriate
+   comment syntax for the file format. We also recommend that a
+   file or class name and description of purpose be included on the
+   same "printed page" as the copyright notice for easier
+   identification within third-party archives.
+
+Copyright [yyyy] [name of copyright owner]
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
diff --git a/skills/imagegen/SKILL.md b/skills/imagegen/SKILL.md
new file mode 100644
index 0000000..4285e5e
--- /dev/null
+++ b/skills/imagegen/SKILL.md
@@ -0,0 +1,356 @@
+---
+name: "imagegen"
+description: "Generate or edit raster images when the task benefits from AI-created bitmap visuals such as photos, illustrations, textures, sprites, mockups, or transparent-background cutouts. Use when Codex should create a brand-new image, transform an existing image, or derive visual variants from references, and the output should be a bitmap asset rather than repo-native code or vector. Do not use when the task is better handled by editing existing SVG/vector/code-native assets, extending an established icon or logo system, or building the visual directly in HTML/CSS/canvas."
+---
+
+# Image Generation Skill
+
+Generates or edits images for the current project (for example website assets, game assets, UI mockups, product mockups, wireframes, logo design, photorealistic images, or infographics).
+
+## Top-level modes and rules
+
+This skill has exactly two top-level modes:
+
+- **Default built-in tool mode (preferred):** built-in `image_gen` tool for normal image generation, editing, and simple transparent-image requests. Does not require `OPENAI_API_KEY`.
+- **Fallback CLI mode:** `scripts/image_gen.py` CLI. Use when the user explicitly asks for the CLI/API/model path, or after the user explicitly confirms a true model-native transparency fallback with `gpt-image-1.5`. Requires `OPENAI_API_KEY`.
+
+Within CLI fallback, the CLI exposes three subcommands:
+
+- `generate`
+- `edit`
+- `generate-batch`
+
+Rules:
+- Use the built-in `image_gen` tool by default for normal image generation and editing requests.
+- Do not switch to CLI fallback for ordinary quality, size, or file-path control.
+- If the user explicitly asks for a transparent image/background, stay on built-in `image_gen` first: prompt for a flat removable chroma-key background, then remove it locally with the installed helper at `$CODEX_HOME/skills/.system/imagegen/scripts/remove_chroma_key.py`.
+- Never silently switch from built-in `image_gen` or CLI `gpt-image-2` to CLI `gpt-image-1.5`. Treat this as a model/path downgrade and ask the user before doing it, unless the user has already explicitly requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback.
+- If a transparent request appears too complex for clean chroma-key removal, the user asks for true/native transparency, or local removal fails validation, explain that true transparency requires CLI `gpt-image-1.5 --background transparent --output-format png` because `gpt-image-2` does not support `background=transparent`, then ask whether to proceed. Run the CLI fallback only after the user confirms.
+- The word `batch` by itself does not mean CLI fallback. If the user asks for many assets or says to batch-generate assets without explicitly asking for CLI/API/model controls, stay on the built-in path and issue one built-in call per requested asset or variant.
+- If the built-in tool fails or is unavailable, tell the user the CLI fallback exists and that it requires `OPENAI_API_KEY`. Proceed only if the user explicitly asks for that fallback.
+- If the user explicitly asks for CLI mode, use the bundled `scripts/image_gen.py` workflow. Do not create one-off SDK runners.
+- Never modify `scripts/image_gen.py`. If something is missing, ask the user before doing anything else.
+
+Built-in save-path policy:
+- In built-in tool mode, Codex saves generated images under `$CODEX_HOME/*` by default.
+- Do not describe or rely on OS temp as the default built-in destination.
+- Do not describe or rely on a destination-path argument (if any) on the built-in `image_gen` tool. If a specific location is needed, generate first and then move or copy the selected output from `$CODEX_HOME/generated_images/...`.
+- Save-path precedence in built-in mode:
+  1. If the user names a destination, move or copy the selected output there.
+  2. If the image is meant for the current project, move or copy the final selected image into the workspace before finishing.
+  3. If the image is only for preview or brainstorming, render it inline; the underlying file can remain at the default `$CODEX_HOME/*` path.
+- Never leave a project-referenced asset only at the default `$CODEX_HOME/*` path.
+- Do not overwrite an existing asset unless the user explicitly asked for replacement; otherwise create a sibling versioned filename such as `hero-v2.png` or `item-icon-edited.png`.
+
+Shared prompt guidance for both modes lives in `references/prompting.md` and `references/sample-prompts.md`.
+
+Fallback-only docs/resources for CLI mode:
+- `references/cli.md`
+- `references/image-api.md`
+- `references/codex-network.md`
+- `scripts/image_gen.py`
+
+Local post-processing helper:
+- `$CODEX_HOME/skills/.system/imagegen/scripts/remove_chroma_key.py`: removes a flat chroma-key background from a generated image and writes a PNG/WebP with alpha. Prefer auto-key sampling, soft matte, and despill for antialiased edges.
+
+## When to use
+- Generate a new image (concept art, product shot, cover, website hero)
+- Generate a new image using one or more reference images for style, composition, or mood
+- Edit an existing image (inpainting, lighting or weather transformations, background replacement, object removal, compositing, transparent background)
+- Produce many assets or variants for one task
+
+## When not to use
+- Extending or matching an existing SVG/vector icon set, logo system, or illustration library inside the repo
+- Creating simple shapes, diagrams, wireframes, or icons that are better produced directly in SVG, HTML/CSS, or canvas
+- Making a small project-local asset edit when the source file already exists in an editable native format
+- Any task where the user clearly wants deterministic code-native output instead of a generated bitmap
+
+## Decision tree
+
+Think about two separate questions:
+
+1. **Intent:** is this a new image or an edit of an existing image?
+2. **Execution strategy:** is this one asset or many assets/variants?
+
+Intent:
+- If the user wants to modify an existing image while preserving parts of it, treat the request as **edit**.
+- If the user provides images only as references for style, composition, mood, or subject guidance, treat the request as **generate**.
+- If the user provides no images, treat the request as **generate**.
+
+Built-in edit semantics:
+- Built-in edit mode is for images already visible in the conversation context, such as attached images or images generated earlier in the thread.
+- If the user wants to edit a local image file with the built-in tool, first load it with the built-in `view_image` tool so the image is visible in the conversation context, then proceed with the built-in edit flow.
+- Do not promise arbitrary filesystem-path editing through the built-in tool.
+- If a local file still needs direct file-path control, masks, or other explicit CLI-only parameters, use the explicit CLI fallback only when the user asks for it.
+- For edits, preserve invariants aggressively and save non-destructively by default.
+
+Execution strategy:
+- In the built-in default path, produce many assets or variants by issuing one `image_gen` call per requested asset or variant.
+- In the CLI fallback path, use the CLI `generate-batch` subcommand only when the user explicitly chose CLI mode and needs many prompts/assets.
+- For many distinct assets, do not use `n` as a substitute for separate prompts. `n` is for variants of one prompt; distinct assets need distinct built-in calls or distinct CLI `generate-batch` jobs.
+
+Assume the user wants a new image unless they clearly ask to change an existing one.
+
+## Workflow
+1. Decide the top-level mode: built-in by default, including simple transparent-output requests; fallback CLI only if explicitly requested or after the user explicitly confirms a transparent-output fallback.
+2. Decide the intent: `generate` or `edit`.
+3. Decide whether the output is preview-only or meant to be consumed by the current project.
+4. Decide the execution strategy: single asset vs repeated built-in calls vs CLI `generate-batch`.
+5. Collect inputs up front: prompt(s), exact text (verbatim), constraints/avoid list, and any input images.
+6. For every input image, label its role explicitly:
+   - reference image
+   - edit target
+   - supporting insert/style/compositing input
+7. If the edit target is only on the local filesystem and you are staying on the built-in path, inspect it with `view_image` first so the image is available in conversation context.
+8. If the user asked for a photo, illustration, sprite, product image, banner, or other explicitly raster-style asset, use `image_gen` rather than substituting SVG/HTML/CSS placeholders. If the request is for an icon, logo, or UI graphic that should match existing repo-native SVG/vector/code assets, prefer editing those directly instead.
+9. Augment the prompt based on specificity:
+   - If the user's prompt is already specific and detailed, normalize it into a clear spec without adding creative requirements.
+   - If the user's prompt is generic, add tasteful augmentation only when it materially improves output quality.
+10. Use the built-in `image_gen` tool by default.
+11. For transparent-output requests, follow the transparent image guidance below: generate with built-in `image_gen` on a flat chroma-key background, copy the selected output into the workspace or `tmp/imagegen/`, run the installed `$CODEX_HOME/skills/.system/imagegen/scripts/remove_chroma_key.py` helper, and validate the alpha result before using it. If this path looks unsuitable or fails, ask before switching to CLI `gpt-image-1.5`.
+12. Inspect outputs and validate: subject, style, composition, text accuracy, and invariants/avoid items.
+13. Iterate with a single targeted change, then re-check.
+14. For preview-only work, render the image inline; the underlying file may remain at the default `$CODEX_HOME/generated_images/...` path.
+15. For project-bound work, move or copy the selected artifact into the workspace and update any consuming code or references. Never leave a project-referenced asset only at the default `$CODEX_HOME/generated_images/...` path.
+16. For batches or multi-asset requests, persist every requested deliverable final in the workspace unless the user explicitly asked to keep outputs preview-only. Discarded variants do not need to be kept unless requested.
+17. If the user explicitly chooses or confirms the CLI fallback, then use the fallback-only docs for model, quality, size, `input_fidelity`, masks, output format, output paths, and network setup.
+18. Always report the final saved path(s) for any workspace-bound asset(s), plus the final prompt or prompt set and whether the built-in tool or fallback CLI mode was used.
+
+## Transparent image requests
+
+Transparent-image requests still use built-in `image_gen` first. Because the built-in tool does not expose a true transparent-background control, create a removable chroma-key source image and then convert the key color to alpha locally.
+
+Default sequence:
+1. Use built-in `image_gen` to generate the requested subject on a perfectly flat solid chroma-key background.
+2. Choose a key color that is unlikely to appear in the subject: default `#00ff00`, use `#ff00ff` for green subjects, and avoid `#0000ff` for blue subjects.
+3. After generation, move or copy the selected source image from `$CODEX_HOME/generated_images/...` into the workspace or `tmp/imagegen/`.
+4. Run the installed helper path, not a project-relative script path:
+   ```bash
+   python "${CODEX_HOME:-$HOME/.codex}/skills/.system/imagegen/scripts/remove_chroma_key.py" \
+     --input <source> \
+     --out <final.png> \
+     --auto-key border \
+     --soft-matte \
+     --transparent-threshold 12 \
+     --opaque-threshold 220 \
+     --despill
+   ```
+5. Validate that the output has an alpha channel, transparent corners, plausible subject coverage, and no obvious key-color fringe. If a thin fringe remains, retry once with `--edge-contract 1`; use `--edge-feather 0.25` only when the edge is visibly stair-stepped and the subject is not shiny or reflective.
+6. Save the final alpha PNG/WebP in the project if the asset is project-bound. Never leave a project-referenced transparent asset only under `$CODEX_HOME/*`.
+
+Prompt transparent requests like this:
+
+```text
+Create the requested subject on a perfectly flat solid #00ff00 chroma-key background for background removal.
+The background must be one uniform color with no shadows, gradients, texture, reflections, floor plane, or lighting variation.
+Keep the subject fully separated from the background with crisp edges and generous padding.
+Do not use #00ff00 anywhere in the subject.
+No cast shadow, no contact shadow, no reflection, no watermark, and no text unless explicitly requested.
+```
+
+Do not automatically use CLI `gpt-image-1.5 --background transparent --output-format png` instead of chroma keying. Ask the user first when the user asks for true/native transparency, when local removal fails validation, or when the requested image is complex: hair, fur, feathers, smoke, glass, liquids, translucent materials, reflective objects, soft shadows, realistic product grounding, or subject colors that conflict with all practical key colors.
+
+Use a concise confirmation like:
+
+```text
+This likely needs true native transparency. The default built-in path uses a chroma-key background plus local removal, but true transparency requires the CLI fallback with gpt-image-1.5 because gpt-image-2 does not support background=transparent. It also requires OPENAI_API_KEY. Should I proceed with that CLI fallback?
+```
+
+## Prompt augmentation
+
+Reformat user prompts into a structured, production-oriented spec. Make the user's goal clearer and more actionable, but do not blindly add detail.
+
+Treat this as prompt-shaping guidance, not a closed schema. Use only the lines that help, and add a short extra labeled line when it materially improves clarity.
+
+### Specificity policy
+
+Use the user's prompt specificity to decide how much augmentation is appropriate:
+
+- If the prompt is already specific and detailed, preserve that specificity and only normalize/structure it.
+- If the prompt is generic, you may add tasteful augmentation when it will materially improve the result.
+
+Allowed augmentations:
+- composition or framing hints
+- polish level or intended-use hints
+- practical layout guidance
+- reasonable scene concreteness that supports the stated request
+
+Not allowed augmentations:
+- extra characters or objects that are not implied by the request
+- brand names, slogans, palettes, or narrative beats that are not implied
+- arbitrary side-specific placement unless the surrounding layout supports it
+
+## Use-case taxonomy (exact slugs)
+
+Classify each request into one of these buckets and keep the slug consistent across prompts and references.
+
+Generate:
+- photorealistic-natural — candid/editorial lifestyle scenes with real texture and natural lighting.
+- product-mockup — product/packaging shots, catalog imagery, merch concepts.
+- ui-mockup — app/web interface mockups and wireframes; specify the desired fidelity.
+- infographic-diagram — diagrams/infographics with structured layout and text.
+- scientific-educational — classroom explainers, scientific diagrams, and learning visuals with required labels and accuracy constraints.
+- ads-marketing — campaign concepts and ad creatives with audience, brand position, scene, and exact tagline/copy.
+- productivity-visual — slide, chart, workflow, and data-heavy business visuals.
+- logo-brand — logo/mark exploration, vector-friendly.
+- illustration-story — comics, children’s book art, narrative scenes.
+- stylized-concept — style-driven concept art, 3D/stylized renders.
+- historical-scene — period-accurate/world-knowledge scenes.
+
+Edit:
+- text-localization — translate/replace in-image text, preserve layout.
+- identity-preserve — try-on, person-in-scene; lock face/body/pose.
+- precise-object-edit — remove/replace a specific element (including interior swaps).
+- lighting-weather — time-of-day/season/atmosphere changes only.
+- background-extraction — transparent background / clean cutout. Use built-in `image_gen` with chroma-key removal first for simple opaque subjects; ask before using CLI true transparency for complex subjects.
+- style-transfer — apply reference style while changing subject/scene.
+- compositing — multi-image insert/merge with matched lighting/perspective.
+- sketch-to-render — drawing/line art to photoreal render.
+
+## Shared prompt schema
+
+Use the following labeled spec as shared prompt scaffolding for both top-level modes:
+
+```text
+Use case: <taxonomy slug>
+Asset type: <where the asset will be used>
+Primary request: <user's main prompt>
+Input images: <Image 1: role; Image 2: role> (optional)
+Scene/backdrop: <environment>
+Subject: <main subject>
+Style/medium: <photo/illustration/3D/etc>
+Composition/framing: <wide/close/top-down; placement>
+Lighting/mood: <lighting + mood>
+Color palette: <palette notes>
+Materials/textures: <surface details>
+Text (verbatim): "<exact text>"
+Constraints: <must keep/must avoid>
+Avoid: <negative constraints>
+```
+
+Notes:
+- `Asset type` and `Input images` are prompt scaffolding, not dedicated CLI flags.
+- `Scene/backdrop` refers to the visual setting. It is not the same as the fallback CLI `background` parameter, which controls output transparency behavior.
+- Fallback-only execution notes such as `Quality:`, `Input fidelity:`, masks, output format, and output paths belong in the CLI path only. Do not treat them as built-in `image_gen` tool arguments.
+
+Augmentation rules:
+- Keep it short.
+- Add only the details needed to improve the prompt materially.
+- For edits, explicitly list invariants (`change only X; keep Y unchanged`).
+- If any critical detail is missing and blocks success, ask a question; otherwise proceed.
+
+## Examples
+
+### Generation example (hero image)
+```text
+Use case: product-mockup
+Asset type: landing page hero
+Primary request: a minimal hero image of a ceramic coffee mug
+Style/medium: clean product photography
+Composition/framing: wide composition with usable negative space for page copy if needed
+Lighting/mood: soft studio lighting
+Constraints: no logos, no text, no watermark
+```
+
+### Edit example (invariants)
+```text
+Use case: precise-object-edit
+Asset type: product photo background replacement
+Primary request: replace only the background with a warm sunset gradient
+Constraints: change only the background; keep the product and its edges unchanged; no text; no watermark
+```
+
+## Prompting best practices
+- Structure the prompt as scene/backdrop -> subject -> details -> constraints.
+- Include intended use (ad, UI mock, infographic) to set the mode and polish level.
+- Use camera/composition language for photorealism.
+- Only use SVG/vector stand-ins when the user explicitly asked for vector output or a non-image placeholder.
+- Quote exact text and specify typography + placement.
+- For tricky words, spell them letter-by-letter and require verbatim rendering.
+- For multi-image inputs, reference images by index and describe how they should be used.
+- For edits, repeat invariants every iteration to reduce drift.
+- Iterate with single-change follow-ups.
+- If the prompt is generic, add only the extra detail that will materially help.
+- If the prompt is already detailed, normalize it instead of expanding it.
+- For CLI fallback only, see `references/cli.md` and `references/image-api.md` for model, `quality`, `input_fidelity`, masks, output format, and output-path guidance.
+- For transparent images, use the built-in-first chroma-key workflow unless the request is complex enough to need true CLI transparency; ask before switching to CLI `gpt-image-1.5`.
+
+More principles shared by both modes: `references/prompting.md`.
+Copy/paste specs shared by both modes: `references/sample-prompts.md`.
+
+## Guidance by asset type
+Asset-type templates (website assets, game assets, wireframes, logo) are consolidated in `references/sample-prompts.md`.
+
+## gpt-image-2 guidance for CLI fallback
+
+The fallback CLI defaults to `gpt-image-2`.
+
+- Use `gpt-image-2` for new CLI/API workflows unless the request needs true model-native transparent output.
+- If a transparent request may need CLI fallback, ask before using `gpt-image-1.5` unless the user already explicitly requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback. Explain that the built-in chroma-key path is the default, but true transparency requires `gpt-image-1.5` because `gpt-image-2` does not support `background=transparent`.
+- `gpt-image-2` always uses high fidelity for image inputs; do not set `input_fidelity` with this model.
+- `gpt-image-2` supports `quality` values `low`, `medium`, `high`, and `auto`.
+- Use `quality low` for fast drafts, thumbnails, and quick iterations. Use `medium`, `high`, or `auto` for final assets, dense text, diagrams, identity-sensitive edits, or high-resolution outputs.
+- Square images are typically fastest to generate. Use `1024x1024` for fast square drafts.
+- If the user asks for 4K-style output, use `3840x2160` for landscape or `2160x3840` for portrait.
+- `gpt-image-2` size may be `auto` or `WIDTHxHEIGHT` if all constraints hold: max edge `<= 3840px`, both edges multiples of `16px`, long-to-short ratio `<= 3:1`, total pixels between `655,360` and `8,294,400`.
+
+Popular `gpt-image-2` sizes:
+- `1024x1024` square
+- `1536x1024` landscape
+- `1024x1536` portrait
+- `2048x2048` 2K square
+- `2048x1152` 2K landscape
+- `3840x2160` 4K landscape
+- `2160x3840` 4K portrait
+- `auto`
+
+## Fallback CLI mode only
+
+### Temp and output conventions
+These conventions apply only to the CLI fallback. They do not describe built-in `image_gen` output behavior.
+- Use `tmp/imagegen/` for intermediate files (for example JSONL batches); delete them when done.
+- Write final artifacts under `output/imagegen/`.
+- Use `--out` or `--out-dir` to control output paths; keep filenames stable and descriptive.
+
+### Dependencies
+Prefer `uv` for dependency management in this repo.
+
+Required Python package:
+```bash
+uv pip install openai
+```
+
+Required for local chroma-key removal and optional downscaling:
+```bash
+uv pip install pillow
+```
+
+Portability note:
+- If you are using the installed skill outside this repo, install dependencies into that environment with its package manager.
+- In uv-managed environments, `uv pip install ...` remains the preferred path.
+
+### Environment
+- `OPENAI_API_KEY` must be set for live API calls.
+- Do not ask the user for `OPENAI_API_KEY` when using the built-in `image_gen` tool.
+- Never ask the user to paste the full key in chat. Ask them to set it locally and confirm when ready.
+
+If the key is missing, give the user these steps:
+1. Create an API key in the OpenAI platform UI: https://platform.openai.com/api-keys
+2. Set `OPENAI_API_KEY` as an environment variable in their system.
+3. Offer to guide them through setting the environment variable for their OS/shell if needed.
+
+If installation is not possible in this environment, tell the user which dependency is missing and how to install it into their active environment.
+
+### Script-mode notes
+- CLI commands + examples: `references/cli.md`
+- API parameter quick reference: `references/image-api.md`
+- Network approvals / sandbox settings for CLI mode: `references/codex-network.md`
+
+## Reference map
+- `references/prompting.md`: shared prompting principles for both modes.
+- `references/sample-prompts.md`: shared copy/paste prompt recipes for both modes.
+- `references/cli.md`: fallback-only CLI usage via `scripts/image_gen.py`.
+- `references/image-api.md`: fallback-only API/CLI parameter reference.
+- `references/codex-network.md`: fallback-only network/sandbox troubleshooting for CLI mode.
+- `scripts/image_gen.py`: fallback-only CLI implementation. Do not load or use it unless the user explicitly chooses CLI mode or explicitly confirms a transparent request's true CLI transparency fallback.
+- `$CODEX_HOME/skills/.system/imagegen/scripts/remove_chroma_key.py`: local post-processing helper for built-in transparent-image requests.
diff --git a/skills/imagegen/agents/openai.yaml b/skills/imagegen/agents/openai.yaml
new file mode 100644
index 0000000..5e01d44
--- /dev/null
+++ b/skills/imagegen/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "Image Gen"
+  short_description: "Generate or edit images for websites, games, and more"
+  icon_small: "./assets/imagegen-small.svg"
+  icon_large: "./assets/imagegen.png"
+  default_prompt: "Use $imagegen to make or edit an image for this project."
diff --git a/skills/imagegen/assets/imagegen-small.svg b/skills/imagegen/assets/imagegen-small.svg
new file mode 100644
index 0000000..20128b2
--- /dev/null
+++ b/skills/imagegen/assets/imagegen-small.svg
@@ -0,0 +1,5 @@
+<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" viewBox="0 0 16 16">
+  <path fill="currentColor" d="M7.51 6.827a1 1 0 1 1 .278 1.982 1 1 0 0 1-.278-1.982Z"/>
+  <path fill="currentColor" fill-rule="evenodd" d="M8.31 4.47c.368-.016.699.008 1.016.124l.186.075c.423.194.786.5 1.047.888l.067.107c.148.253.235.533.3.848.073.354.126.797.193 1.343l.277 2.25.088.745c.024.224.041.425.049.605.013.322-.004.615-.085.896l-.04.12a2.53 2.53 0 0 1-.802 1.115l-.16.118c-.281.189-.596.292-.956.366a9.46 9.46 0 0 1-.6.1l-.743.094-2.25.277c-.547.067-.99.121-1.35.136a2.765 2.765 0 0 1-.896-.085l-.12-.039a2.533 2.533 0 0 1-1.115-.802l-.118-.161c-.189-.28-.292-.596-.366-.956a9.42 9.42 0 0 1-.1-.599l-.094-.744-.276-2.25a17.884 17.884 0 0 1-.137-1.35c-.015-.367.009-.698.124-1.015l.076-.185c.193-.423.5-.787.887-1.048l.107-.067c.253-.148.534-.234.849-.3.354-.073.796-.126 1.343-.193l2.25-.277.744-.088c.224-.024.425-.041.606-.049Zm-2.905 5.978a1.47 1.47 0 0 0-.875.074c-.127.052-.267.146-.475.344-.212.204-.462.484-.822.889l-.314.351c.018.115.036.219.055.313.061.295.127.458.206.575l.07.094c.167.211.39.372.645.465l.109.032c.119.027.273.038.499.029.308-.013.7-.06 1.264-.13l2.25-.275.727-.093.198-.03-2.05-1.64a16.848 16.848 0 0 0-.96-.738c-.18-.121-.31-.19-.421-.23l-.106-.03Zm2.95-4.915c-.154.006-.33.021-.536.043l-.729.086-2.25.276c-.564.07-.956.118-1.257.18a1.937 1.937 0 0 0-.478.15l-.097.057a1.47 1.47 0 0 0-.515.608l-.044.107c-.048.133-.073.307-.06.608.012.307.06.7.129 1.264l.22 1.8.178-.197c.145-.159.278-.298.403-.418.255-.243.507-.437.809-.56l.181-.067a2.526 2.526 0 0 1 1.328-.06l.118.029c.27.079.517.215.772.387.287.194.619.46 1.03.789l2.52 2.016c.146-.148.26-.326.332-.524l.031-.109c.027-.119.039-.273.03-.499a8.311 8.311 0 0 0-.044-.536l-.086-.728-.276-2.25c-.07-.564-.118-.956-.18-1.258a1.935 1.935 0 0 0-.15-.477l-.057-.098a1.468 1.468 0 0 0-.608-.515l-.107-.043c-.133-.049-.306-.074-.607-.061Z" clip-rule="evenodd"/>
+  <path fill="currentColor" d="M7.783 1.272c.36.014.803.07 1.35.136l2.25.277.743.095c.224.03.423.062.6.099.36.074.675.177.955.366l.161.118c.364.29.642.675.802 1.115l.04.12c.081.28.098.574.085.896a9.42 9.42 0 0 1-.05.605l-.087.745-.277 2.25c-.067.547-.12.989-.193 1.343a2.765 2.765 0 0 1-.3.848l-.067.107a2.534 2.534 0 0 1-.415.474l-.086.064a.532.532 0 0 1-.622-.858l.13-.13c.04-.046.077-.094.111-.145l.057-.098c.055-.109.104-.256.15-.477.062-.302.11-.694.18-1.258l.276-2.25.086-.728c.022-.207.037-.382.043-.536.01-.226-.002-.38-.029-.5l-.032-.108a1.469 1.469 0 0 0-.464-.646l-.094-.069c-.118-.08-.28-.145-.575-.206a8.285 8.285 0 0 0-.53-.088l-.728-.092-2.25-.276c-.565-.07-.956-.117-1.264-.13a1.94 1.94 0 0 0-.5.029l-.108.032a1.469 1.469 0 0 0-.647.465l-.068.094c-.054.08-.102.18-.146.33l-.04.1a.533.533 0 0 1-.98-.403l.055-.166c.059-.162.133-.314.23-.457l.117-.16c.29-.365.675-.643 1.115-.803l.12-.04c.28-.08.574-.097.896-.084Z"/>
+</svg>
diff --git a/skills/imagegen/assets/imagegen.png b/skills/imagegen/assets/imagegen.png
new file mode 100644
index 0000000000000000000000000000000000000000..94b54541a9affd39a7aa09d0efd5bc6b712b723b
GIT binary patch
literal 1711
zcmV;g22lBlP)<h;3K|Lk000e1NJLTq003kF003kN1^@s6aN?Cz00009a7bBm000XU
z000XU0RWnu7ytkO0drDELIAGL9O(c600d`2O+f$vv5yP<VFdsH21H3jK~#7F?VV3-
z6Gs$>f8*GWodgmJ0xDHBC~1!*z7`}xiD+*{^u{6Wtr9m>;F?6e6%akq_R>NQ97`^h
zS_ISw!l_acdMv2|s@jkWFo}~maqQ{5Ar6jXJ8OGpcRf3wwDM+c*~)zT-u&HNh6Xr2
z$-B~6@6U&DoN@F6Tx_gMyw!zZkYd0r7n}J1r^VmNyNO5=4Zu(bgOk|-gzyRH_#DA0
ze5a&Dv5qs&Z`LEHCLtt(GYpH}0a%=n6p=Gpix@{jKAv3Z&a&_|v3nYpI$$><yk+#4
z1e@LQlRJH2BPwpgrltlFGC0oPON7U(eJWJ#&B5vHu#oW^tPBP4ZZLlPLs6#HK2<S7
zqzsM`Sd=49@{#*}k<oJRl@(%T=!f&%`TL33H>Jn72{}2rewsoH7VU@@*oo2>*cKtL
zTT?Bf&S2fJxIt<c4<8;+uvFo|mP$R#BEwdOt8^{0^&g85Y(|JpRo+pYy52+x%U^@V
z6E;RaBvObRn*!^G#VZD0JJ=Ay8T$+tPvINGQnC&?IhB10+Z*>9+2RUqgo>5nJ#ub|
zQq}-0z927LghkRij)2h@&){gs3Jyeb=#8#z9#4y@PugZO5lp1xm|ls&O&Ie1Y;Y<&
zDJqnH7*0nhk28A~<wpBXn9GLoXt@<*FFNJEe%LG%6*`CEoY}L0p}h-^MU+BO^V7>+
z7<=9c&7_PLLIN%we2x!9dQ!nmCW_&I_i2rm5DevDWF6nVJEu$r(Gy$4m3QXlck9AP
zAru+93XZ;0rxYWFoZJ6W>sd_Seeu8x=)gE3r*<#NO*egQ8QEe}jd4PT_P&B!&~Me-
za;t<<LMSqHrm9j3eH)b+CFD~LDP$+CkP1*_^t7(QZ751;C`J{=2ssj8g;yL^*w-;e
zNUsOcQQ$ySUA<+Dke*l;UeOa(_uIw}oir;}h|e%a$WpGZi@}sY!}F>zMu<BTNab0w
zLbfxr7KK+#i&;fg7$an2F%GY=LdrmSe0tg4MF|9@N|lQtjA~{5y3hu<xwFs?l^7-D
z&O(Q)l{@{G6|w`D=iY)_j6L72`~)yg2<3BHvZI@a>9~wY)fm}Rzy9AItra{)#n*Ft
zp#x)wPKN*4hndv~RP#6!#f883EA5>ZW2_J=urHpxtu%d61x_+_HXOVgZ*U1pUyntk
z&{EQR=i5oZ_4zJ5T+-jH*0PkegJp0u{3nitpQ5+rnfUw7Y~EbH6KNj9MD{&AT0ew2
zu6@1iCZ~3%@lofp<0)5aAWWoVxbvz*TZ$@0sgS;wrx=Pokgrae&K<&7=9qkS3pxKD
zT|-~ns+{fX2)!<Xbe`eaT3FOQQB1A0;+Y2nmP&*i486j|_|G+oC}m>(eSEue($$FZ
zBMl2V75M|_V)ta4Qo-2jF}VemhGKH4^?}?}Lf=PnuV)4kMCz`oE{PPST1J60(ckfX
z`wz;Zu9>J=2o=)R_FFPl>7=J+9#`9L1x`v$La6e-A_}RI%DWbVD8;dmf{b2KNNy4|
zDUO8nhUTRVlHvtHlCq-^sw=LvdncnnP^459LaiNYP5Gq|f*_@$5Ngt%i`|9aFkMPn
zAtXXqA43HuOW7i%(8r)u<#$Y#vMI#vK86ZRlp=+A)yGhQX;MO7_c2spk`%T$bD5iR
zcFpAW<ICl<az?UQ37M3CO^6iZR-H7v6eE`bHM10B*JU-U6r(TtY(^=@UxnLjQUY;V
zbTdf_%ysI`A|+5a4rm4`fxDA~-=zfd)*61664-m4_*F`vZ$9HgDXGBU4aiSY=-KRn
z7ee?&3g`JJR>%f^kirm}vO<dRfs~{bQi6w4QuJ_1E2IqGNMZ89_f|*++?K*Pze%rF
zNEKX^lHC3*TuWKpkis}d3;R}x1N2H^H;Nx}Z-qESj}$hW<1M4bN34(<P%eezd@{ji
ziw{{LHKIxi7xl)yM0mXPxD`?djY=UI_Y;wka_?CobyBaCYBC5bqycJ_k`m3^6V+r8
zR!D<5ks{_fk~tnu6gO`xVTCB5k`xj_QE|6Fa-y^~RSCxb`pWpHMY{!EpK@XOY-*9m
z$7yWJNko)lg)~M=6k!UCO(CCuBJz!B#^$Ej;gJ;T<bMJ3q~G?jZnFRY002ovPDHLk
FV1gqn4#EHc

literal 0
HcmV?d00001

diff --git a/skills/imagegen/references/cli.md b/skills/imagegen/references/cli.md
new file mode 100644
index 0000000..f4a5a63
--- /dev/null
+++ b/skills/imagegen/references/cli.md
@@ -0,0 +1,242 @@
+# CLI reference (`scripts/image_gen.py`)
+
+This file is for the fallback CLI mode only. Read it when the user explicitly asks to use `scripts/image_gen.py` / CLI / API / model controls, or after the user explicitly confirms that a transparent-output request should use the `gpt-image-1.5` true-transparency fallback path.
+
+`generate-batch` is a CLI subcommand in this fallback path. It is not a top-level mode of the skill.
+The word `batch` in a user request is not CLI opt-in by itself.
+
+## What this CLI does
+- `generate`: generate a new image from a prompt
+- `edit`: edit one or more existing images
+- `generate-batch`: run many generation jobs from a JSONL file after the user explicitly chooses CLI/API/model controls
+
+Real API calls require **network access** + `OPENAI_API_KEY`. `--dry-run` does not.
+
+## Quick start (works from any repo)
+Set a stable path to the skill CLI (default `CODEX_HOME` is `~/.codex`):
+
+```bash
+export CODEX_HOME="${CODEX_HOME:-$HOME/.codex}"
+export IMAGE_GEN="$CODEX_HOME/skills/.system/imagegen/scripts/image_gen.py"
+```
+
+Install dependencies into your active Python environment using that environment's package manager. In uv-managed environments, `uv pip install ...` remains the preferred path.
+
+## Quick start
+
+Dry-run (no API call; no network required; does not require the `openai` package):
+
+```bash
+python "$IMAGE_GEN" generate \
+  --prompt "Test" \
+  --out output/imagegen/test.png \
+  --dry-run
+```
+
+Notes:
+- One-off dry-runs print the API payload and the computed output path(s).
+- Repo-local finals should live under `output/imagegen/`.
+
+Generate (requires `OPENAI_API_KEY` + network):
+
+```bash
+python "$IMAGE_GEN" generate \
+  --prompt "A cozy alpine cabin at dawn" \
+  --size 1024x1024 \
+  --out output/imagegen/alpine-cabin.png
+```
+
+Edit:
+
+```bash
+python "$IMAGE_GEN" edit \
+  --image input.png \
+  --prompt "Replace only the background with a warm sunset" \
+  --out output/imagegen/sunset-edit.png
+```
+
+## Guardrails
+- Use the bundled CLI directly (`python "$IMAGE_GEN" ...`) after activating the correct environment.
+- Do **not** create one-off runners (for example `gen_images.py`) unless the user explicitly asks for a custom wrapper.
+- **Never modify** `scripts/image_gen.py`. If something is missing, ask the user before doing anything else.
+- Do not silently downgrade from CLI `gpt-image-2` or built-in `image_gen` to CLI `gpt-image-1.5`; ask first unless the user already explicitly requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback.
+
+## Defaults
+- Model: `gpt-image-2`
+- Supported model family for this CLI: GPT Image models (`gpt-image-*`)
+- Size: `auto`
+- Quality: `medium`
+- Output format: `png`
+- Default one-off output path: `output/imagegen/output.png`
+- Background: unspecified unless `--background` is set
+
+## gpt-image-2 size and model guidance
+
+`gpt-image-2` is the default model for new CLI fallback work.
+
+- Use `--quality low` for fast drafts, thumbnails, and quick iterations.
+- Use `--quality medium`, `--quality high`, or `--quality auto` for final assets, dense text, diagrams, identity-sensitive edits, and high-resolution outputs.
+- Square images are typically fastest. Use `--size 1024x1024` for quick square drafts.
+- If the user asks for 4K-style output, use `--size 3840x2160` for landscape or `--size 2160x3840` for portrait.
+- Do not pass `--input-fidelity` with `gpt-image-2`; this model always uses high fidelity for image inputs.
+- Do not use `--background transparent` with `gpt-image-2`; the default transparent-image workflow uses built-in `image_gen` on a flat chroma-key background plus local removal. Use `gpt-image-1.5` only after the user explicitly confirms the true-transparent CLI fallback, unless they already requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback.
+
+Popular `gpt-image-2` sizes:
+- `1024x1024`
+- `1536x1024`
+- `1024x1536`
+- `2048x2048`
+- `2048x1152`
+- `3840x2160`
+- `2160x3840`
+- `auto`
+
+`gpt-image-2` size constraints:
+- max edge `<= 3840px`
+- both edges multiples of `16px`
+- long edge to short edge ratio `<= 3:1`
+- total pixels between `655,360` and `8,294,400`
+- outputs with more total pixels than `2560x1440` (3,686,400 pixels) are experimental
+
+Fast draft:
+
+```bash
+python "$IMAGE_GEN" generate \
+  --prompt "A product thumbnail of a matte ceramic mug on a stone surface" \
+  --quality low \
+  --size 1024x1024 \
+  --out output/imagegen/mug-draft.png
+```
+
+Final 2K landscape:
+
+```bash
+python "$IMAGE_GEN" generate \
+  --prompt "A polished landing-page hero image of a matte ceramic mug on a stone surface" \
+  --quality high \
+  --size 2048x1152 \
+  --out output/imagegen/mug-hero.png
+```
+
+4K landscape:
+
+```bash
+python "$IMAGE_GEN" generate \
+  --prompt "A detailed architectural visualization at golden hour" \
+  --size 3840x2160 \
+  --quality high \
+  --out output/imagegen/architecture-4k.png
+```
+
+True transparent fallback request:
+
+Ask for confirmation before using this command unless the user already explicitly requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback.
+
+```bash
+python "$IMAGE_GEN" generate \
+  --model gpt-image-1.5 \
+  --prompt "A clean product cutout on a transparent background" \
+  --background transparent \
+  --output-format png \
+  --out output/imagegen/product-cutout.png
+```
+
+When using this path, explain briefly that built-in `image_gen` plus chroma-key removal is the default transparent-image path, but this request needs true model-native transparency. `gpt-image-2` does not support `background=transparent`, so `gpt-image-1.5` is required for this confirmed fallback.
+
+## Quality, input fidelity, and masks (CLI fallback only)
+These are explicit CLI controls. They are not built-in `image_gen` tool arguments.
+
+- `--quality` works for `generate`, `edit`, and `generate-batch`: `low|medium|high|auto`
+- `--input-fidelity` is **edit-only** and validated as `low|high`; it is not supported for `gpt-image-2`
+- `--mask` is **edit-only**
+
+Example:
+
+```bash
+python "$IMAGE_GEN" edit \
+  --model gpt-image-1.5 \
+  --image input.png \
+  --prompt "Change only the background" \
+  --quality high \
+  --input-fidelity high \
+  --out output/imagegen/background-edit.png
+```
+
+Mask notes:
+- For multi-image edits, pass repeated `--image` flags. Their order is meaningful, so describe each image by index and role in the prompt.
+- The CLI accepts a single `--mask`.
+- Image and mask must be the same size and format and each under 50MB.
+- Masks must include an alpha channel.
+- If multiple input images are provided, the mask applies to the first image.
+- Masking is prompt-guided; do not promise exact pixel-perfect mask boundaries.
+- Use a PNG mask when possible; the script treats mask handling as best-effort and does not perform full preflight validation beyond file checks/warnings.
+- In the edit prompt, repeat invariants (`change only the background; keep the subject unchanged`) to reduce drift.
+
+## Output handling
+- Use `tmp/imagegen/` for temporary JSONL inputs or scratch files.
+- Use `output/imagegen/` for final outputs.
+- Reruns fail if a target file already exists unless you pass `--force`.
+- `--out-dir` changes one-off naming to `image_1.<ext>`, `image_2.<ext>`, and so on.
+- Downscaled copies use the default suffix `-web` unless you override it.
+
+## Common recipes
+
+Generate with augmentation fields:
+
+```bash
+python "$IMAGE_GEN" generate \
+  --prompt "A minimal hero image of a ceramic coffee mug" \
+  --use-case "product-mockup" \
+  --style "clean product photography" \
+  --composition "wide product shot with usable negative space for page copy" \
+  --constraints "no logos, no text" \
+  --out output/imagegen/mug-hero.png
+```
+
+Generate + also write a downscaled copy for fast web loading:
+
+```bash
+python "$IMAGE_GEN" generate \
+  --prompt "A cozy alpine cabin at dawn" \
+  --size 1024x1024 \
+  --downscale-max-dim 1024 \
+  --out output/imagegen/alpine-cabin.png
+```
+
+Generate multiple prompts concurrently (async batch):
+
+```bash
+mkdir -p tmp/imagegen output/imagegen/batch
+cat > tmp/imagegen/prompts.jsonl << 'EOF'
+{"prompt":"Cavernous hangar interior with a compact shuttle parked near the center","use_case":"stylized-concept","composition":"wide-angle, low-angle","lighting":"volumetric light rays through drifting fog","constraints":"no logos or trademarks; no watermark","size":"1536x1024"}
+{"prompt":"Gray wolf in profile in a snowy forest","use_case":"photorealistic-natural","composition":"eye-level","constraints":"no logos or trademarks; no watermark","size":"1024x1024"}
+EOF
+
+python "$IMAGE_GEN" generate-batch \
+  --input tmp/imagegen/prompts.jsonl \
+  --out-dir output/imagegen/batch \
+  --concurrency 5
+
+rm -f tmp/imagegen/prompts.jsonl
+```
+
+Notes:
+- `generate-batch` requires `--out-dir`.
+- `--input` takes a JSONL file with one job (a JSON object) per line, as in the example above.
+- Use `--concurrency` to control parallelism (default `5`).
+- Per-job overrides are supported in JSONL (for example `size`, `quality`, `background`, `output_format`, `output_compression`, `moderation`, `n`, `model`, `out`, and prompt-augmentation fields).
+- `--n` generates multiple variants for a single prompt; `generate-batch` is for many different prompts.
+- In batch mode, per-job `out` is treated as a filename under `--out-dir`.
+- For many requested deliverable assets, provide one prompt/job per distinct asset and use semantic filenames when possible.
+
+## CLI notes
+- Supported sizes depend on the model. `gpt-image-2` supports flexible constrained sizes; older GPT Image models support `1024x1024`, `1536x1024`, `1024x1536`, or `auto`.
+- True transparent CLI outputs require `output_format` to be `png` or `webp` and are not supported by `gpt-image-2`.
+- `--prompt-file`, `--output-compression`, `--moderation`, `--max-attempts`, `--fail-fast`, `--force`, and `--no-augment` are supported.
+- This CLI is intended for GPT Image models. Do not assume older non-GPT image-model behavior applies here.
+
+## See also
+- API parameter quick reference for fallback CLI mode: `references/image-api.md`
+- Prompt examples shared across both top-level modes: `references/sample-prompts.md`
+- Network/sandbox notes for fallback CLI mode: `references/codex-network.md`
+- Built-in-first transparent image workflow: `SKILL.md` and `$CODEX_HOME/skills/.system/imagegen/scripts/remove_chroma_key.py`
diff --git a/skills/imagegen/references/codex-network.md b/skills/imagegen/references/codex-network.md
new file mode 100644
index 0000000..5ce1fbc
--- /dev/null
+++ b/skills/imagegen/references/codex-network.md
@@ -0,0 +1,33 @@
+# Codex network approvals / sandbox notes
+
+This file is for the fallback CLI mode only. Read it when the user explicitly asks to use `scripts/image_gen.py` / CLI / API / model controls, or after the user explicitly confirms that a transparent-output request should use the `gpt-image-1.5` true-transparency fallback path.
+
+This guidance is intentionally isolated from `SKILL.md` because it can vary by environment and may become stale. Prefer the defaults in your environment when in doubt.
+
+## Why am I asked to approve image generation calls?
+The fallback CLI uses the OpenAI Image API, so it needs outbound network access. In many Codex setups, network access is disabled by default and/or the approval policy requires confirmation before networked commands run.
+
+## Important note about approvals vs network
+- `--ask-for-approval never` suppresses approval prompts.
+- It does **not** by itself enable network access.
+- In `workspace-write`, network access still depends on your Codex configuration (for example `[sandbox_workspace_write] network_access = true`).
+
+## How do I reduce repeated approval prompts?
+If you trust the repo and want fewer prompts, use a configuration or profile that both:
+- enables network for the sandbox mode you plan to use
+- sets an approval policy that matches your risk tolerance
+
+Example `~/.codex/config.toml` pattern:
+
+```toml
+approval_policy = "on-request"
+sandbox_mode = "workspace-write"
+
+[sandbox_workspace_write]
+network_access = true
+```
+
+If you want quieter automation after network is enabled, you can choose an approval policy that prompts less often (for example `--ask-for-approval never`), but do that intentionally and with care.
+
+## Safety note
+Enabling network and reducing approvals lowers friction, but increases risk if you run untrusted code or work in an untrusted repository.
diff --git a/skills/imagegen/references/image-api.md b/skills/imagegen/references/image-api.md
new file mode 100644
index 0000000..db8567d
--- /dev/null
+++ b/skills/imagegen/references/image-api.md
@@ -0,0 +1,90 @@
+# Image API quick reference
+
+This file is for the fallback CLI mode only. Use it when the user explicitly asks to use `scripts/image_gen.py` / CLI / API / model controls, or after the user explicitly confirms that a transparent-output request should use the `gpt-image-1.5` true-transparency fallback path.
+
+These parameters describe the Image API and bundled CLI fallback surface. Do not assume they are normal arguments on the built-in `image_gen` tool.
+
+## Scope
+- This fallback CLI is intended for GPT Image models (`gpt-image-2`, `gpt-image-1.5`, `gpt-image-1`, and `gpt-image-1-mini`).
+- The built-in `image_gen` tool and the fallback CLI do not expose the same controls.
+
+## Model summary
+
+| Model | Quality | Input fidelity | Resolutions | Recommended use |
+| --- | --- | --- | --- | --- |
+| `gpt-image-2` | `low`, `medium`, `high`, `auto` | Always high fidelity for image inputs; do not set `input_fidelity` | `auto` or flexible sizes that satisfy the constraints below | Default for new CLI/API workflows: high-quality generation and editing, text-heavy images, photorealism, compositing, identity-sensitive edits, and workflows where fewer retries matter |
+| `gpt-image-1.5` | `low`, `medium`, `high`, `auto` | `low`, `high` | `1024x1024`, `1024x1536`, `1536x1024`, `auto` | True transparent-background fallback and backward-compatible workflows |
+| `gpt-image-1` | `low`, `medium`, `high`, `auto` | `low`, `high` | `1024x1024`, `1024x1536`, `1536x1024`, `auto` | Legacy compatibility |
+| `gpt-image-1-mini` | `low`, `medium`, `high`, `auto` | `low`, `high` | `1024x1024`, `1024x1536`, `1536x1024`, `auto` | Cost-sensitive draft batches and lower-stakes previews |
+
+## gpt-image-2 sizes
+
+`gpt-image-2` accepts `auto` or any `WIDTHxHEIGHT` size that satisfies all constraints:
+
+- Maximum edge length must be less than or equal to `3840px`.
+- Both edges must be multiples of `16px`.
+- Long edge to short edge ratio must not exceed `3:1`.
+- Total pixels must be at least `655,360` and no more than `8,294,400`.
+
+Popular sizes:
+
+| Label | Size | Notes |
+| --- | --- | --- |
+| Square | `1024x1024` | Typical fast default |
+| Landscape | `1536x1024` | Standard landscape |
+| Portrait | `1024x1536` | Standard portrait |
+| 2K square | `2048x2048` | Larger square output |
+| 2K landscape | `2048x1152` | Widescreen output |
+| 4K landscape | `3840x2160` | Widescreen 4K output |
+| 4K portrait | `2160x3840` | Vertical 4K output |
+| Auto | `auto` | Default size |
+
+Square images are typically fastest to generate. For 4K-style output, use `3840x2160` or `2160x3840`.
+
+## Endpoints
+- Generate: `POST /v1/images/generations` (`client.images.generate(...)`)
+- Edit: `POST /v1/images/edits` (`client.images.edit(...)`)
+
+## Core parameters for GPT Image models
+- `prompt`: text prompt
+- `model`: image model
+- `n`: number of images (1-10)
+- `size`: `auto` by default for `gpt-image-2`; flexible `WIDTHxHEIGHT` sizes are allowed only for `gpt-image-2`; older GPT Image models use `1024x1024`, `1536x1024`, `1024x1536`, or `auto`
+- `quality`: `low`, `medium`, `high`, or `auto`
+- `background`: output transparency behavior (`transparent`, `opaque`, or `auto`) for generated output; this is not the same thing as the prompt's visual scene/backdrop
+- `output_format`: `png` (default), `jpeg`, `webp`
+- `output_compression`: 0-100 (jpeg/webp only)
+- `moderation`: `auto` (default) or `low`
+
+## Edit-specific parameters
+- `image`: one or more input images. For GPT Image models, you can provide up to 16 images.
+- `mask`: optional mask image
+- `input_fidelity`: `low` or `high` only for models that support it; do not set this for `gpt-image-2`
+
+Model-specific note for `input_fidelity`:
+- `gpt-image-2` always uses high fidelity for image inputs and does not support setting `input_fidelity`.
+- `gpt-image-1` and `gpt-image-1-mini` preserve all input images, but the first image gets richer textures and finer details.
+- `gpt-image-1.5` preserves the first 5 input images with higher fidelity.
+
+## Transparent backgrounds
+
+`gpt-image-2` does not currently support the Image API `background=transparent` parameter. The skill's default transparent-image path is built-in `image_gen` with a flat chroma-key background, followed by local alpha extraction with `python "${CODEX_HOME:-$HOME/.codex}/skills/.system/imagegen/scripts/remove_chroma_key.py"`.
+
+Use CLI `gpt-image-1.5` with `background=transparent` and a transparent-capable output format such as `png` or `webp` only after the user explicitly confirms that fallback, unless they already requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback. If the user asks for true/native transparency, the subject is too complex for clean chroma-key removal, or local background removal fails validation, explain the tradeoff and ask before switching.
+
+## Output
+- `data[]` list with `b64_json` per image
+- The bundled `scripts/image_gen.py` CLI decodes `b64_json` and writes output files for you.
+
+## Limits and notes
+- Input images and masks must be under 50MB.
+- Use the edits endpoint when the user requests changes to an existing image.
+- Masking is prompt-guided; exact shapes are not guaranteed.
+- Large sizes and high quality increase latency and cost.
+- Use `quality=low` for fast drafts, thumbnails, and quick iterations. Use `medium` or `high` for final assets, dense text, diagrams, identity-sensitive edits, or high-resolution outputs.
+- High `input_fidelity` can materially increase input token usage on models that support it.
+- If a request fails because a specific option is unsupported by the selected GPT Image model, retry manually without that option only when the option is not required by the user. If true transparent CLI output is required, ask before switching to `gpt-image-1.5` instead of dropping `background=transparent`, unless the user already explicitly chose that fallback.
+
+## Important boundary
+- `quality`, `input_fidelity`, explicit masks, `background`, `output_format`, and related parameters are fallback-only execution controls.
+- Do not assume they are built-in `image_gen` tool arguments.
diff --git a/skills/imagegen/references/prompting.md b/skills/imagegen/references/prompting.md
new file mode 100644
index 0000000..9d2da42
--- /dev/null
+++ b/skills/imagegen/references/prompting.md
@@ -0,0 +1,118 @@
+# Prompting best practices
+
+These prompting principles are shared by both top-level modes of the skill:
+- built-in `image_gen` tool (default)
+- explicit `scripts/image_gen.py` CLI fallback
+
+This file is about prompt structure, specificity, and iteration. Fallback-only execution controls such as `quality`, `input_fidelity`, masks, output format, and output paths live in the fallback docs.
+
+## Contents
+- [Structure](#structure)
+- [Specificity policy](#specificity-policy)
+- [Allowed and disallowed augmentation](#allowed-and-disallowed-augmentation)
+- [Composition and layout](#composition-and-layout)
+- [Constraints and invariants](#constraints-and-invariants)
+- [Text in images](#text-in-images)
+- [Input images and references](#input-images-and-references)
+- [Iterate deliberately](#iterate-deliberately)
+- [Transparent images](#transparent-images)
+- [Fallback-only execution controls](#fallback-only-execution-controls)
+- [Use-case tips](#use-case-tips)
+- [Where to find copy/paste recipes](#where-to-find-copypaste-recipes)
+
+## Structure
+- Use a consistent order: scene/backdrop -> subject -> key details -> constraints -> output intent.
+- Include intended use (ad, UI mock, infographic) to set the level of polish.
+- For complex requests, use short labeled lines instead of one long paragraph.
+
+## Specificity policy
+- If the user prompt is already specific and detailed, normalize it into a clean spec without adding creative requirements.
+- If the prompt is generic, you may add tasteful detail when it materially improves the output.
+- Treat examples in `sample-prompts.md` as fully-authored recipes, not as the default amount of augmentation to add to every request.
+- For photorealism, include `photorealistic` directly when that is the goal, plus concrete real-world texture such as pores, wrinkles, fabric wear, material grain, or imperfect everyday detail.
+
+## Allowed and disallowed augmentation
+
+Allowed augmentation for generic prompts:
+- composition and framing cues
+- intended-use or polish-level hints
+- practical layout guidance
+- reasonable scene concreteness that supports the request
+
+Do not add:
+- extra characters, props, or objects that are not implied
+- brand palettes, slogans, or story beats that are not implied
+- arbitrary side-specific placement unless the surrounding layout supports it
+
+## Composition and layout
+- Specify framing and viewpoint (close-up, wide, top-down) and placement only when it materially helps.
+- Call out negative space if the asset clearly needs room for UI or copy.
+- Avoid making left/right layout decisions unless the user or surrounding layout supports them.
+- For people, describe body framing, scale, gaze, and object interactions when they matter (`full body visible`, `looking down at the book`, `hands naturally gripping the handlebars`).
+
+## Constraints and invariants
+- State what must not change (`keep background unchanged`).
+- For edits, say `change only X; keep Y unchanged` and repeat invariants on every iteration to reduce drift.
+
+## Text in images
+- Put literal text in quotes or ALL CAPS and specify typography (font style, size, color, placement).
+- Spell uncommon words letter-by-letter if accuracy matters.
+- For in-image copy, require verbatim rendering and no extra characters.
+- In CLI fallback mode, use `medium` or `high` quality for small text, dense infographics, data-heavy slides, multi-font layouts, legends, axes, and footnotes.
+
+## Input images and references
+- Do not assume that every provided image is an edit target.
+- Label each image by index and role (`Image 1: edit target`, `Image 2: style reference`).
+- If the user provides images for style, composition, or mood guidance and does not ask to modify them, treat the request as generation with references.
+- If the user asks to preserve an existing image while changing specific parts, treat the request as an edit.
+- For compositing, describe how the images interact (`place the subject from Image 2 into Image 1`).
+
+## Iterate deliberately
+- Start with a clean base prompt, then make small single-change edits.
+- Re-specify critical constraints when you iterate.
+- Prefer one targeted follow-up at a time over rewriting the whole prompt.
+
+## Transparent images
+- Use built-in `image_gen` first for transparent-image requests. If the subject is clearly too complex for chroma-key removal, explain the fallback and ask before switching to CLI.
+- Prompt for a perfectly flat solid chroma-key background, usually `#00ff00`; use `#ff00ff` when the subject is green, and avoid key colors that appear in the subject.
+- Explicitly prohibit shadows, gradients, floor planes, reflections, texture, and lighting variation in the background.
+- Ask for crisp edges, generous padding, and no use of the key color inside the subject.
+- After generation, remove the background locally with `python "${CODEX_HOME:-$HOME/.codex}/skills/.system/imagegen/scripts/remove_chroma_key.py" --input <source> --out <final.png> --auto-key border --soft-matte --transparent-threshold 12 --opaque-threshold 220 --despill` and validate the alpha result before shipping it.
+- Use soft matte and despill for antialiased edges; hard tolerance-only removal is mainly for flat pixel-art or exact-color fixtures.
+- Use CLI `gpt-image-1.5 --background transparent --output-format png` only after the user explicitly confirms the fallback, or when the user already explicitly requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback. Ask first for true/native transparency requests, failed chroma-key validation, or complex transparent subjects such as hair, fur, glass, smoke, liquids, translucent materials, reflective objects, or soft shadows.
+
+## Fallback-only execution controls
+- `quality`, `input_fidelity`, explicit masks, output format, and output paths are fallback-only execution controls.
+- Do not assume they are built-in `image_gen` tool arguments.
+- If the user explicitly chooses CLI fallback, see `references/cli.md` and `references/image-api.md` for those controls.
+- In CLI fallback mode, `gpt-image-2` is the default. It supports `quality=low|medium|high|auto`; use `low` for fast drafts and thumbnails, and move to `medium`, `high`, or `auto` for final assets.
+- `gpt-image-2` always uses high fidelity for image inputs, so do not set `input_fidelity` with that model.
+- If a transparent request needs true CLI transparency, ask before using `gpt-image-1.5` unless the user already explicitly chose it. Explain that built-in chroma-key removal is the default path, but `gpt-image-2` does not support `background=transparent`.
+- If the user asks for 4K-style output with `gpt-image-2`, use `3840x2160` for landscape or `2160x3840` for portrait.
+
+## Use-case tips
+Generate:
+- photorealistic-natural: Prompt as if a real photo is captured in the moment; use photography language (lens, lighting, framing); call for real texture; avoid over-stylized polish unless requested.
+- product-mockup: Describe the product/packaging and materials; ensure clean silhouette and label clarity; if in-image text is needed, require verbatim rendering and specify typography.
+- ui-mockup: Describe the target fidelity first (shippable mockup or low-fi wireframe), then focus on layout, hierarchy, and practical UI elements; avoid concept-art language.
+- infographic-diagram: Define the audience and layout flow; label parts explicitly; require verbatim text; prefer higher quality in CLI mode for dense labels.
+- logo-brand: Keep it simple and scalable; ask for a strong silhouette and balanced negative space; avoid decorative flourishes unless requested.
+- ads-marketing: Write like a creative brief; include brand positioning, audience, desired vibe, scene, and exact tagline if text must appear.
+- productivity-visual: Name the exact artifact (slide, chart, workflow diagram), define the canvas and hierarchy, provide real labels/data, and ask for readable typography and polished spacing.
+- scientific-educational: Define audience, lesson objective, required labels, scientific constraints, arrows, and scan-friendly whitespace.
+- illustration-story: Define panels or scene beats; keep each action concrete.
+- stylized-concept: Specify style cues, material finish, and rendering approach (3D, painterly, clay) without inventing new story elements.
+- historical-scene: State the location/date and required period accuracy; constrain clothing, props, and environment to match the era.
+
+Edit:
+- text-localization: Change only the text; preserve layout, typography, spacing, and hierarchy; no extra words or reflow unless needed.
+- identity-preserve: Lock identity (face, body, pose, hair, expression); change only the specified elements; match lighting and shadows.
+- precise-object-edit: Specify exactly what to remove/replace; preserve surrounding texture and lighting; keep everything else unchanged.
+- lighting-weather: Change only environmental conditions (light, shadows, atmosphere, precipitation); keep geometry, framing, and subject identity.
+- background-extraction: For simple opaque subjects, request a clean cutout on a perfectly flat chroma-key background; crisp silhouette; generous padding; no shadows; no halos; preserve label text exactly; no restyling. Ask before using true CLI transparency for complex subjects.
+- style-transfer: Specify style cues to preserve (palette, texture, brushwork) and what must change; add `no extra elements` to prevent drift.
+- compositing: Reference inputs by index; specify what moves where; match lighting, perspective, and scale; keep the base framing unchanged.
+- sketch-to-render: Preserve layout, proportions, and perspective; choose materials and lighting that support the supplied sketch without adding new elements.
+
+## Where to find copy/paste recipes
+For copy/paste prompt specs (examples only), see `references/sample-prompts.md`. This file focuses on principles, specificity, and iteration patterns.
diff --git a/skills/imagegen/references/sample-prompts.md b/skills/imagegen/references/sample-prompts.md
new file mode 100644
index 0000000..d949295
--- /dev/null
+++ b/skills/imagegen/references/sample-prompts.md
@@ -0,0 +1,433 @@
+# Sample prompts (copy/paste)
+
+These prompt recipes are shared across both top-level modes of the skill:
+- built-in `image_gen` tool (default)
+- `scripts/image_gen.py` CLI fallback for explicit CLI/API/model requests or user-confirmed true-transparent-output fallback requests
+
+Use these as starting points. They are intentionally complete prompt recipes, not the default amount of augmentation to add to every user request.
+
+When adapting a user's prompt:
+- keep user-provided requirements
+- only add detail according to the specificity policy in `SKILL.md`
+- do not treat every example below as permission to invent extra story elements
+
+The labeled lines are prompt scaffolding, not a closed schema. `Asset type` and `Input images` are prompt-only scaffolding; the CLI does not expose them as dedicated flags.
+
+Execution details such as explicit CLI flags, `quality`, `input_fidelity`, masks, output formats, and local output paths depend on mode. Use the built-in tool by default, including simple transparent-image requests. For transparent images, prompt for a flat chroma-key background and remove it locally with `python "${CODEX_HOME:-$HOME/.codex}/skills/.system/imagegen/scripts/remove_chroma_key.py"`; only apply CLI-specific controls when the user explicitly opts into fallback mode or explicitly confirms that the transparent request should use true CLI transparency.
+
+CLI model notes:
+- `gpt-image-2` is the fallback CLI default for new workflows.
+- `gpt-image-2` supports `quality` values `low`, `medium`, `high`, and `auto`.
+- For 4K-style `gpt-image-2` output, use `3840x2160` or `2160x3840`.
+- If transparent output needs true CLI fallback, ask before using `gpt-image-1.5` unless the user already explicitly requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback. When asking, explain that built-in chroma-key removal is the default path and that `gpt-image-2` does not support `background=transparent`, so native transparency requires `gpt-image-1.5`.
+- Do not set `input_fidelity` with `gpt-image-2`; image inputs already use high fidelity.
+
+For prompting principles (structure, specificity, invariants, iteration), see `references/prompting.md`.
+
+## Generate
+
+### photorealistic-natural
+```
+Use case: photorealistic-natural
+Primary request: candid photo of an elderly sailor on a small fishing boat adjusting a net
+Scene/backdrop: coastal water with soft haze
+Subject: weathered skin with wrinkles and sun texture
+Style/medium: photorealistic candid photo
+Composition/framing: medium close-up, eye-level
+Lighting/mood: soft coastal daylight, shallow depth of field, subtle film grain
+Materials/textures: real skin texture, worn fabric, salt-worn wood
+Constraints: natural color balance; no heavy retouching; no glamorization; no watermark
+Avoid: studio polish; staged look
+```
+
+### product-mockup
+```
+Use case: product-mockup
+Primary request: premium product photo of a matte black shampoo bottle with a minimal label
+Scene/backdrop: clean studio gradient from light gray to white
+Subject: single bottle centered with subtle reflection
+Style/medium: premium product photography
+Composition/framing: centered, slight three-quarter angle, generous padding
+Lighting/mood: softbox lighting, clean highlights, controlled shadows
+Materials/textures: matte plastic, crisp label printing
+Constraints: no logos or trademarks; no watermark
+```
+
+### ui-mockup
+```
+Use case: ui-mockup
+Primary request: mobile app home screen for a local farmers market with vendors and daily specials
+Asset type: mobile app screen
+Style/medium: realistic product UI, not concept art
+Composition/framing: clean vertical mobile layout with clear hierarchy
+Constraints: practical layout, clear typography, no logos or trademarks, no watermark
+```
+
+### infographic-diagram
+```
+Use case: infographic-diagram
+Primary request: detailed infographic of an automatic coffee machine flow
+Scene/backdrop: clean, light neutral background
+Subject: bean hopper -> grinder -> brew group -> boiler -> water tank -> drip tray
+Style/medium: clean vector-like infographic with clear callouts and arrows
+Composition/framing: vertical poster layout, top-to-bottom flow
+Text (verbatim): "Bean Hopper", "Grinder", "Brew Group", "Boiler", "Water Tank", "Drip Tray"
+Constraints: clear labels, strong contrast, no logos or trademarks, no watermark
+```
+
+### scientific-educational
+```
+Use case: scientific-educational
+Primary request: biology diagram titled "Cellular Respiration at a Glance" for high school students
+Scene/backdrop: clean white classroom handout background
+Subject: glucose turns into energy inside a cell; include glycolysis, Krebs cycle, and electron transport chain
+Style/medium: flat scientific diagram with consistent icons, arrows, and readable labels
+Composition/framing: landscape slide-style layout with clear hierarchy and generous whitespace
+Text (verbatim): "Cellular Respiration at a Glance", "Glucose", "Pyruvate", "ATP", "NADH", "FADH2", "CO2", "O2", "H2O"
+Constraints: scientifically plausible; avoid tiny text; no extra decoration; no watermark
+```
+
+### logo-brand
+```
+Use case: logo-brand
+Primary request: original logo for "Field & Flour", a local bakery
+Style/medium: vector logo mark; flat colors; minimal
+Composition/framing: single centered logo on a plain background with generous padding
+Constraints: strong silhouette, balanced negative space; original design only; no gradients unless essential; no trademarks; no watermark
+```
+
+### illustration-story
+```
+Use case: illustration-story
+Primary request: 4-panel comic about a pet left alone at home
+Scene/backdrop: cozy living room across panels
+Subject: pet reacting to the owner leaving, then relaxing, then returning to a composed pose
+Style/medium: comic illustration with clear panels
+Composition/framing: 4 equal-sized vertical panels, readable actions per panel
+Constraints: no text; no logos or trademarks; no watermark
+```
+
+### stylized-concept
+```
+Use case: stylized-concept
+Primary request: cavernous hangar interior with tall support beams and drifting fog
+Scene/backdrop: industrial hangar interior, deep scale, light haze
+Subject: compact shuttle parked near the center
+Style/medium: cinematic concept art, industrial realism
+Composition/framing: wide-angle, low-angle
+Lighting/mood: volumetric light rays cutting through fog
+Constraints: no logos or trademarks; no watermark
+```
+
+### ads-marketing
+```
+Use case: ads-marketing
+Primary request: campaign image for a streetwear brand called Thread
+Subject: group of friends hanging out together in a stylish urban setting
+Style/medium: polished youth streetwear campaign photography
+Composition/framing: vertical ad layout with natural poses and integrated headline space
+Lighting/mood: contemporary, energetic, tasteful
+Text (verbatim): "Yours to Create."
+Constraints: render the tagline exactly once; clean legible typography; no extra text; no watermarks; no unrelated logos
+```
+
+### productivity-visual
+```
+Use case: productivity-visual
+Primary request: one pitch-deck slide titled "Market Opportunity"
+Asset type: fundraising slide image
+Style/medium: clean modern deck slide, white background, crisp sans-serif typography
+Subject: TAM/SAM/SOM concentric-circle diagram plus a small growth bar chart from 2021 to 2026
+Composition/framing: 16:9 landscape slide, clear data hierarchy, polished spacing
+Text (verbatim): "Market Opportunity", "TAM: $42B", "SAM: $8.7B", "SOM: $340M", "AGI Research, 2024", "Internal analysis"
+Constraints: readable labels, no clip art, no stock photography, no decorative clutter, no watermark
+```
+
+### historical-scene
+```
+Use case: historical-scene
+Primary request: outdoor crowd scene in Bethel, New York on August 16, 1969
+Scene/backdrop: open field with period-appropriate staging
+Subject: crowd in period-accurate clothing, authentic environment
+Style/medium: photorealistic photo
+Composition/framing: wide shot, eye-level
+Constraints: period-accurate details; no modern objects; no logos or trademarks; no watermark
+```
+
+## Asset type templates (taxonomy-aligned)
+
+### Website assets template
+```
+Use case: <photorealistic-natural|stylized-concept|product-mockup|infographic-diagram|ui-mockup>
+Asset type: <hero image / section illustration / blog header>
+Primary request: <short description>
+Scene/backdrop: <environment or abstract backdrop>
+Subject: <main subject>
+Style/medium: <photo/illustration/3D>
+Composition/framing: <wide/centered; note usable negative space only if needed>
+Lighting/mood: <soft/bright/neutral>
+Color palette: <brand colors or neutral>
+Constraints: <no text; no logos; no watermark; leave room for UI if needed>
+```
+
+### Website assets example: minimal hero background
+```
+Use case: stylized-concept
+Asset type: landing page hero background
+Primary request: minimal abstract background with a soft gradient and subtle texture
+Style/medium: matte illustration / soft-rendered abstract background
+Composition/framing: wide composition with usable negative space for page copy
+Lighting/mood: gentle studio glow
+Color palette: restrained neutral palette
+Constraints: no text; no logos; no watermark
+```
+
+### Website assets example: feature section illustration
+```
+Use case: stylized-concept
+Asset type: feature section illustration
+Primary request: simple abstract shapes suggesting connection and flow
+Scene/backdrop: subtle light-gray backdrop with faint texture
+Style/medium: flat illustration; soft shadows; restrained contrast
+Composition/framing: centered cluster; open margins for UI
+Color palette: muted neutral palette
+Constraints: no text; no logos; no watermark
+```
+
+### Website assets example: blog header image
+```
+Use case: photorealistic-natural
+Asset type: blog header image
+Primary request: overhead desk scene with notebook, pen, and coffee cup
+Scene/backdrop: warm wooden tabletop
+Style/medium: photorealistic photo
+Composition/framing: wide crop with clean room for page copy
+Lighting/mood: soft morning light
+Constraints: no text; no logos; no watermark
+```
+
+### Game assets template
+```
+Use case: stylized-concept
+Asset type: <game environment concept art / game character concept / game UI icon / tileable game texture>
+Primary request: <biome/scene/character/icon/material>
+Scene/backdrop: <location + set dressing> (if applicable)
+Subject: <main focal element(s)>
+Style/medium: <realistic/stylized>; <concept art / character render / UI icon / texture>
+Composition/framing: <wide/establishing/top-down>; <camera angle>; <focal point placement>
+Lighting/mood: <time of day>; <mood>; <volumetric/fog/etc>
+Constraints: no logos or trademarks; no watermark
+```
+
+### Game assets example: environment concept art
+```
+Use case: stylized-concept
+Asset type: game environment concept art
+Primary request: cavernous hangar interior with tall support beams and drifting fog
+Scene/backdrop: industrial hangar interior, deep scale, light haze
+Subject: compact shuttle parked near the center
+Style/medium: cinematic concept art, industrial realism
+Composition/framing: wide-angle, low-angle
+Lighting/mood: volumetric light rays cutting through fog
+Constraints: no logos or trademarks; no watermark
+```
+
+### Game assets example: character concept
+```
+Use case: stylized-concept
+Asset type: game character concept
+Primary request: desert scout character with layered travel gear
+Subject: long coat, satchel, practical travel clothing
+Style/medium: character render; stylized realism
+Composition/framing: neutral hero pose on a simple backdrop
+Constraints: no logos or trademarks; no watermark
+```
+
+### Game assets example: UI icon
+```
+Use case: stylized-concept
+Asset type: game UI icon
+Primary request: round shield icon with a subtle rune pattern
+Style/medium: painted game UI icon
+Composition/framing: centered icon; generous padding; clear silhouette
+Constraints: no text; no background scene elements; no logos or trademarks; no watermark
+```
+
+### Game assets example: tileable texture
+```
+Use case: stylized-concept
+Asset type: tileable game texture
+Primary request: worn sandstone blocks
+Style/medium: seamless tileable texture; PBR-ish look
+Scene/backdrop: neutral lighting reference only
+Constraints: seamless edges; no obvious focal elements; no text; no logos or trademarks; no watermark
+```
+
+### Wireframe template
+```
+Use case: ui-mockup
+Asset type: website wireframe
+Primary request: <page or flow to sketch>
+Style/medium: low-fi grayscale wireframe
+Composition/framing: <landscape or portrait to match expected device>
+Subject: <sections in order; grid/columns; key labels>
+Constraints: no color; no logos; no real photos; no watermark
+```
+
+### Wireframe example: homepage (desktop)
+```
+Use case: ui-mockup
+Asset type: website wireframe
+Primary request: SaaS homepage layout with clear hierarchy
+Style/medium: low-fi grayscale wireframe
+Subject: top nav; hero with headline and CTA; three feature cards; testimonial strip; pricing preview; footer
+Composition/framing: landscape desktop layout
+Constraints: label major blocks; no color; no logos; no real photos; no watermark
+```
+
+### Wireframe example: pricing page
+```
+Use case: ui-mockup
+Asset type: website wireframe
+Primary request: pricing page layout with comparison table
+Style/medium: low-fi grayscale wireframe
+Subject: header; plan toggle; 3 pricing cards; comparison table; FAQ accordion; footer
+Composition/framing: desktop or tablet layout
+Constraints: label key areas; no color; no logos; no real photos; no watermark
+```
+
+### Wireframe example: mobile onboarding flow
+```
+Use case: ui-mockup
+Asset type: mobile onboarding wireframe
+Primary request: three-screen mobile onboarding flow
+Style/medium: low-fi grayscale wireframe
+Subject: screen 1 headline and CTA; screen 2 feature bullets; screen 3 form fields and CTA
+Composition/framing: portrait mobile layout
+Constraints: label screens and blocks; no color; no logos; no real photos; no watermark
+```
+
+### Logo template
+```
+Use case: logo-brand
+Asset type: logo concept
+Primary request: <brand idea or symbol concept>
+Style/medium: vector logo mark; flat colors; minimal
+Composition/framing: centered mark; clear silhouette; generous margin
+Color palette: <1-2 colors; high contrast>
+Text (verbatim): "<exact name>" (only if needed)
+Constraints: no gradients; no mockups; no 3D; no watermark
+```
+
+### Logo example: abstract symbol mark
+```
+Use case: logo-brand
+Asset type: logo concept
+Primary request: geometric leaf symbol suggesting sustainability and growth
+Style/medium: vector logo mark; flat colors; minimal
+Composition/framing: centered mark; clear silhouette
+Color palette: deep green and off-white
+Constraints: no text unless requested; no gradients; no mockups; no 3D; no watermark
+```
+
+### Logo example: monogram mark
+```
+Use case: logo-brand
+Asset type: logo concept
+Primary request: interlocking monogram of the letters "AV"
+Style/medium: vector logo mark; flat colors; minimal
+Composition/framing: centered mark; balanced spacing
+Color palette: black on white
+Constraints: no gradients; no mockups; no 3D; no watermark
+```
+
+### Logo example: wordmark
+```
+Use case: logo-brand
+Asset type: logo concept
+Primary request: clean wordmark for a modern studio
+Style/medium: vector wordmark; flat colors; minimal
+Text (verbatim): "Studio North"
+Composition/framing: centered text; even letter spacing
+Constraints: no gradients; no mockups; no 3D; no watermark
+```
+
+## Edit
+
+### text-localization
+```
+Use case: text-localization
+Input images: Image 1: original infographic
+Primary request: replace "Bean Hopper", "Grinder", "Brew Group", "Boiler", "Water Tank", and "Drip Tray" with "Tolva", "Molino", "Grupo de infusión", "Caldera", "Depósito de agua", and "Bandeja de goteo"
+Constraints: change only the text; preserve layout, typography, spacing, and hierarchy; no extra words; do not alter logos or imagery
+```
+
+### identity-preserve
+```
+Use case: identity-preserve
+Input images: Image 1: person photo; Image 2..N: clothing references
+Primary request: replace only the clothing with the provided garments
+Constraints: preserve face, body shape, pose, hair, expression, and identity; match lighting and shadows; keep the background unchanged; no accessories or text
+```
+
+### precise-object-edit
+```
+Use case: precise-object-edit
+Input images: Image 1: room photo
+Primary request: replace only the white chairs with wooden chairs
+Constraints: preserve camera angle, room lighting, floor shadows, and surrounding objects; keep all other aspects unchanged
+```
+
+### lighting-weather
+```
+Use case: lighting-weather
+Input images: Image 1: original photo
+Primary request: make it look like a winter evening with gentle snowfall
+Constraints: preserve subject identity, geometry, camera angle, and composition; change only lighting, atmosphere, and weather
+```
+
+### background-extraction
+```
+Use case: background-extraction
+Input images: Image 1: product photo
+Primary request: isolate the product as a clean cutout on a flat chroma-key background for later background removal
+Scene/backdrop: perfectly flat solid #00ff00 chroma-key background for local background removal
+Constraints: background must be one uniform color with no shadows, gradients, texture, reflections, floor plane, or lighting variation; crisp silhouette; generous padding; no halos or fringing; preserve label text exactly; no restyling; do not use #00ff00 anywhere in the subject
+```
+
+Post-process note: after built-in generation, run `python "${CODEX_HOME:-$HOME/.codex}/skills/.system/imagegen/scripts/remove_chroma_key.py" --input <source> --out <final.png> --auto-key border --soft-matte --transparent-threshold 12 --opaque-threshold 220 --despill`. Ask before switching to the CLI fallback (`scripts/image_gen.py` with `--model gpt-image-1.5 --background transparent --output-format png`) for true/native transparency, failed chroma-key validation, or complex subjects such as hair, fur, glass, smoke, liquids, translucent materials, reflections, or soft shadows, unless the user already explicitly requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback.
+
+### style-transfer
+```
+Use case: style-transfer
+Input images: Image 1: style reference
+Primary request: apply Image 1's visual style to a man riding a motorcycle on a plain white backdrop
+Constraints: preserve palette, texture, and brushwork; no extra elements
+```
+
+### compositing
+```
+Use case: compositing
+Input images: Image 1: base scene; Image 2: subject to insert
+Primary request: place the subject from Image 2 next to the person in Image 1
+Constraints: match lighting, perspective, and scale; keep the base framing unchanged; no extra elements
+```
+
+### character consistency workflow
+```
+Use case: identity-preserve
+Input images: Image 1: previous character anchor illustration
+Primary request: continue the story with the same character in a new scene and action
+Scene/backdrop: snowy forest after a winter storm
+Subject: same young forest hero gently helping a frightened squirrel out of a fallen tree
+Style/medium: same children's book watercolor illustration style as Image 1
+Constraints: do not redesign the character; preserve facial features, proportions, outfit, color palette, and personality; no text; no watermark
+```
+
+### sketch-to-render
+```
+Use case: sketch-to-render
+Input images: Image 1: drawing
+Primary request: turn the drawing into a photorealistic image
+Constraints: preserve layout, proportions, and perspective; choose realistic materials and lighting; do not add new elements or text
+```
diff --git a/skills/imagegen/scripts/image_gen.py b/skills/imagegen/scripts/image_gen.py
new file mode 100644
index 0000000..9e0ea67
--- /dev/null
+++ b/skills/imagegen/scripts/image_gen.py
@@ -0,0 +1,995 @@
+#!/usr/bin/env python3
+"""Fallback CLI for explicit image generation or editing with GPT Image models.
+
+Used only when the user explicitly opts into CLI fallback mode, or when explicit
+transparent output requires the `gpt-image-1.5` fallback path.
+
+Defaults to gpt-image-2 and a structured prompt augmentation workflow.
+"""
+
+from __future__ import annotations
+
+import argparse
+import asyncio
+import base64
+import json
+import os
+from pathlib import Path
+import re
+import sys
+import time
+from typing import Any, Dict, Iterable, List, Optional, Tuple
+
+from io import BytesIO
+
+DEFAULT_MODEL = "gpt-image-2"
+DEFAULT_SIZE = "auto"
+DEFAULT_QUALITY = "medium"
+DEFAULT_OUTPUT_FORMAT = "png"
+DEFAULT_CONCURRENCY = 5
+DEFAULT_DOWNSCALE_SUFFIX = "-web"
+DEFAULT_OUTPUT_PATH = "output/imagegen/output.png"
+GPT_IMAGE_MODEL_PREFIX = "gpt-image-"
+
+ALLOWED_LEGACY_SIZES = {"1024x1024", "1536x1024", "1024x1536", "auto"}
+ALLOWED_QUALITIES = {"low", "medium", "high", "auto"}
+ALLOWED_BACKGROUNDS = {"transparent", "opaque", "auto", None}
+ALLOWED_INPUT_FIDELITIES = {"low", "high", None}
+
+GPT_IMAGE_2_MODEL = "gpt-image-2"
+GPT_IMAGE_2_MIN_PIXELS = 655_360
+GPT_IMAGE_2_MAX_PIXELS = 8_294_400
+GPT_IMAGE_2_MAX_EDGE = 3840
+GPT_IMAGE_2_MAX_RATIO = 3.0
+
+MAX_IMAGE_BYTES = 50 * 1024 * 1024
+MAX_BATCH_JOBS = 500
+
+
+def _die(message: str, code: int = 1) -> None:
+    print(f"Error: {message}", file=sys.stderr)
+    raise SystemExit(code)
+
+
+def _warn(message: str) -> None:
+    print(f"Warning: {message}", file=sys.stderr)
+
+
+def _dependency_hint(package: str, *, upgrade: bool = False) -> str:
+    command = f"uv pip install {'-U ' if upgrade else ''}{package}"
+    return (
+        "Activate the repo-selected environment first, then install it with "
+        f"`{command}`. If this repo uses a local virtualenv, start with "
+        "`source .venv/bin/activate`; otherwise use this repo's configured shared fallback "
+        "environment. If your project declares dependencies, prefer that project's normal "
+        "`uv sync` flow."
+    )
+
+
+def _ensure_api_key(dry_run: bool) -> None:
+    if os.getenv("OPENAI_API_KEY"):
+        print("OPENAI_API_KEY is set.", file=sys.stderr)
+        return
+    if dry_run:
+        _warn("OPENAI_API_KEY is not set; dry-run only.")
+        return
+    _die("OPENAI_API_KEY is not set. Export it before running.")
+
+
+def _read_prompt(prompt: Optional[str], prompt_file: Optional[str]) -> str:
+    if prompt and prompt_file:
+        _die("Use --prompt or --prompt-file, not both.")
+    if prompt_file:
+        path = Path(prompt_file)
+        if not path.exists():
+            _die(f"Prompt file not found: {path}")
+        return path.read_text(encoding="utf-8").strip()
+    if prompt:
+        return prompt.strip()
+    _die("Missing prompt. Use --prompt or --prompt-file.")
+    return ""  # unreachable
+
+
+def _check_image_paths(paths: Iterable[str]) -> List[Path]:
+    resolved: List[Path] = []
+    for raw in paths:
+        path = Path(raw)
+        if not path.exists():
+            _die(f"Image file not found: {path}")
+        if path.stat().st_size > MAX_IMAGE_BYTES:
+            _warn(f"Image exceeds 50MB limit: {path}")
+        resolved.append(path)
+    return resolved
+
+
+def _normalize_output_format(fmt: Optional[str]) -> str:
+    if not fmt:
+        return DEFAULT_OUTPUT_FORMAT
+    fmt = fmt.lower()
+    if fmt not in {"png", "jpeg", "jpg", "webp"}:
+        _die("output-format must be png, jpeg, jpg, or webp.")
+    return "jpeg" if fmt == "jpg" else fmt
+
+
+def _parse_size(size: str) -> Optional[Tuple[int, int]]:
+    match = re.fullmatch(r"([1-9][0-9]*)x([1-9][0-9]*)", size)
+    if not match:
+        return None
+    return int(match.group(1)), int(match.group(2))
+
+
+def _validate_gpt_image_2_size(size: str) -> None:
+    if size == "auto":
+        return
+
+    parsed = _parse_size(size)
+    if parsed is None:
+        _die("size must be auto or WIDTHxHEIGHT, for example 1024x1024.")
+
+    width, height = parsed
+    max_edge = max(width, height)
+    min_edge = min(width, height)
+    total_pixels = width * height
+
+    if max_edge > GPT_IMAGE_2_MAX_EDGE:
+        _die("gpt-image-2 size maximum edge length must be less than or equal to 3840px.")
+    if width % 16 != 0 or height % 16 != 0:
+        _die("gpt-image-2 size width and height must be multiples of 16px.")
+    if max_edge / min_edge > GPT_IMAGE_2_MAX_RATIO:
+        _die("gpt-image-2 size long edge to short edge ratio must not exceed 3:1.")
+    if total_pixels < GPT_IMAGE_2_MIN_PIXELS or total_pixels > GPT_IMAGE_2_MAX_PIXELS:
+        _die(
+            "gpt-image-2 size total pixels must be at least 655,360 and no more than 8,294,400."
+        )
+
+
+def _validate_size(size: str, model: str) -> None:
+    if model == GPT_IMAGE_2_MODEL:
+        _validate_gpt_image_2_size(size)
+        return
+
+    if size not in ALLOWED_LEGACY_SIZES:
+        _die(
+            "size must be one of 1024x1024, 1536x1024, 1024x1536, or auto for this GPT Image model."
+        )
+
+
+def _validate_quality(quality: str) -> None:
+    if quality not in ALLOWED_QUALITIES:
+        _die("quality must be one of low, medium, high, or auto.")
+
+
+def _validate_background(background: Optional[str]) -> None:
+    if background not in ALLOWED_BACKGROUNDS:
+        _die("background must be one of transparent, opaque, or auto.")
+
+
+def _validate_input_fidelity(input_fidelity: Optional[str]) -> None:
+    if input_fidelity not in ALLOWED_INPUT_FIDELITIES:
+        _die("input-fidelity must be one of low or high.")
+
+
+def _validate_model(model: str) -> None:
+    if not model.startswith(GPT_IMAGE_MODEL_PREFIX):
+        _die(
+            "model must be a GPT Image model (for example gpt-image-1.5, gpt-image-1, or gpt-image-1-mini)."
+        )
+
+
+def _validate_transparency(background: Optional[str], output_format: str) -> None:
+    if background == "transparent" and output_format not in {"png", "webp"}:
+        _die("transparent background requires output-format png or webp.")
+
+
+def _validate_model_specific_options(
+    *,
+    model: str,
+    background: Optional[str],
+    input_fidelity: Optional[str] = None,
+) -> None:
+    if model != GPT_IMAGE_2_MODEL:
+        return
+    if background == "transparent":
+        _die(
+            "transparent backgrounds are not supported in gpt-image-2, the latest model. "
+            "Use --model gpt-image-1.5 --background transparent --output-format png instead."
+        )
+    if input_fidelity is not None:
+        _die(
+            "input_fidelity is not supported in gpt-image-2 because image inputs always use high fidelity for this model."
+        )
+
+
+def _validate_generate_payload(payload: Dict[str, Any]) -> None:
+    model = str(payload.get("model", DEFAULT_MODEL))
+    _validate_model(model)
+    n = int(payload.get("n", 1))
+    if n < 1 or n > 10:
+        _die("n must be between 1 and 10")
+    size = str(payload.get("size", DEFAULT_SIZE))
+    quality = str(payload.get("quality", DEFAULT_QUALITY))
+    background = payload.get("background")
+    _validate_size(size, model)
+    _validate_quality(quality)
+    _validate_background(background)
+    _validate_model_specific_options(model=model, background=background)
+    oc = payload.get("output_compression")
+    if oc is not None and not (0 <= int(oc) <= 100):
+        _die("output_compression must be between 0 and 100")
+
+
+def _build_output_paths(
+    out: str,
+    output_format: str,
+    count: int,
+    out_dir: Optional[str],
+) -> List[Path]:
+    ext = "." + output_format
+
+    if out_dir:
+        out_base = Path(out_dir)
+        out_base.mkdir(parents=True, exist_ok=True)
+        return [out_base / f"image_{i}{ext}" for i in range(1, count + 1)]
+
+    out_path = Path(out)
+    if out_path.exists() and out_path.is_dir():
+        out_path.mkdir(parents=True, exist_ok=True)
+        return [out_path / f"image_{i}{ext}" for i in range(1, count + 1)]
+
+    if out_path.suffix == "":
+        out_path = out_path.with_suffix(ext)
+    elif output_format and out_path.suffix.lstrip(".").lower() != output_format:
+        _warn(
+            f"Output extension {out_path.suffix} does not match output-format {output_format}."
+        )
+
+    if count == 1:
+        return [out_path]
+
+    return [
+        out_path.with_name(f"{out_path.stem}-{i}{out_path.suffix}")
+        for i in range(1, count + 1)
+    ]
+
+
+def _augment_prompt(args: argparse.Namespace, prompt: str) -> str:
+    fields = _fields_from_args(args)
+    return _augment_prompt_fields(args.augment, prompt, fields)
+
+
+def _augment_prompt_fields(augment: bool, prompt: str, fields: Dict[str, Optional[str]]) -> str:
+    if not augment:
+        return prompt
+
+    sections: List[str] = []
+    if fields.get("use_case"):
+        sections.append(f"Use case: {fields['use_case']}")
+    sections.append(f"Primary request: {prompt}")
+    if fields.get("scene"):
+        sections.append(f"Scene/background: {fields['scene']}")
+    if fields.get("subject"):
+        sections.append(f"Subject: {fields['subject']}")
+    if fields.get("style"):
+        sections.append(f"Style/medium: {fields['style']}")
+    if fields.get("composition"):
+        sections.append(f"Composition/framing: {fields['composition']}")
+    if fields.get("lighting"):
+        sections.append(f"Lighting/mood: {fields['lighting']}")
+    if fields.get("palette"):
+        sections.append(f"Color palette: {fields['palette']}")
+    if fields.get("materials"):
+        sections.append(f"Materials/textures: {fields['materials']}")
+    if fields.get("text"):
+        sections.append(f"Text (verbatim): \"{fields['text']}\"")
+    if fields.get("constraints"):
+        sections.append(f"Constraints: {fields['constraints']}")
+    if fields.get("negative"):
+        sections.append(f"Avoid: {fields['negative']}")
+
+    return "\n".join(sections)
+
+
+def _fields_from_args(args: argparse.Namespace) -> Dict[str, Optional[str]]:
+    return {
+        "use_case": getattr(args, "use_case", None),
+        "scene": getattr(args, "scene", None),
+        "subject": getattr(args, "subject", None),
+        "style": getattr(args, "style", None),
+        "composition": getattr(args, "composition", None),
+        "lighting": getattr(args, "lighting", None),
+        "palette": getattr(args, "palette", None),
+        "materials": getattr(args, "materials", None),
+        "text": getattr(args, "text", None),
+        "constraints": getattr(args, "constraints", None),
+        "negative": getattr(args, "negative", None),
+    }
+
+
+def _print_request(payload: dict) -> None:
+    print(json.dumps(payload, indent=2, sort_keys=True))
+
+
+def _decode_and_write(images: List[str], outputs: List[Path], force: bool) -> None:
+    for idx, image_b64 in enumerate(images):
+        if idx >= len(outputs):
+            break
+        out_path = outputs[idx]
+        if out_path.exists() and not force:
+            _die(f"Output already exists: {out_path} (use --force to overwrite)")
+        out_path.parent.mkdir(parents=True, exist_ok=True)
+        out_path.write_bytes(base64.b64decode(image_b64))
+        print(f"Wrote {out_path}")
+
+
+def _derive_downscale_path(path: Path, suffix: str) -> Path:
+    if suffix and not suffix.startswith("-") and not suffix.startswith("_"):
+        suffix = "-" + suffix
+    return path.with_name(f"{path.stem}{suffix}{path.suffix}")
+
+
+def _downscale_image_bytes(image_bytes: bytes, *, max_dim: int, output_format: str) -> bytes:
+    try:
+        from PIL import Image
+    except Exception:
+        _die(f"Downscaling requires Pillow. {_dependency_hint('pillow')}")
+
+    if max_dim < 1:
+        _die("--downscale-max-dim must be >= 1")
+
+    with Image.open(BytesIO(image_bytes)) as img:
+        img.load()
+        w, h = img.size
+        scale = min(1.0, float(max_dim) / float(max(w, h)))
+        target = (max(1, int(round(w * scale))), max(1, int(round(h * scale))))
+
+        resized = img if target == (w, h) else img.resize(target, Image.Resampling.LANCZOS)
+
+        fmt = output_format.lower()
+        if fmt == "jpg":
+            fmt = "jpeg"
+
+        if fmt == "jpeg":
+            if resized.mode in ("RGBA", "LA") or ("transparency" in getattr(resized, "info", {})):
+                bg = Image.new("RGB", resized.size, (255, 255, 255))
+                bg.paste(resized.convert("RGBA"), mask=resized.convert("RGBA").split()[-1])
+                resized = bg
+            else:
+                resized = resized.convert("RGB")
+
+        out = BytesIO()
+        resized.save(out, format=fmt.upper())
+        return out.getvalue()
+
+
+def _decode_write_and_downscale(
+    images: List[str],
+    outputs: List[Path],
+    *,
+    force: bool,
+    downscale_max_dim: Optional[int],
+    downscale_suffix: str,
+    output_format: str,
+) -> None:
+    for idx, image_b64 in enumerate(images):
+        if idx >= len(outputs):
+            break
+        out_path = outputs[idx]
+        if out_path.exists() and not force:
+            _die(f"Output already exists: {out_path} (use --force to overwrite)")
+        out_path.parent.mkdir(parents=True, exist_ok=True)
+
+        raw = base64.b64decode(image_b64)
+        out_path.write_bytes(raw)
+        print(f"Wrote {out_path}")
+
+        if downscale_max_dim is None:
+            continue
+
+        derived = _derive_downscale_path(out_path, downscale_suffix)
+        if derived.exists() and not force:
+            _die(f"Output already exists: {derived} (use --force to overwrite)")
+        derived.parent.mkdir(parents=True, exist_ok=True)
+        resized = _downscale_image_bytes(raw, max_dim=downscale_max_dim, output_format=output_format)
+        derived.write_bytes(resized)
+        print(f"Wrote {derived}")
+
+
+def _create_client():
+    try:
+        from openai import OpenAI
+    except ImportError:
+        _die(f"openai SDK not installed in the active environment. {_dependency_hint('openai')}")
+    return OpenAI()
+
+
+def _create_async_client():
+    try:
+        from openai import AsyncOpenAI
+    except ImportError:
+        try:
+            import openai as _openai  # noqa: F401
+        except ImportError:
+            _die(
+                f"openai SDK not installed in the active environment. {_dependency_hint('openai')}"
+            )
+        _die(
+            "AsyncOpenAI not available in this openai SDK version. "
+            f"{_dependency_hint('openai', upgrade=True)}"
+        )
+    return AsyncOpenAI()
+
+
+def _slugify(value: str) -> str:
+    """Return a lowercase, hyphen-separated ASCII slug of at most 60 chars ("job" if empty)."""
+    # One pass collapses every non-alphanumeric run (hyphens included) into a single "-".
+    value = re.sub(r"[^a-z0-9]+", "-", value.strip().lower()).strip("-")
+    return value[:60].rstrip("-") if value else "job"  # truncation may expose a trailing "-"
+
+
+def _normalize_job(job: Any, idx: int) -> Dict[str, Any]:
+    if isinstance(job, str):
+        prompt = job.strip()
+        if not prompt:
+            _die(f"Empty prompt at job {idx}")
+        return {"prompt": prompt}
+    if isinstance(job, dict):
+        if "prompt" not in job or not str(job["prompt"]).strip():
+            _die(f"Missing prompt for job {idx}")
+        return job
+    _die(f"Invalid job at index {idx}: expected string or object.")
+    return {}  # unreachable
+
+
+def _read_jobs_jsonl(path: str) -> List[Dict[str, Any]]:
+    p = Path(path)
+    if not p.exists():
+        _die(f"Input file not found: {p}")
+    jobs: List[Dict[str, Any]] = []
+    for line_no, raw in enumerate(p.read_text(encoding="utf-8").splitlines(), start=1):
+        line = raw.strip()
+        if not line or line.startswith("#"):
+            continue
+        try:
+            item: Any
+            if line.startswith("{"):
+                item = json.loads(line)
+            else:
+                item = line
+            jobs.append(_normalize_job(item, idx=line_no))
+        except json.JSONDecodeError as exc:
+            _die(f"Invalid JSON on line {line_no}: {exc}")
+    if not jobs:
+        _die("No jobs found in input file.")
+    if len(jobs) > MAX_BATCH_JOBS:
+        _die(f"Too many jobs ({len(jobs)}). Max is {MAX_BATCH_JOBS}.")
+    return jobs
+
+
+def _merge_non_null(dst: Dict[str, Any], src: Dict[str, Any]) -> Dict[str, Any]:
+    merged = dict(dst)
+    for k, v in src.items():
+        if v is not None:
+            merged[k] = v
+    return merged
+
+
+def _job_output_paths(
+    *,
+    out_dir: Path,
+    output_format: str,
+    idx: int,
+    prompt: str,
+    n: int,
+    explicit_out: Optional[str],
+) -> List[Path]:
+    out_dir.mkdir(parents=True, exist_ok=True)
+    ext = "." + output_format
+
+    if explicit_out:
+        base = Path(explicit_out)
+        if base.suffix == "":
+            base = base.with_suffix(ext)
+        elif base.suffix.lstrip(".").lower() != output_format:
+            _warn(
+                f"Job {idx}: output extension {base.suffix} does not match output-format {output_format}."
+            )
+        base = out_dir / base.name
+    else:
+        slug = _slugify(prompt[:80])
+        base = out_dir / f"{idx:03d}-{slug}{ext}"
+
+    if n == 1:
+        return [base]
+    return [
+        base.with_name(f"{base.stem}-{i}{base.suffix}")
+        for i in range(1, n + 1)
+    ]
+
+
+def _extract_retry_after_seconds(exc: Exception) -> Optional[float]:
+    """Return the server-suggested retry delay in seconds, or None if unknown.
+
+    Best-effort, since openai SDK errors vary by version: a non-negative numeric
+    `retry_after`/`retry_after_seconds` attribute wins, else the message is parsed.
+    """
+    for attr in ("retry_after", "retry_after_seconds"):
+        val = getattr(exc, attr, None)
+        if isinstance(val, (int, float)) and val >= 0:
+            return float(val)
+    # `\.` (not `\\.`) so fractional values like "retry after 1.5" are captured whole.
+    m = re.search(r"retry[- ]after[:= ]+([0-9]+(?:\.[0-9]+)?)", str(exc), re.IGNORECASE)
+    # The capture group only admits digits with an optional fraction, so float() cannot fail.
+    return float(m.group(1)) if m else None
+
+
+def _is_rate_limit_error(exc: Exception) -> bool:
+    name = exc.__class__.__name__.lower()
+    if "ratelimit" in name or "rate_limit" in name:
+        return True
+    msg = str(exc).lower()
+    return "429" in msg or "rate limit" in msg or "too many requests" in msg
+
+
+def _is_transient_error(exc: Exception) -> bool:
+    if _is_rate_limit_error(exc):
+        return True
+    name = exc.__class__.__name__.lower()
+    if "timeout" in name or "timedout" in name or "tempor" in name:
+        return True
+    msg = str(exc).lower()
+    return "timeout" in msg or "timed out" in msg or "connection reset" in msg
+
+
+async def _generate_one_with_retries(
+    client: Any,
+    payload: Dict[str, Any],
+    *,
+    attempts: int,
+    job_label: str,
+) -> Any:
+    last_exc: Optional[Exception] = None
+    for attempt in range(1, attempts + 1):
+        try:
+            return await client.images.generate(**payload)
+        except Exception as exc:
+            last_exc = exc
+            if not _is_transient_error(exc):
+                raise
+            if attempt == attempts:
+                raise
+            sleep_s = _extract_retry_after_seconds(exc)
+            if sleep_s is None:
+                sleep_s = min(60.0, 2.0**attempt)
+            print(
+                f"{job_label} attempt {attempt}/{attempts} failed ({exc.__class__.__name__}); retrying in {sleep_s:.1f}s",
+                file=sys.stderr,
+            )
+            await asyncio.sleep(sleep_s)
+    raise last_exc or RuntimeError("unknown error")
+
+
+async def _run_generate_batch(args: argparse.Namespace) -> int:
+    jobs = _read_jobs_jsonl(args.input)
+    out_dir = Path(args.out_dir)
+
+    base_fields = _fields_from_args(args)
+    base_payload = {
+        "model": args.model,
+        "n": args.n,
+        "size": args.size,
+        "quality": args.quality,
+        "background": args.background,
+        "output_format": args.output_format,
+        "output_compression": args.output_compression,
+        "moderation": args.moderation,
+    }
+
+    if args.dry_run:
+        for i, job in enumerate(jobs, start=1):
+            prompt = str(job["prompt"]).strip()
+            fields = _merge_non_null(base_fields, job.get("fields", {}))
+            # Allow flat job keys as well (use_case, scene, etc.)
+            fields = _merge_non_null(fields, {k: job.get(k) for k in base_fields.keys()})
+            augmented = _augment_prompt_fields(args.augment, prompt, fields)
+
+            job_payload = dict(base_payload)
+            job_payload["prompt"] = augmented
+            job_payload = _merge_non_null(job_payload, {k: job.get(k) for k in base_payload.keys()})
+            job_payload = {k: v for k, v in job_payload.items() if v is not None}
+
+            _validate_generate_payload(job_payload)
+            effective_output_format = _normalize_output_format(job_payload.get("output_format"))
+            _validate_transparency(job_payload.get("background"), effective_output_format)
+            job_payload["output_format"] = effective_output_format
+
+            n = int(job_payload.get("n", 1))
+            outputs = _job_output_paths(
+                out_dir=out_dir,
+                output_format=effective_output_format,
+                idx=i,
+                prompt=prompt,
+                n=n,
+                explicit_out=job.get("out"),
+            )
+            downscaled = None
+            if args.downscale_max_dim is not None:
+                downscaled = [
+                    str(_derive_downscale_path(p, args.downscale_suffix)) for p in outputs
+                ]
+            _print_request(
+                {
+                    "endpoint": "/v1/images/generations",
+                    "job": i,
+                    "outputs": [str(p) for p in outputs],
+                    "outputs_downscaled": downscaled,
+                    **job_payload,
+                }
+            )
+        return 0
+
+    client = _create_async_client()
+    sem = asyncio.Semaphore(args.concurrency)
+
+    any_failed = False
+
+    async def run_job(i: int, job: Dict[str, Any]) -> Tuple[int, Optional[str]]:
+        nonlocal any_failed
+        prompt = str(job["prompt"]).strip()
+        job_label = f"[job {i}/{len(jobs)}]"
+
+        fields = _merge_non_null(base_fields, job.get("fields", {}))
+        fields = _merge_non_null(fields, {k: job.get(k) for k in base_fields.keys()})
+        augmented = _augment_prompt_fields(args.augment, prompt, fields)
+
+        payload = dict(base_payload)
+        payload["prompt"] = augmented
+        payload = _merge_non_null(payload, {k: job.get(k) for k in base_payload.keys()})
+        payload = {k: v for k, v in payload.items() if v is not None}
+
+        n = int(payload.get("n", 1))
+        _validate_generate_payload(payload)
+        effective_output_format = _normalize_output_format(payload.get("output_format"))
+        _validate_transparency(payload.get("background"), effective_output_format)
+        payload["output_format"] = effective_output_format
+        outputs = _job_output_paths(
+            out_dir=out_dir,
+            output_format=effective_output_format,
+            idx=i,
+            prompt=prompt,
+            n=n,
+            explicit_out=job.get("out"),
+        )
+        try:
+            async with sem:
+                print(f"{job_label} starting", file=sys.stderr)
+                started = time.time()
+                result = await _generate_one_with_retries(
+                    client,
+                    payload,
+                    attempts=args.max_attempts,
+                    job_label=job_label,
+                )
+                elapsed = time.time() - started
+                print(f"{job_label} completed in {elapsed:.1f}s", file=sys.stderr)
+            images = [item.b64_json for item in result.data]
+            _decode_write_and_downscale(
+                images,
+                outputs,
+                force=args.force,
+                downscale_max_dim=args.downscale_max_dim,
+                downscale_suffix=args.downscale_suffix,
+                output_format=effective_output_format,
+            )
+            return i, None
+        except Exception as exc:
+            any_failed = True
+            print(f"{job_label} failed: {exc}", file=sys.stderr)
+            if args.fail_fast:
+                raise
+            return i, str(exc)
+
+    tasks = [asyncio.create_task(run_job(i, job)) for i, job in enumerate(jobs, start=1)]
+
+    try:
+        await asyncio.gather(*tasks)
+    except Exception:
+        for t in tasks:
+            if not t.done():
+                t.cancel()
+        raise
+
+    return 1 if any_failed else 0
+
+
+def _generate_batch(args: argparse.Namespace) -> None:
+    exit_code = asyncio.run(_run_generate_batch(args))
+    if exit_code:
+        raise SystemExit(exit_code)
+
+
+def _generate(args: argparse.Namespace) -> None:
+    prompt = _read_prompt(args.prompt, args.prompt_file)
+    prompt = _augment_prompt(args, prompt)
+
+    payload = {
+        "model": args.model,
+        "prompt": prompt,
+        "n": args.n,
+        "size": args.size,
+        "quality": args.quality,
+        "background": args.background,
+        "output_format": args.output_format,
+        "output_compression": args.output_compression,
+        "moderation": args.moderation,
+    }
+    payload = {k: v for k, v in payload.items() if v is not None}
+
+    output_format = _normalize_output_format(args.output_format)
+    _validate_transparency(args.background, output_format)
+    payload["output_format"] = output_format
+    output_paths = _build_output_paths(args.out, output_format, args.n, args.out_dir)
+    downscaled = None
+    if args.downscale_max_dim is not None:
+        downscaled = [str(_derive_downscale_path(p, args.downscale_suffix)) for p in output_paths]
+
+    if args.dry_run:
+        _print_request(
+            {
+                "endpoint": "/v1/images/generations",
+                "outputs": [str(p) for p in output_paths],
+                "outputs_downscaled": downscaled,
+                **payload,
+            }
+        )
+        return
+
+    print(
+        "Calling Image API (generation). This can take up to a couple of minutes.",
+        file=sys.stderr,
+    )
+    started = time.time()
+    client = _create_client()
+    result = client.images.generate(**payload)
+    elapsed = time.time() - started
+    print(f"Generation completed in {elapsed:.1f}s.", file=sys.stderr)
+
+    images = [item.b64_json for item in result.data]
+    _decode_write_and_downscale(
+        images,
+        output_paths,
+        force=args.force,
+        downscale_max_dim=args.downscale_max_dim,
+        downscale_suffix=args.downscale_suffix,
+        output_format=output_format,
+    )
+
+
+def _edit(args: argparse.Namespace) -> None:
+    prompt = _read_prompt(args.prompt, args.prompt_file)
+    prompt = _augment_prompt(args, prompt)
+
+    image_paths = _check_image_paths(args.image)
+    mask_path = Path(args.mask) if args.mask else None
+    if mask_path:
+        if not mask_path.exists():
+            _die(f"Mask file not found: {mask_path}")
+        if mask_path.suffix.lower() != ".png":
+            _warn(f"Mask should be a PNG with an alpha channel: {mask_path}")
+        if mask_path.stat().st_size > MAX_IMAGE_BYTES:
+            _warn(f"Mask exceeds 50MB limit: {mask_path}")
+
+    payload = {
+        "model": args.model,
+        "prompt": prompt,
+        "n": args.n,
+        "size": args.size,
+        "quality": args.quality,
+        "background": args.background,
+        "output_format": args.output_format,
+        "output_compression": args.output_compression,
+        "input_fidelity": args.input_fidelity,
+        "moderation": args.moderation,
+    }
+    payload = {k: v for k, v in payload.items() if v is not None}
+
+    output_format = _normalize_output_format(args.output_format)
+    _validate_transparency(args.background, output_format)
+    payload["output_format"] = output_format
+    _validate_input_fidelity(args.input_fidelity)
+    output_paths = _build_output_paths(args.out, output_format, args.n, args.out_dir)
+    downscaled = None
+    if args.downscale_max_dim is not None:
+        downscaled = [str(_derive_downscale_path(p, args.downscale_suffix)) for p in output_paths]
+
+    if args.dry_run:
+        payload_preview = dict(payload)
+        payload_preview["image"] = [str(p) for p in image_paths]
+        if mask_path:
+            payload_preview["mask"] = str(mask_path)
+        _print_request(
+            {
+                "endpoint": "/v1/images/edits",
+                "outputs": [str(p) for p in output_paths],
+                "outputs_downscaled": downscaled,
+                **payload_preview,
+            }
+        )
+        return
+
+    print(
+        f"Calling Image API (edit) with {len(image_paths)} image(s).",
+        file=sys.stderr,
+    )
+    started = time.time()
+    client = _create_client()
+
+    with _open_files(image_paths) as image_files, _open_mask(mask_path) as mask_file:
+        request = dict(payload)
+        request["image"] = image_files if len(image_files) > 1 else image_files[0]
+        if mask_file is not None:
+            request["mask"] = mask_file
+        result = client.images.edit(**request)
+
+    elapsed = time.time() - started
+    print(f"Edit completed in {elapsed:.1f}s.", file=sys.stderr)
+    images = [item.b64_json for item in result.data]
+    _decode_write_and_downscale(
+        images,
+        output_paths,
+        force=args.force,
+        downscale_max_dim=args.downscale_max_dim,
+        downscale_suffix=args.downscale_suffix,
+        output_format=output_format,
+    )
+
+
+def _open_files(paths: List[Path]):
+    return _FileBundle(paths)
+
+
+def _open_mask(mask_path: Optional[Path]):
+    if mask_path is None:
+        return _NullContext()
+    return _SingleFile(mask_path)
+
+
+class _NullContext:
+    def __enter__(self):
+        return None
+
+    def __exit__(self, exc_type, exc, tb):
+        return False
+
+
+class _SingleFile:
+    def __init__(self, path: Path):
+        self._path = path
+        self._handle = None
+
+    def __enter__(self):
+        self._handle = self._path.open("rb")
+        return self._handle
+
+    def __exit__(self, exc_type, exc, tb):
+        if self._handle:
+            try:
+                self._handle.close()
+            except Exception:
+                pass
+        return False
+
+
+class _FileBundle:
+    def __init__(self, paths: List[Path]):
+        self._paths = paths
+        self._handles: List[object] = []
+
+    def __enter__(self):
+        self._handles = [p.open("rb") for p in self._paths]
+        return self._handles
+
+    def __exit__(self, exc_type, exc, tb):
+        for handle in self._handles:
+            try:
+                handle.close()
+            except Exception:
+                pass
+        return False
+
+
+def _add_shared_args(parser: argparse.ArgumentParser) -> None:
+    parser.add_argument("--model", default=DEFAULT_MODEL)
+    parser.add_argument("--prompt")
+    parser.add_argument("--prompt-file")
+    parser.add_argument("--n", type=int, default=1)
+    parser.add_argument("--size", default=DEFAULT_SIZE)
+    parser.add_argument("--quality", default=DEFAULT_QUALITY)
+    parser.add_argument("--background")
+    parser.add_argument("--output-format")
+    parser.add_argument("--output-compression", type=int)
+    parser.add_argument("--moderation")
+    parser.add_argument("--out", default=DEFAULT_OUTPUT_PATH)
+    parser.add_argument("--out-dir")
+    parser.add_argument("--force", action="store_true")
+    parser.add_argument("--dry-run", action="store_true")
+    parser.add_argument("--augment", dest="augment", action="store_true")
+    parser.add_argument("--no-augment", dest="augment", action="store_false")
+    parser.set_defaults(augment=True)
+
+    # Prompt augmentation hints
+    parser.add_argument("--use-case")
+    parser.add_argument("--scene")
+    parser.add_argument("--subject")
+    parser.add_argument("--style")
+    parser.add_argument("--composition")
+    parser.add_argument("--lighting")
+    parser.add_argument("--palette")
+    parser.add_argument("--materials")
+    parser.add_argument("--text")
+    parser.add_argument("--constraints")
+    parser.add_argument("--negative")
+
+    # Post-processing (optional): generate an additional downscaled copy for fast web loading.
+    parser.add_argument("--downscale-max-dim", type=int)
+    parser.add_argument("--downscale-suffix", default=DEFAULT_DOWNSCALE_SUFFIX)
+
+
+def main() -> int:
+    parser = argparse.ArgumentParser(
+        description="Fallback CLI for explicit image generation or editing via GPT Image models"
+    )
+    subparsers = parser.add_subparsers(dest="command", required=True)
+
+    gen_parser = subparsers.add_parser("generate", help="Create a new image")
+    _add_shared_args(gen_parser)
+    gen_parser.set_defaults(func=_generate)
+
+    batch_parser = subparsers.add_parser(
+        "generate-batch",
+        help="Generate multiple prompts concurrently (JSONL input)",
+    )
+    _add_shared_args(batch_parser)
+    batch_parser.add_argument("--input", required=True, help="Path to JSONL file (one job per line)")
+    batch_parser.add_argument("--concurrency", type=int, default=DEFAULT_CONCURRENCY)
+    batch_parser.add_argument("--max-attempts", type=int, default=3)
+    batch_parser.add_argument("--fail-fast", action="store_true")
+    batch_parser.set_defaults(func=_generate_batch)
+
+    edit_parser = subparsers.add_parser("edit", help="Edit an existing image")
+    _add_shared_args(edit_parser)
+    edit_parser.add_argument("--image", action="append", required=True)
+    edit_parser.add_argument("--mask")
+    edit_parser.add_argument("--input-fidelity")
+    edit_parser.set_defaults(func=_edit)
+
+    args = parser.parse_args()
+    if args.n < 1 or args.n > 10:
+        _die("--n must be between 1 and 10")
+    if getattr(args, "concurrency", 1) < 1 or getattr(args, "concurrency", 1) > 25:
+        _die("--concurrency must be between 1 and 25")
+    if getattr(args, "max_attempts", 3) < 1 or getattr(args, "max_attempts", 3) > 10:
+        _die("--max-attempts must be between 1 and 10")
+    if args.output_compression is not None and not (0 <= args.output_compression <= 100):
+        _die("--output-compression must be between 0 and 100")
+    if args.command == "generate-batch" and not args.out_dir:
+        _die("generate-batch requires --out-dir")
+    if getattr(args, "downscale_max_dim", None) is not None and args.downscale_max_dim < 1:
+        _die("--downscale-max-dim must be >= 1")
+
+    _validate_model(args.model)
+    _validate_size(args.size, args.model)
+    _validate_quality(args.quality)
+    _validate_background(args.background)
+    _validate_model_specific_options(
+        model=args.model,
+        background=args.background,
+        input_fidelity=getattr(args, "input_fidelity", None),
+    )
+    _ensure_api_key(args.dry_run)
+
+    args.func(args)
+    return 0
+
+
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/skills/imagegen/scripts/remove_chroma_key.py b/skills/imagegen/scripts/remove_chroma_key.py
new file mode 100644
index 0000000..5053987
--- /dev/null
+++ b/skills/imagegen/scripts/remove_chroma_key.py
@@ -0,0 +1,440 @@
+#!/usr/bin/env python3
+"""Remove a solid chroma-key background from an image.
+
+This helper supports the imagegen skill's built-in-first transparent workflow:
+generate an image on a flat key color, then convert that key color to alpha.
+"""
+
+from __future__ import annotations
+
+import argparse
+from io import BytesIO
+from pathlib import Path
+import re
+from statistics import median
+import sys
+from typing import Tuple
+
+
+Color = Tuple[int, int, int]
+KEY_DOMINANCE_THRESHOLD = 16.0
+ALPHA_NOISE_FLOOR = 8
+
+
+def _die(message: str, code: int = 1) -> None:
+    print(f"Error: {message}", file=sys.stderr)
+    raise SystemExit(code)
+
+
+def _dependency_hint(package: str) -> str:
+    return (
+        "Activate the repo-selected environment first, then install it with "
+        f"`uv pip install {package}`. If this repo uses a local virtualenv, start with "
+        "`source .venv/bin/activate`; otherwise use this repo's configured shared fallback "
+        "environment."
+    )
+
+
+def _load_pillow():
+    try:
+        from PIL import Image, ImageFilter
+    except ImportError:
+        _die(f"Pillow is required for chroma-key removal. {_dependency_hint('pillow')}")
+    return Image, ImageFilter
+
+
+def _parse_key_color(raw: str) -> Color:
+    value = raw.strip()
+    match = re.fullmatch(r"#?([0-9a-fA-F]{6})", value)
+    if not match:
+        _die("key color must be a hex RGB value like #00ff00.")
+    hex_value = match.group(1)
+    return (
+        int(hex_value[0:2], 16),
+        int(hex_value[2:4], 16),
+        int(hex_value[4:6], 16),
+    )
+
+
+def _validate_args(args: argparse.Namespace) -> None:
+    if args.tolerance < 0 or args.tolerance > 255:
+        _die("--tolerance must be between 0 and 255.")
+    if args.transparent_threshold < 0 or args.transparent_threshold > 255:
+        _die("--transparent-threshold must be between 0 and 255.")
+    if args.opaque_threshold < 0 or args.opaque_threshold > 255:
+        _die("--opaque-threshold must be between 0 and 255.")
+    if args.soft_matte and args.transparent_threshold >= args.opaque_threshold:
+        _die("--transparent-threshold must be lower than --opaque-threshold.")
+    if args.edge_feather < 0 or args.edge_feather > 64:
+        _die("--edge-feather must be between 0 and 64.")
+    if args.edge_contract < 0 or args.edge_contract > 16:
+        _die("--edge-contract must be between 0 and 16.")
+
+    src = Path(args.input)
+    if not src.exists():
+        _die(f"Input image not found: {src}")
+
+    out = Path(args.out)
+    if out.exists() and not args.force:
+        _die(f"Output already exists: {out} (use --force to overwrite)")
+
+    if out.suffix.lower() not in {".png", ".webp"}:
+        _die("--out must end in .png or .webp so the alpha channel is preserved.")
+
+
+def _channel_distance(a: Color, b: Color) -> int:
+    return max(abs(a[0] - b[0]), abs(a[1] - b[1]), abs(a[2] - b[2]))
+
+
+def _clamp_channel(value: float) -> int:
+    return max(0, min(255, int(round(value))))
+
+
+def _smoothstep(value: float) -> float:
+    value = max(0.0, min(1.0, value))
+    return value * value * (3.0 - 2.0 * value)
+
+
+def _soft_alpha(distance: int, transparent_threshold: float, opaque_threshold: float) -> int:
+    if distance <= transparent_threshold:
+        return 0
+    if distance >= opaque_threshold:
+        return 255
+    ratio = (float(distance) - transparent_threshold) / (
+        opaque_threshold - transparent_threshold
+    )
+    return _clamp_channel(255.0 * _smoothstep(ratio))
+
+
+def _dominance_alpha(rgb: Color, key: Color) -> int:
+    spill_channels = _spill_channels(key)
+    if not spill_channels:
+        return 255
+
+    channels = [float(value) for value in rgb]
+    non_spill = [idx for idx in range(3) if idx not in spill_channels]
+    key_strength = (
+        min(channels[idx] for idx in spill_channels)
+        if len(spill_channels) > 1
+        else channels[spill_channels[0]]
+    )
+    non_key_strength = max((channels[idx] for idx in non_spill), default=0.0)
+    dominance = key_strength - non_key_strength
+    if dominance <= 0:
+        return 255
+
+    denominator = max(1.0, float(max(key)) - non_key_strength)
+    alpha = 1.0 - min(1.0, dominance / denominator)
+    return _clamp_channel(alpha * 255.0)
+
+
+def _spill_channels(key: Color) -> list[int]:
+    key_max = max(key)
+    if key_max < 128:
+        return []
+    return [idx for idx, value in enumerate(key) if value >= key_max - 16 and value >= 128]
+
+
+def _key_channel_dominance(rgb: Color, key: Color) -> float:
+    spill_channels = _spill_channels(key)
+    if not spill_channels:
+        return 0.0
+
+    channels = [float(value) for value in rgb]
+    non_spill = [idx for idx in range(3) if idx not in spill_channels]
+    key_strength = (
+        min(channels[idx] for idx in spill_channels)
+        if len(spill_channels) > 1
+        else channels[spill_channels[0]]
+    )
+    non_key_strength = max((channels[idx] for idx in non_spill), default=0.0)
+    return key_strength - non_key_strength
+
+
+def _looks_key_colored(rgb: Color, key: Color, distance: int) -> bool:
+    if distance <= 32:
+        return True
+
+    spill_channels = _spill_channels(key)
+    if not spill_channels:
+        return True
+
+    return _key_channel_dominance(rgb, key) >= KEY_DOMINANCE_THRESHOLD
+
+
+def _cleanup_spill(rgb: Color, key: Color, alpha: int = 255) -> Color:
+    if alpha >= 252:
+        return rgb
+
+    spill_channels = _spill_channels(key)
+    if not spill_channels:
+        return rgb
+
+    channels = [float(value) for value in rgb]
+    non_spill = [idx for idx in range(3) if idx not in spill_channels]
+    if non_spill:
+        anchor = max(channels[idx] for idx in non_spill)
+        cap = max(0.0, anchor - 1.0)
+        for idx in spill_channels:
+            if channels[idx] > cap:
+                channels[idx] = cap
+
+    return (
+        _clamp_channel(channels[0]),
+        _clamp_channel(channels[1]),
+        _clamp_channel(channels[2]),
+    )
+
+
+def _apply_alpha_to_image(
+    image,
+    *,
+    key: Color,
+    tolerance: int,
+    spill_cleanup: bool,
+    soft_matte: bool,
+    transparent_threshold: float,
+    opaque_threshold: float,
+) -> int:
+    pixels = image.load()
+    width, height = image.size
+    transparent = 0
+
+    for y in range(height):
+        for x in range(width):
+            red, green, blue, alpha = pixels[x, y]
+            rgb = (red, green, blue)
+            distance = _channel_distance(rgb, key)
+            key_like = _looks_key_colored(rgb, key, distance)
+            output_alpha = (
+                min(
+                    _soft_alpha(distance, transparent_threshold, opaque_threshold),
+                    _dominance_alpha(rgb, key),
+                )
+                if soft_matte and key_like
+                else (0 if distance <= tolerance else 255)
+            )
+            output_alpha = int(round(output_alpha * (alpha / 255.0)))
+            if 0 < output_alpha <= ALPHA_NOISE_FLOOR:
+                output_alpha = 0
+
+            if output_alpha == 0:
+                pixels[x, y] = (0, 0, 0, 0)
+                transparent += 1
+                continue
+
+            if spill_cleanup and key_like:
+                red, green, blue = _cleanup_spill(rgb, key, output_alpha)
+            pixels[x, y] = (red, green, blue, output_alpha)
+
+    return transparent
+
+
+def _contract_alpha(image, pixels: int):
+    if pixels == 0:
+        return image
+
+    _, ImageFilter = _load_pillow()
+    alpha = image.getchannel("A")
+    for _ in range(pixels):
+        alpha = alpha.filter(ImageFilter.MinFilter(3))
+    image.putalpha(alpha)
+    return image
+
+
+def _apply_edge_feather(image, radius: float):
+    if radius == 0:
+        return image
+
+    _, ImageFilter = _load_pillow()
+    alpha = image.getchannel("A")
+    alpha = alpha.filter(ImageFilter.GaussianBlur(radius=radius))
+    image.putalpha(alpha)
+    return image
+
+
+def _encode_image(image, output_format: str) -> bytes:
+    out = BytesIO()
+    image.save(out, format=output_format.upper())
+    return out.getvalue()
+
+
+def _alpha_counts(image) -> tuple[int, int, int]:
+    pixels = image.load()
+    width, height = image.size
+    total = 0
+    transparent = 0
+    partial = 0
+
+    for y in range(height):
+        for x in range(width):
+            alpha = pixels[x, y][3]
+            total += 1
+            if alpha == 0:
+                transparent += 1
+            elif alpha < 255:
+                partial += 1
+
+    return total, transparent, partial
+
+
+def _sample_border_key(image, mode: str) -> Color:  # Estimate the key colour as the per-channel median of edge pixels.
+    width, height = image.size
+    pixels = image.load()
+    samples: list[Color] = []
+
+    if mode == "corners":  # sample four square patches, one per image corner
+        patch = max(1, min(width, height, 12))  # patch side: capped at 12 and at the shorter image side, minimum 1
+        boxes = [
+            (0, 0, patch, patch),  # (left, top, right, bottom) anchored at x=0, y=0
+            (width - patch, 0, width, patch),  # anchored at the maximum x, y=0
+            (0, height - patch, patch, height),  # anchored at x=0, maximum y
+            (width - patch, height - patch, width, height),  # anchored at maximum x and maximum y
+        ]
+        for left, top, right, bottom in boxes:
+            for y in range(top, bottom):
+                for x in range(left, right):
+                    red, green, blue = pixels[x, y][:3]  # keep the first three channels only
+                    samples.append((red, green, blue))
+    else:  # every other mode value samples bands along all four edges
+        band = max(1, min(width, height, 6))  # band thickness: capped at 6 and at the shorter image side, minimum 1
+        step = max(1, min(width, height) // 256)  # stride along each edge; exceeds 1 once the shorter side reaches 512
+        for x in range(0, width, step):
+            for y in range(band):
+                red, green, blue = pixels[x, y][:3]  # band starting at y=0
+                samples.append((red, green, blue))
+                red, green, blue = pixels[x, height - 1 - y][:3]  # band ending at y=height-1
+                samples.append((red, green, blue))
+        for y in range(0, height, step):
+            for x in range(band):
+                red, green, blue = pixels[x, y][:3]  # band starting at x=0
+                samples.append((red, green, blue))
+                red, green, blue = pixels[width - 1 - x, y][:3]  # band ending at x=width-1
+                samples.append((red, green, blue))
+
+    if not samples:  # only possible when none of the loops above ran, e.g. a zero-sized image
+        _die("Could not sample background key color from image border.")  # presumably aborts; _die is defined outside this view
+
+    return (
+        int(round(median(sample[0] for sample in samples))),  # median of first channel (named red above)
+        int(round(median(sample[1] for sample in samples))),  # median of second channel (green)
+        int(round(median(sample[2] for sample in samples))),  # median of third channel (blue)
+    )
+
+
+def _remove_chroma_key(args: argparse.Namespace) -> None:  # Key out the background of args.input and write the result to args.out.
+    Image, _ = _load_pillow()  # only the first item of the returned pair is needed here
+    src = Path(args.input)
+    out = Path(args.out)
+
+    with Image.open(src) as image:
+        rgba = image.convert("RGBA")  # the converted image is kept and used after the with-block exits
+    key = (
+        _sample_border_key(rgba, args.auto_key)  # key colour sampled from the image itself
+        if args.auto_key != "none"
+        else _parse_key_color(args.key_color)  # otherwise the --key-color value is parsed
+    )
+
+    transparent = _apply_alpha_to_image(  # result is only used for the zero-match warning at the end
+        rgba,
+        key=key,
+        tolerance=args.tolerance,
+        spill_cleanup=args.spill_cleanup,
+        soft_matte=args.soft_matte,
+        transparent_threshold=args.transparent_threshold,
+        opaque_threshold=args.opaque_threshold,
+    )
+    rgba = _contract_alpha(rgba, args.edge_contract)  # contraction runs before feathering
+    rgba = _apply_edge_feather(rgba, args.edge_feather)
+
+    total, transparent_after, partial_after = _alpha_counts(rgba)  # counted after contraction and feathering
+
+    out.parent.mkdir(parents=True, exist_ok=True)  # create missing output directories
+    output_format = "PNG" if out.suffix.lower() == ".png" else "WEBP"  # any suffix other than .png is encoded as WEBP
+    out.write_bytes(_encode_image(rgba, output_format))
+
+    print(f"Wrote {out}")
+    print(f"Key color: #{key[0]:02x}{key[1]:02x}{key[2]:02x}")
+    print(f"Transparent pixels: {transparent_after}/{total}")
+    print(f"Partially transparent pixels: {partial_after}/{total}")
+    if transparent == 0:  # checks the keying-pass result, not transparent_after
+        print("Warning: no pixels matched the key color before feathering.", file=sys.stderr)
+
+
+def _build_parser() -> argparse.ArgumentParser:  # Build the command-line parser for the chroma-key removal tool.
+    parser = argparse.ArgumentParser(
+        description="Remove a solid chroma-key background and write an image with alpha."
+    )
+    parser.add_argument("--input", required=True, help="Input image path.")
+    parser.add_argument("--out", required=True, help="Output .png or .webp path.")
+    parser.add_argument(
+        "--key-color",
+        default="#00ff00",
+        help="Hex RGB key color to remove, for example #00ff00.",
+    )
+    parser.add_argument(
+        "--tolerance",
+        type=int,
+        default=12,
+        help="Hard-key per-channel tolerance for matching the key color, 0-255.",
+    )
+    parser.add_argument(
+        "--auto-key",
+        choices=["none", "corners", "border"],
+        default="none",  # "none" means the --key-color value is used instead of sampling
+        help="Sample the key color from image corners or border instead of --key-color.",
+    )
+    parser.add_argument(
+        "--soft-matte",
+        action="store_true",
+        help="Use a smooth alpha ramp between transparent and opaque thresholds.",
+    )
+    parser.add_argument(
+        "--transparent-threshold",
+        type=float,
+        default=12.0,
+        help="Soft-matte distance at or below which pixels become fully transparent.",
+    )
+    parser.add_argument(
+        "--opaque-threshold",
+        type=float,
+        default=96.0,
+        help="Soft-matte distance at or above which pixels become fully opaque.",
+    )
+    parser.add_argument(
+        "--edge-feather",
+        type=float,
+        default=0.0,  # 0 disables feathering
+        help="Optional alpha blur radius for softened edges, 0-64.",
+    )
+    parser.add_argument(
+        "--edge-contract",
+        type=int,
+        default=0,  # 0 disables contraction
+        help="Shrink the visible alpha matte by this many pixels before feathering.",
+    )
+    parser.add_argument(
+        "--spill-cleanup",
+        dest="spill_cleanup",
+        action="store_true",
+        help="Reduce obvious key-color spill on opaque pixels.",
+    )
+    parser.add_argument(
+        "--despill",
+        dest="spill_cleanup",  # same dest as --spill-cleanup, so either flag sets args.spill_cleanup
+        action="store_true",
+        help="Alias for --spill-cleanup; decontaminate key-color edge spill.",
+    )
+    parser.add_argument("--force", action="store_true", help="Overwrite an existing output file.")  # NOTE(review): not read in the visible code; presumably checked in _validate_args - confirm
+    return parser
+
+
+def main() -> None:  # CLI entry point: parse arguments, validate them, then run the key removal.
+    parser = _build_parser()
+    args = parser.parse_args()  # reads the process command line
+    _validate_args(args)  # defined outside this view; runs before any image work starts
+    _remove_chroma_key(args)
+
+
+if __name__ == "__main__":  # run the CLI only when executed as a script, not when imported
+    main()
diff --git a/skills/openai-docs/LICENSE.txt b/skills/openai-docs/LICENSE.txt
new file mode 100644
index 0000000..13e25df
--- /dev/null
+++ b/skills/openai-docs/LICENSE.txt
@@ -0,0 +1,201 @@
+Apache License
+Version 2.0, January 2004
+http://www.apache.org/licenses/
+
+TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+1. Definitions.
+
+   "License" shall mean the terms and conditions for use, reproduction,
+   and distribution as defined by Sections 1 through 9 of this document.
+
+   "Licensor" shall mean the copyright owner or entity authorized by
+   the copyright owner that is granting the License.
+
+   "Legal Entity" shall mean the union of the acting entity and all
+   other entities that control, are controlled by, or are under common
+   control with that entity. For the purposes of this definition,
+   "control" means (i) the power, direct or indirect, to cause the
+   direction or management of such entity, whether by contract or
+   otherwise, or (ii) ownership of fifty percent (50%) or more of the
+   outstanding shares, or (iii) beneficial ownership of such entity.
+
+   "You" (or "Your") shall mean an individual or Legal Entity
+   exercising permissions granted by this License.
+
+   "Source" form shall mean the preferred form for making modifications,
+   including but not limited to software source code, documentation
+   source, and configuration files.
+
+   "Object" form shall mean any form resulting from mechanical
+   transformation or translation of a Source form, including but
+   not limited to compiled object code, generated documentation,
+   and conversions to other media types.
+
+   "Work" shall mean the work of authorship, whether in Source or
+   Object form, made available under the License, as indicated by a
+   copyright notice that is included in or attached to the work
+   (an example is provided in the Appendix below).
+
+   "Derivative Works" shall mean any work, whether in Source or Object
+   form, that is based on (or derived from) the Work and for which the
+   editorial revisions, annotations, elaborations, or other modifications
+   represent, as a whole, an original work of authorship. For the purposes
+   of this License, Derivative Works shall not include works that remain
+   separable from, or merely link (or bind by name) to the interfaces of,
+   the Work and Derivative Works thereof.
+
+   "Contribution" shall mean any work of authorship, including
+   the original version of the Work and any modifications or additions
+   to that Work or Derivative Works thereof, that is intentionally
+   submitted to Licensor for inclusion in the Work by the copyright owner
+   or by an individual or Legal Entity authorized to submit on behalf of
+   the copyright owner. For the purposes of this definition, "submitted"
+   means any form of electronic, verbal, or written communication sent
+   to the Licensor or its representatives, including but not limited to
+   communication on electronic mailing lists, source code control systems,
+   and issue tracking systems that are managed by, or on behalf of, the
+   Licensor for the purpose of discussing and improving the Work, but
+   excluding communication that is conspicuously marked or otherwise
+   designated in writing by the copyright owner as "Not a Contribution."
+
+   "Contributor" shall mean Licensor and any individual or Legal Entity
+   on behalf of whom a Contribution has been received by Licensor and
+   subsequently incorporated within the Work.
+
+2. Grant of Copyright License. Subject to the terms and conditions of
+   this License, each Contributor hereby grants to You a perpetual,
+   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+   copyright license to reproduce, prepare Derivative Works of,
+   publicly display, publicly perform, sublicense, and distribute the
+   Work and such Derivative Works in Source or Object form.
+
+3. Grant of Patent License. Subject to the terms and conditions of
+   this License, each Contributor hereby grants to You a perpetual,
+   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+   (except as stated in this section) patent license to make, have made,
+   use, offer to sell, sell, import, and otherwise transfer the Work,
+   where such license applies only to those patent claims licensable
+   by such Contributor that are necessarily infringed by their
+   Contribution(s) alone or by combination of their Contribution(s)
+   with the Work to which such Contribution(s) was submitted. If You
+   institute patent litigation against any entity (including a
+   cross-claim or counterclaim in a lawsuit) alleging that the Work
+   or a Contribution incorporated within the Work constitutes direct
+   or contributory patent infringement, then any patent licenses
+   granted to You under this License for that Work shall terminate
+   as of the date such litigation is filed.
+
+4. Redistribution. You may reproduce and distribute copies of the
+   Work or Derivative Works thereof in any medium, with or without
+   modifications, and in Source or Object form, provided that You
+   meet the following conditions:
+
+   (a) You must give any other recipients of the Work or
+       Derivative Works a copy of this License; and
+
+   (b) You must cause any modified files to carry prominent notices
+       stating that You changed the files; and
+
+   (c) You must retain, in the Source form of any Derivative Works
+       that You distribute, all copyright, patent, trademark, and
+       attribution notices from the Source form of the Work,
+       excluding those notices that do not pertain to any part of
+       the Derivative Works; and
+
+   (d) If the Work includes a "NOTICE" text file as part of its
+       distribution, then any Derivative Works that You distribute must
+       include a readable copy of the attribution notices contained
+       within such NOTICE file, excluding those notices that do not
+       pertain to any part of the Derivative Works, in at least one
+       of the following places: within a NOTICE text file distributed
+       as part of the Derivative Works; within the Source form or
+       documentation, if provided along with the Derivative Works; or,
+       within a display generated by the Derivative Works, if and
+       wherever such third-party notices normally appear. The contents
+       of the NOTICE file are for informational purposes only and
+       do not modify the License. You may add Your own attribution
+       notices within Derivative Works that You distribute, alongside
+       or as an addendum to the NOTICE text from the Work, provided
+       that such additional attribution notices cannot be construed
+       as modifying the License.
+
+   You may add Your own copyright statement to Your modifications and
+   may provide additional or different license terms and conditions
+   for use, reproduction, or distribution of Your modifications, or
+   for any such Derivative Works as a whole, provided Your use,
+   reproduction, and distribution of the Work otherwise complies with
+   the conditions stated in this License.
+
+5. Submission of Contributions. Unless You explicitly state otherwise,
+   any Contribution intentionally submitted for inclusion in the Work
+   by You to the Licensor shall be under the terms and conditions of
+   this License, without any additional terms or conditions.
+   Notwithstanding the above, nothing herein shall supersede or modify
+   the terms of any separate license agreement you may have executed
+   with Licensor regarding such Contributions.
+
+6. Trademarks. This License does not grant permission to use the trade
+   names, trademarks, service marks, or product names of the Licensor,
+   except as required for reasonable and customary use in describing the
+   origin of the Work and reproducing the content of the NOTICE file.
+
+7. Disclaimer of Warranty. Unless required by applicable law or
+   agreed to in writing, Licensor provides the Work (and each
+   Contributor provides its Contributions) on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+   implied, including, without limitation, any warranties or conditions
+   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+   PARTICULAR PURPOSE. You are solely responsible for determining the
+   appropriateness of using or redistributing the Work and assume any
+   risks associated with Your exercise of permissions under this License.
+
+8. Limitation of Liability. In no event and under no legal theory,
+   whether in tort (including negligence), contract, or otherwise,
+   unless required by applicable law (such as deliberate and grossly
+   negligent acts) or agreed to in writing, shall any Contributor be
+   liable to You for damages, including any direct, indirect, special,
+   incidental, or consequential damages of any character arising as a
+   result of this License or out of the use or inability to use the
+   Work (including but not limited to damages for loss of goodwill,
+   work stoppage, computer failure or malfunction, or any and all
+   other commercial damages or losses), even if such Contributor
+   has been advised of the possibility of such damages.
+
+9. Accepting Warranty or Additional Liability. While redistributing
+   the Work or Derivative Works thereof, You may choose to offer,
+   and charge a fee for, acceptance of support, warranty, indemnity,
+   or other liability obligations and/or rights consistent with this
+   License. However, in accepting such obligations, You may act only
+   on Your own behalf and on Your sole responsibility, not on behalf of
+   any other Contributor, and only if You agree to indemnify,
+   defend, and hold each Contributor harmless for any liability
+   incurred by, or claims asserted against, such Contributor by reason
+   of your accepting any such warranty or additional liability.
+
+END OF TERMS AND CONDITIONS
+
+APPENDIX: How to apply the Apache License to your work.
+
+   To apply the Apache License to your work, attach the following
+   boilerplate notice, with the fields enclosed by brackets "[]"
+   replaced with your own identifying information. (Don't include
+   the brackets!)  The text should be enclosed in the appropriate
+   comment syntax for the file format. We also recommend that a
+   file or class name and description of purpose be included on the
+   same "printed page" as the copyright notice for easier
+   identification within third-party archives.
+
+Copyright [yyyy] [name of copyright owner]
+
+Licensed under the Apache License, Version 2.0 (the "License");
+you may not use this file except in compliance with the License.
+You may obtain a copy of the License at
+
+    http://www.apache.org/licenses/LICENSE-2.0
+
+Unless required by applicable law or agreed to in writing, software
+distributed under the License is distributed on an "AS IS" BASIS,
+WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+See the License for the specific language governing permissions and
+limitations under the License.
diff --git a/skills/openai-docs/SKILL.md b/skills/openai-docs/SKILL.md
new file mode 100644
index 0000000..30526bd
--- /dev/null
+++ b/skills/openai-docs/SKILL.md
@@ -0,0 +1,167 @@
+---
+name: "openai-docs"
+description: "Use when the user asks how to build with OpenAI products or APIs, asks about Codex itself or choosing Codex surfaces, needs up-to-date official documentation with citations, help choosing the latest model for a use case, or model upgrade and prompt-upgrade guidance; use OpenAI docs MCP tools for non-Codex docs questions, use the Codex manual helper first for broad Codex self-knowledge, and restrict fallback browsing to official OpenAI domains."
+---
+
+
+# OpenAI Docs
+
+Provide authoritative, current guidance from OpenAI developer docs using the developers.openai.com MCP server. "Docs MCP" means `mcp__openaiDeveloperDocs__search_openai_docs` and `mcp__openaiDeveloperDocs__fetch_openai_doc`; for API reference, schema, parameter, or required-field questions, also use `mcp__openaiDeveloperDocs__get_openapi_spec` when available. Official-domain web search is fallback after those tools are unavailable or unhelpful. Broad Codex questions use the manual helper before Docs MCP. This skill also owns model selection, API model migration, and prompt-upgrade guidance.
+
+## API Key Setup
+
+For requests to build, run, configure, debug, or implement an API-backed app, script, CLI, generator, or tool, use `openai-platform-api-key` first when available. After that credential gate is resolved, return here for current docs as needed.
+
+Use this skill directly for docs-only questions, citations, model/API guidance, conceptual explanations, and examples that do not require building or running an API-backed artifact.
+
+## Workflow Configuration
+
+### Source Priority
+
+- For Codex self-knowledge, use the Codex source route below; it owns when to use the manual helper, Docs MCP, or bounded uncertainty.
+- For non-Codex OpenAI docs questions, use `mcp__openaiDeveloperDocs__search_openai_docs` to find the most relevant doc pages.
+- For non-Codex OpenAI docs questions, fetch the relevant page with `mcp__openaiDeveloperDocs__fetch_openai_doc` before answering. If search is noisy, run a narrower Docs MCP search; when any plausible official OpenAI docs URL is known or found, try fetching that URL through Docs MCP before relying on web-search content.
+- For API reference, schema, parameter, or required-field questions, use `mcp__openaiDeveloperDocs__get_openapi_spec` when available to verify the API shape alongside the relevant guide or reference page.
+- Use `mcp__openaiDeveloperDocs__list_openai_docs` only when you need to browse or discover non-Codex pages without a clear query.
+- For model-selection, "latest model", or default-model questions, fetch `https://developers.openai.com/api/docs/guides/latest-model.md` first. If that is unavailable, load `references/latest-model.md`.
+- For model upgrades or prompt upgrades, run `node scripts/resolve-latest-model-info.js` only when the target is latest/current/default or otherwise unspecified; otherwise preserve the explicitly requested target.
+- Preserve explicit target requests: if the user names a target model like "migrate to GPT-5.4", keep that requested target even if `latest-model.md` names a newer model. Mention newer guidance only as optional.
+- If current remote guidance is needed, fetch both the returned migration and prompting guide URLs directly. If direct fetch fails, use MCP/search fallback; if that also fails, use bundled fallback references and disclose the fallback.
+
+## OpenAI product snapshots
+
+1. Apps SDK: Build ChatGPT apps by providing a web component UI and an MCP server that exposes your app's tools to ChatGPT.
+2. Responses API: A unified endpoint designed for stateful, multimodal, tool-using interactions in agentic workflows.
+3. Chat Completions API: Generate a model response from a list of messages comprising a conversation.
+4. Codex: OpenAI's coding agent for software development that can write, understand, review, and debug code.
+5. gpt-oss: Open-weight OpenAI reasoning models (gpt-oss-120b and gpt-oss-20b) released under the Apache 2.0 license.
+6. Realtime API: Build low-latency, multimodal experiences including natural speech-to-speech conversations.
+7. Agents SDK: A toolkit for building agentic apps where a model can use tools and context, hand off to other agents, stream partial results, and keep a full trace.
+
+## Codex self-knowledge
+
+Use this path for questions about Codex itself: configuring, extending, operating, troubleshooting, local state, product surfaces, or where Codex behavior should live. A codebase merely mentioning a plugin, skill, hook, MCP server, browser, or automation is not enough. For generic software tasks, answer the software task directly; if asked whether Codex self-knowledge applies, answer that meta question briefly and continue the requested artifact.
+
+### Source Route
+
+The Codex manual is the first source for broad Codex synthesis. Treat the manual and Docs MCP as different lanes, not interchangeable official-doc sources. For published-user Codex product answers, the source route is complete: the manual, Docs MCP when this route calls for it, official OpenAI web fallback, and callable capabilities surfaced in the current session when the question is about that capability. Knowledge bases outside developers.openai.com are outside this route for public product answers.
+
+For broad Codex behavior, setup, customization, skills, plugins, MCP, hooks, `AGENTS.md`, automations, surfaces, local state, or system-map questions:
+
+1. Reuse a same-thread manual and outline path when it is still fresh.
+2. Otherwise run the skill-local helper first in normal writable sessions. Skip it without trying only when the session is explicitly read-only, shell execution is unavailable, or visible policy shows no allowed temp cache.
+3. By default, the helper chooses the first usable temp cache dir in this order: `$TMPDIR/openai-docs-cache`, `%TEMP%\openai-docs-cache`, `%TMP%\openai-docs-cache`, `/private/tmp/openai-docs-cache`, then `/tmp/openai-docs-cache`. Workspace-only write access is not enough for this temp cache.
+4. Run the helper directly unless you need to override the cache dir. The helper falls back to `curl` when native `fetch` is unavailable or when proxy env vars are present, so no shell-specific proxy prefix is required. Resolve `<skill-dir>` to this skill's actual directory; in copied local eval workdirs this is usually `.codex/skills/openai-docs`:
+
+```bash
+node <skill-dir>/scripts/fetch-codex-manual.mjs
+```
+
+If you need to override the cache dir, pass `--cache-dir <cache-dir>`. On Windows, the helper checks `%TEMP%` and `%TMP%` automatically; in PowerShell, `$env:TEMP\openai-docs-cache` is a typical explicit override.
+
+Treat helper availability as established by explicit read-only/no-shell policy or an actual command result. A guessed sandbox or guessed helper failure is not enough to switch to Docs MCP or web lookup; after an actual helper command failure, continue to the narrowest official next source below.
+
+The helper verifies freshness, writes `codex-manual.md`, and emits `codex-manual.outline.md`. The outline maps source pages and headings to line ranges; use it to choose the relevant manual section, then read or search targeted manual sections for Codex product facts. Use the skill directory to locate and run the helper; after the helper succeeds, use the returned manual and outline paths as the search scope for Codex product facts and term coverage checks.
+
+Reuse the same-thread manual and outline paths for follow-up Codex questions. Refresh first when the manual was fetched more than about a day ago, the path is unusable, the path came from another thread or uncertain provenance, or likely-current information is missing and staleness is plausible.
+
+For questions about whether the manual is current enough to rely on now, run the helper when temp caching is allowed and base the answer on its returned status, manual path, and outline path.
+
+If the manual resolves a Codex claim, answer from it and stop expanding sources for that claim; continue the user's broader task if the docs lookup was only one dependency. Manual source pages and known anchors are enough citation support for manual-covered material.
+
+If the helper is skipped because the session is read-only, has no shell execution, or has no allowed temp cache, the next source is Docs MCP: call `mcp__openaiDeveloperDocs__search_openai_docs`, then `mcp__openaiDeveloperDocs__fetch_openai_doc` for a relevant hit before any web fallback.
+
+If a user names a Codex term or mode that a fresh manual does not use, search the manual for obvious adjacent concepts, then answer that the exact term is not documented and use the closest documented terminology. If the prompt asks how that term maps to Codex behavior, resolve the mapping from adjacent manual sections. If the exact term remains material or likely current after that manual pass, use one narrow Docs MCP search/fetch before bounded uncertainty; otherwise, the source lookup for that terminology or mapping claim is complete.
+
+Use the narrowest official next source only when the manual is unavailable, the helper fails, temp caching is not allowed, another material claim is missing or likely stale, or the user explicitly needs a page-specific citation. Prefer one specific Docs MCP search and, if it returns a clearly relevant page, one fetch; for unresolved Codex capability names, acronyms, scheduling terms, or exact error text, this Docs MCP step is the next source before web search. After the manual plus any permitted Docs MCP gap-fill, resolve remaining gaps as bounded uncertainty. Use official-domain web fallback only after that Docs MCP path is unavailable or unhelpful. If the claim is still not established, stop with bounded uncertainty. If official docs/manual conflict with a callable capability already surfaced in the current session, state the conflict and prefer verified current-session behavior for that environment.
+
+For undocumented or private-looking model slugs, product mode labels, entitlement labels, account access paths, or rollout names, answer from current public docs and bounded uncertainty. Those labels are not a reason to leave the public source route.
+
+For support-style diagnostics, prefer a layer-by-layer answer from the manual over provider-specific web lookups: installed/enabled plugin, bundled app or connector authorization, MCP setup, workspace/admin policy, restart or new-thread expectations, then support or feedback if still unresolved.
+
+If the source route still does not establish a claim, return bounded uncertainty or route to support, an admin, or product feedback instead of widening the investigation.
+
+For unresolved product terminology, answer from the manual plus the allowed official next source. If those sources do not establish the term, answer with bounded uncertainty from those sources.
+
+### Surface Map
+
+When Codex nouns or durable-instruction surfaces overlap, recommend the smallest surface that matches the scope:
+
+- Prompt or thread context -> one-off task constraints.
+- `AGENTS.md` -> durable repo conventions, commands, verification steps, and review expectations; closer nested files apply under their subtree.
+- Project `.codex/config.toml` -> trusted-repo Codex settings such as sandbox, MCP, hooks, model, or reasoning defaults.
+- Global config or global guidance -> personal defaults across repos.
+- Skill -> reusable task workflow with references or scripts.
+- Plugin -> installable bundle with skills plus commands, tools, MCP config, hooks, assets, apps, or marketplace metadata.
+- MCP server or app connector -> live external data/actions or authorized private app/workspace data. Use connectors for private Google Docs, Calendar, Slack, GitHub, Notion, and similar data instead of web search or model memory.
+- Automation -> scheduled checks, reminders, monitors, or follow-up work; use a thread heartbeat when continuity in an existing thread matters.
+- Hook -> lifecycle enforcement around tool calls, commands, or file edits.
+
+Split mixed-scope requests instead of forcing one answer. Example: "always do X, but only for this PR" defaults to prompt/thread context for the current run; use `AGENTS.md` or project config only if it should persist, hooks only for mechanical enforcement, and automations only for scheduled or follow-up work.
+
+Use this quick product map when needed: CLI is terminal-first local repo work; IDE extension is editor-attached coding; Codex app is desktop planning, review, and interactive work; cloud/web is hosted parallel/offloaded work; Browser Use/in-app browser is Codex-controlled web testing; Chrome extension uses the user's Chrome profile; Computer Use controls desktop apps and OS UI. Keep `config.toml` defaults, `requirements.toml` constraints, and managed/admin policy separate.
+
+### Boundaries And Output
+
+- API key auth does not imply ChatGPT, cloud task, or connector access. For plugin/app/auth failures, check bundle availability, plugin installed/enabled state, connector/app authorization, MCP setup, restart/refresh expectations, workspace policy, and per-surface availability before answering.
+- Sandbox or network denials need scoped escalation with a clear justification. Destructive commands, writes outside the workspace, or broad access changes require explicit approval.
+- Memory can provide user preference or context, but explicit prompt instructions win and memory is not a source for current external facts.
+- For affirmative surface-selection answers, use this shape: recommendation, why, what to avoid, and the manual/source evidence used.
+- When page-specific Codex citations are actually needed, these anchors often fit: `concepts/customization#agents-guidance` for `AGENTS.md`, `concepts/customization#skills` for skills, `plugins/build#plugin-structure` for plugins, `concepts/customization#mcp` for MCP, `config-advanced#hooks` for hooks, `app/automations#thread-automations` for thread automations, and `config-reference#configtoml` for config.
+
+## If MCP server is missing
+
+If MCP tools fail or no OpenAI docs resources are available:
+
+1. Run the install command yourself: `codex mcp add openaiDeveloperDocs --url https://developers.openai.com/mcp`
+2. If it fails due to permissions/sandboxing, immediately retry the same command with escalated permissions and include a 1-sentence justification for approval.
+3. Ask the user to run the install command only if the escalated attempt fails.
+4. Ask the user to restart Codex.
+5. Re-run the doc search/fetch after restart.
+
+## Workflow
+
+1. Clarify whether the request is general docs lookup, model selection, a model-string upgrade, prompt-upgrade guidance, or broader API/provider migration.
+2. For Codex self-knowledge requests, follow the Codex self-knowledge source procedure above.
+3. For model-selection or upgrade requests, prefer current remote docs over bundled references when the user asks for latest/current/default guidance.
+   - Fetch `https://developers.openai.com/api/docs/guides/latest-model.md`.
+   - Find the latest model ID and explicit migration or prompt-guidance links.
+   - Prefer explicit links from the latest-model page over derived URLs.
+   - For explicit named-model requests, preserve the requested model target. Mention newer remote guidance only as optional.
+   - For dynamic latest/current/default upgrades, run `node scripts/resolve-latest-model-info.js`, then fetch both returned guide URLs directly when possible.
+   - If direct guide fetch fails, use the developer-docs MCP tools or official OpenAI-domain search to find the same guide content.
+   - If remote docs are unavailable, use bundled fallback references and say that fallback guidance was used.
+4. For model upgrades, keep changes narrow: update active OpenAI API model defaults and directly related prompts only when safe.
+5. Leave historical docs, examples, eval baselines, fixtures, provider comparisons, provider registries, pricing tables, alias defaults, low-cost fallback paths, and ambiguous older model usage unchanged unless the user explicitly asks to upgrade them.
+6. Keep SDK, tooling, IDE, plugin, shell, auth, and provider-environment migrations out of a model-and-prompt upgrade unless the user explicitly asks for them.
+7. If an upgrade needs API-surface changes, schema rewiring, tool-handler changes, or implementation work beyond a literal model-string replacement and prompt edits, report it as blocked or confirmation-needed.
+8. For general docs lookup, search docs with a precise query, fetch the best page and exact section needed, and answer with concise citations.
+
+## Reference map
+
+Read only what you need:
+
+- `https://developers.openai.com/api/docs/guides/latest-model.md` -> current model-selection and "best/latest/current model" questions.
+- `scripts/fetch-codex-manual.mjs` -> current Codex manual fetch, verification, local temp cache, and outline generation.
+- `https://developers.openai.com/codex/codex-manual.md` -> current Codex self-knowledge synthesis, including setup, customization, skills, plugins, MCP, hooks, `AGENTS.md`, automations, and surface behavior; normally access it through the helper path and targeted file reads when temp caching is available.
+- `references/latest-model.md` -> bundled fallback for model-selection and "best/latest/current model" questions.
+- `references/upgrade-guide.md` -> bundled fallback for model upgrade and upgrade-planning requests.
+- `references/prompting-guide.md` -> bundled fallback for prompt rewrites and prompt-behavior upgrades.
+
+## Quality rules
+
+- Treat OpenAI docs as the source of truth; avoid speculation.
+- For Codex self-knowledge, follow the source route above instead of relying on remembered behavior.
+- Keep migration changes narrow and behavior-preserving.
+- Prefer prompt-only upgrades when possible.
+- Avoid inventing pricing, availability, parameters, API changes, or breaking changes.
+- Keep quotes short and within policy limits; prefer paraphrase with citations.
+- If multiple pages differ, call out the difference and cite both.
+- If official docs and verified callable current-session behavior disagree, state the conflict before making broad claims or edits.
+- If docs do not cover the user’s need, say so and offer next steps.
+
+## Tooling notes
+
+- Use MCP doc tools before web search for OpenAI-related markdown docs. The Codex manual flow is the exception: follow the Codex self-knowledge source procedure for broad Codex synthesis.
+- If the MCP server is installed but returns no meaningful results, then use web search as a fallback.
+- When falling back to web search, restrict to official OpenAI domains (developers.openai.com, platform.openai.com) and cite sources.
diff --git a/skills/openai-docs/agents/openai.yaml b/skills/openai-docs/agents/openai.yaml
new file mode 100644
index 0000000..8bbf03c
--- /dev/null
+++ b/skills/openai-docs/agents/openai.yaml
@@ -0,0 +1,14 @@
+interface:
+  display_name: "OpenAI Docs"
+  short_description: "Reference OpenAI docs, Codex self-knowledge, and model migration guidance"
+  icon_small: "./assets/openai-small.svg"
+  icon_large: "./assets/openai.png"
+  default_prompt: "Use OpenAI Docs for official docs lookup, questions about Codex itself or Codex surfaces, model selection, model migration, and prompt-upgrade work."
+
+dependencies:
+  tools:
+    - type: "mcp"
+      value: "openaiDeveloperDocs"
+      description: "OpenAI Developer Docs MCP server"
+      transport: "streamable_http"
+      url: "https://developers.openai.com/mcp"
diff --git a/skills/openai-docs/assets/openai-small.svg b/skills/openai-docs/assets/openai-small.svg
new file mode 100644
index 0000000..1d075dc
--- /dev/null
+++ b/skills/openai-docs/assets/openai-small.svg
@@ -0,0 +1,3 @@
+<svg xmlns="http://www.w3.org/2000/svg" width="14" height="14" fill="currentColor" viewBox="0 0 14 14">
+  <path d="M10.931 3.34a.112.112 0 0 0-.069-.104l-.038-.007c-1.537.05-2.45.318-3.714 1.002v6.683c.48-.248.936-.44 1.414-.58.695-.203 1.417-.292 2.303-.305l.038-.008a.113.113 0 0 0 .066-.104V3.341ZM2.363 9.919c0 .064.051.11.105.111l.33.008c1.162.046 2.042.243 2.975.662-.403-.585-1.008-1.075-1.654-1.292a.991.991 0 0 1-.674-.941v-5.14a6.36 6.36 0 0 0-.59-.076l-.37-.02a.115.115 0 0 0-.122.111v6.577Zm9.455-.001a.998.998 0 0 1-.877.992l-.101.007c-.832.012-1.47.095-2.066.27-.599.174-1.176.448-1.883.863a.444.444 0 0 1-.449 0c-1.299-.763-2.229-1.07-3.689-1.125l-.299-.008a.997.997 0 0 1-.977-.998V3.342c0-.573.478-1.017 1.038-.999l.417.023c.188.015.35.037.513.062v-.754c0-.708.749-1.244 1.429-.903.984.492 1.836 1.449 2.15 2.505 1.216-.617 2.222-.884 3.771-.934l.105.003a.998.998 0 0 1 .918.996v6.576ZM4.332 8.466c0 .049.03.087.07.1l.24.091a4.319 4.319 0 0 1 1.581 1.176V3.721c-.164-.803-.799-1.617-1.584-2.07l-.162-.088c-.025-.012-.054-.013-.088.009a.12.12 0 0 0-.057.102v6.792Z"/>
+</svg>
diff --git a/skills/openai-docs/assets/openai.png b/skills/openai-docs/assets/openai.png
new file mode 100644
index 0000000000000000000000000000000000000000..e9b9eb80cd90ccdfc7e276b07f4046aa9c9d1887
GIT binary patch
literal 1429
zcmbW1X)qfI7>2WsZI&%Dh?dljBaOCEMMKw7ZA6J9aYbCMqq=TtRa|RzO_Vl5(Tby3
z>WGvo5$jf6$Dnm3k*y$7_qxxBm9_eJr$2Uf=6%0+=J|ep?|hH#F_x#Ll%)Uwz-hD<
z%JC%qJ{u@@GLIjMi30$Vo@mrf=a?63lOMvlevr3YeHmW9u)%SZM{6T>Dj>OG-NM(s
zxeg66h^R2ccnS@hB9Zx5zfp_$#T*uKL&buLGL{${$dr@`q~IC?DdR&0Yq0d<K8P63
zoq-ia(lt|gi+>z!?aXm2s}%cPO10FrRE?G-k0{=7K$_&kI=~e$pjYgzE8vVY;O<xd
zh7-$JISb@wBgjW#OZ1&1O&;m2U9KfMN=UULqKFQf`-x@tWG&~CiRI{9?_3=;#l~lR
zK#z)MO6IJRX|$k#ma65P3XlGZ>>46Hm7aP^&cE!{sKcdEAVNXg4w0>eo^HyTDRAUX
z1q<1l*$z0vv6jqHvTYK7N`0u5;6yAk8Hu1q<Wy{rILx>vr9>?%KFBwx(h6KK`f%%#
zP9L?T7T}-#%27<caJiY)8CM_rxL@n9YJDZNu(J9ejFfg_<ecNPs>~gRX#U;>m%`xu
zRx(>rAYhNw6pH4Us6k_8+@3ALmhG5zSAFOj7mD2H0~sQ=I4$p^(D+2UDcut(d(Zp!
z$J7P4kw8<WXpL^om{teTpzUG?*SB;E6jJ+JHsPQr$qRnXhSVG{9g$TC8FX`Rpn&7+
z49+fmGzlrEzf8G|kl-q=EvOW>gyQccMw&gi*xV|;t$}UYUBXtS6J`v8J*FsDliZ(~
z<@+Da;4XO8{*25XsWoe!b=2mY`PSnj0Z7~UQ*|-j*hV&a!&>HP&o)P@{myW|*myuJ
zPL74L-`HWji(Yv(m?iF4r#zM!p1!g6I7dIXic~LBBSC+v<&e%2x^h<IJiw&mW8Z#0
z{_2-+{>38vZ+K%YzU=I56m0T>JWomcJPn6TrJifjM(Wx@?~P{4<?FFY@=pSTUd~o}
zZK;*aN^s}j1WEV4qnQKwZ1F*R%O8oLP)$oaCzXCD=G9&pHSm0{G{lAl`D<rbJ!ccF
z85QDL+)<5fuOZ(l(?EyaR!ECYYzqjdxCOQ|wYt!U3M5cglY$y?<CzeXXL_6rDorOB
zaCnI6Jd%^$mGOf;e;0TE^1W_)bg_09Rn>%}rrY5}h#pwawmf9bv&aQiDux**Y3-i1
zqTMnW8G{DfFvi;3E(l}R$dnUJ(<_$+W=og_k=xR0MMrfK2)TPiox{1oBNwcL>8#m#
z2$uC?K_J`ikEKh0r?2|0pJAYIrydWjz4!V9$3;~TX9@!$D);A=7}tjnb%dew^(*jT
z!cczU%3j<f{C>Ofc-pF{Xw&l)zxDY>N0@3`IgX*{{x>pcJ4^R^O&K$8J*lYk{{3ft
z3HXDsfQ`mNPS^OYH*TNCxEWY;hF<R+^scY<FnNH(oQP8l2?g@@NIEiwbCYYbI|48j
z8ozE+o#IU-lr!8uz1JY-%2OJSVuk1og^-S*(3~~~GPq`>@zMxCh3axXGT}NR5^Abn
zdCpco+Y1il&A)g0(10*jT094hy+6Dx>_H|(eSZ_d9(a-0S=ek~_H;O<t9ybI)3JKg
zbOx4(h)2Y)5Ec$=Bnn#aUqfE~t^>Zvn>M@rc@Zsm>2rYBSEw^m9;T>t);vhumBCh|
zt36@MO*|h0+t^`bH+9yn%$0(3`IN-}RNc3{YL?YaM@F{M$-4!hEikCpNbjV70IV&k
AfB*mh

literal 0
HcmV?d00001

diff --git a/skills/openai-docs/references/latest-model.md b/skills/openai-docs/references/latest-model.md
new file mode 100644
index 0000000..a1ffbfb
--- /dev/null
+++ b/skills/openai-docs/references/latest-model.md
@@ -0,0 +1,37 @@
+# Latest model guide
+
+This file is a curated helper. Every recommendation here must be verified against current OpenAI docs before it is repeated to a user.
+
+## Current model map
+
+| Model ID | Use for |
+| --- | --- |
+| `gpt-5.5` | Latest/default text and reasoning model for most new apps, including coding and tool-heavy workflows |
+| `gpt-5.5-pro` | Maximum reasoning or quality when latency and cost matter less |
+| `gpt-5.4` | Previous default text and reasoning model; use for existing GPT-5.4 integrations |
+| `gpt-5.4-mini` | Lower-cost testing and lighter production workflows |
+| `gpt-5.4-nano` | High-throughput simple tasks and classification |
+| `gpt-5.5` | Explicit no-reasoning text path via `reasoning.effort: none` |
+| `gpt-4.1-mini` | Cheaper no-reasoning text |
+| `gpt-4.1-nano` | Fastest and cheapest no-reasoning text |
+| `gpt-5.3-codex` | Agentic coding, code editing, and tool-heavy coding workflows |
+| `gpt-5.1-codex-mini` | Cheaper coding workflows |
+| `gpt-image-2` | Best image generation and edit quality |
+| `gpt-image-1.5` | Less expensive image generation and editing |
+| `gpt-image-1-mini` | Cost-optimized image generation |
+| `gpt-4o-mini-tts` | Text-to-speech |
+| `gpt-4o-mini-transcribe` | Speech-to-text, fast and cost-efficient |
+| `gpt-realtime-1.5` | Realtime voice and multimodal sessions |
+| `gpt-realtime-mini` | Cheaper realtime sessions |
+| `gpt-audio` | Chat Completions audio input and output |
+| `gpt-audio-mini` | Cheaper Chat Completions audio workflows |
+| `sora-2` | Faster iteration and draft video generation |
+| `sora-2-pro` | Higher-quality production video |
+| `omni-moderation-latest` | Text and image moderation |
+| `text-embedding-3-large` | Higher-quality retrieval embeddings; default in this skill because no best-specific row exists |
+| `text-embedding-3-small` | Lower-cost embeddings |
+
+## Maintenance notes
+
+- This file will drift unless it is periodically re-verified against current OpenAI docs.
+- If this file conflicts with current docs, the docs win.
diff --git a/skills/openai-docs/references/prompting-guide.md b/skills/openai-docs/references/prompting-guide.md
new file mode 100644
index 0000000..0d9273c
--- /dev/null
+++ b/skills/openai-docs/references/prompting-guide.md
@@ -0,0 +1,244 @@
+GPT-5.5 works best when prompts define the outcome and leave room for the model to choose an efficient solution path. Compared with earlier models, you can often use shorter, more outcome-oriented prompts: describe what good looks like, what constraints matter, what evidence is available, and what the final answer should contain.
+
+Avoid carrying over every instruction from an older prompt stack. Legacy prompts often over-specify the process because earlier models needed more help staying on track. With GPT-5.5, that can add noise, narrow the model's search space, or lead to overly mechanical answers.
+
+For more detail on GPT-5.5 behavior changes, start with the [Using GPT-5.5 guide](/api/docs/guides/latest-model). This guide focuses on prompt changes that follow from those behavior changes.
+
+The patterns here are starting points. Adapt them to your product surface, tools, evals, and user experience goals.
+
+## Personality and behavior
+
+GPT-5.5's default style is efficient, direct, and task-oriented. This is useful for production systems: responses stay focused, behavior is easier to steer, and the model avoids unnecessary conversational padding.
+
+For customer-facing assistants, support workflows, coaching experiences, and other conversational products, define both personality and collaboration style.
+
+- **Personality** controls how the assistant sounds: tone, warmth, directness, formality, humor, empathy, and level of polish.
+- **Collaboration style** controls how the assistant works: when it asks questions, when it makes assumptions, how proactive it should be, how much context it gives, when it checks work, and how it handles uncertainty or risk.
+
+Keep both short. Personality instructions should shape the user experience. Collaboration instructions should shape task behavior. Neither should replace clear goals, success criteria, tool rules, or stopping conditions.
+
+Example personality block for a steady task-focused assistant:
+
+```text
+# Personality
+You are a capable collaborator: approachable, steady, and direct. Assume the user is competent and acting in good faith, and respond with patience, respect, and practical helpfulness.
+
+Prefer making progress over stopping for clarification when the request is already clear enough to attempt. Use context and reasonable assumptions to move forward. Ask for clarification only when the missing information would materially change the answer or create meaningful risk, and keep any question narrow.
+
+Stay concise without becoming curt. Give enough context for the user to understand and trust the answer, then stop. Use examples, comparisons, or simple analogies when they make the point easier to grasp. When correcting the user or disagreeing, be candid but constructive. When an error is pointed out, acknowledge it plainly and focus on fixing it.
+
+Match the user's tone within professional bounds. Avoid emojis and profanity by default, unless the user explicitly asks for that style or has clearly established it as appropriate for the conversation.
+```
+
+Example personality block for an expressive collaborative assistant:
+
+```text
+# Personality
+Adopt a vivid conversational presence: intelligent, curious, playful when appropriate, and attentive to the user's thinking. Ask good questions when the problem is blurry, then become decisive once there is enough context.
+
+Be warm, collaborative, and polished. Conversation should feel easy and alive, but not chatty for its own sake. Offer a real point of view rather than merely mirroring the user, while staying responsive to their goals and constraints.
+
+Be thoughtful and grounded when the task calls for synthesis or advice. State a clear recommendation when you have enough context, explain important tradeoffs, and name uncertainty without becoming evasive.
+```
+
+For more expressive products, add warmth, curiosity, humor, or point of view explicitly, but keep the block short. Use personality to shape the experience, not to compensate for unclear goals or missing task instructions.
+
+## Improve time to first visible token with a preamble
+
+In streaming applications, users notice how long it takes before the first visible response appears. GPT-5.5 may spend time reasoning, planning, or preparing tool calls before emitting visible text.
+
+For longer or tool-heavy tasks, prompt the model to start with a short preamble: a brief visible update that acknowledges the request and states the first step. This can improve perceived responsiveness without changing the underlying task.
+
+Use this pattern when the task may take more than one step, require tool calls, or involve a long-running agent workflow.
+
+```text
+Before any tool calls for a multi-step task, send a short user-visible update that acknowledges the request and states the first step. Keep it to one or two sentences.
+```
+
+For coding agents that expose separate message phases, you can be more explicit:
+
+```text
+You must always start with an intermediary update before any content in the analysis channel if the task will require calling tools. The user update should acknowledge the request and explain your first step.
+```
+
+## Outcome-first prompts and stopping conditions
+
+GPT-5.5 is strongest when the prompt defines the target outcome, success criteria, constraints, and available context, then lets the model choose the path.
+
+For many tasks, describe the destination rather than every step. This gives the model room to choose the right search, tool, or reasoning strategy for the task.
+
+Prefer this:
+
+```text
+Resolve the customer's issue end to end.
+
+Success means:
+- the eligibility decision is made from the available policy and account data
+- any allowed action is completed before responding
+- the final answer includes completed_actions, customer_message, and blockers
+- if evidence is missing, ask for the smallest missing field
+```
+
+**Avoid unnecessary absolute rules.** Older prompts often use strict instructions like `ALWAYS`, `NEVER`, `must`, and `only` to control model behavior. Use those words for true invariants, such as safety rules, required output fields, or actions that should never happen. For judgment calls, such as when to search, ask for clarification, use a tool, or keep iterating, prefer decision rules instead.
+
+Avoid this style of instruction unless every step is truly required:
+
+```text
+First inspect A, then inspect B, then compare every field, then think through
+all possible exceptions, then decide which tool to call, then call the tool,
+then explain the entire process to the user.
+```
+
+Add explicit stopping conditions:
+
+```text
+Resolve the user query in the fewest useful tool loops, but do not let loop minimization outrank correctness, accessible fallback evidence, calculations, or required citation tags for factual claims.
+
+After each result, ask: "Can I answer the user's core request now with useful evidence and citations for the factual claims?" If yes, answer.
+```
+
+Define missing-evidence behavior:
+
+```text
+Use the minimum evidence sufficient to answer correctly, cite it precisely, then stop.
+```
+
+## Formatting
+
+GPT-5.5 is highly steerable on output format and structure. Use that control when it improves comprehension or product fit.
+
+Set `text.verbosity`, describe the expected output shape, and reserve heavier structure for cases where it improves comprehension or your product UI needs a stable artifact. The API default for `text.verbosity` is `medium`; use `low` when you prefer shorter, more concise responses.
+
+Plain conversational formatting:
+
+```text
+Let formatting serve comprehension. Use plain paragraphs as the default format for normal conversation, explanations, reports, documentation, and technical writeups. Keep the presentation clean and readable without making the structure feel heavier than the content.
+
+Use headers, bold text, bullets, and numbered lists sparingly. Reach for them when the user requests them, when the answer needs clear comparison or ranking, or when the information would be harder to scan as prose. Otherwise, favor short paragraphs and natural transitions.
+
+Respect formatting preferences from the user. If they ask for a terse answer, minimal formatting, no bullets, no headers, or a specific structure, follow that preference unless there is a strong reason not to.
+```
+
+Add explicit audience and length guidance:
+
+```text
+Write for a senior business audience. Keep the answer under 400 words. Use short paragraphs and only include bullets when they improve scannability. Prioritize the conclusion first, then the reasoning, then caveats.
+```
+
+For editing, rewriting, summaries, or customer-facing messages, tell the model what to preserve before asking it to improve style. This pattern is useful when you want polish without expansion.
+
+```text
+Preserve the requested artifact, length, structure, and genre first. Quietly improve clarity, flow, and correctness. Do not add new claims, extra sections, or a more promotional tone unless explicitly requested.
+```
+
+## Grounding, citations, and retrieval budgets
+
+For grounded answers, citation behavior should be part of the prompt. Define what needs support, what counts as enough evidence, and how the model should behave when evidence is missing. Absence of evidence shouldn't automatically become a factual "no." For more details and examples, see the [citation formatting guide](/api/docs/guides/citation-formatting).
+
+### Add an explicit retrieval budget
+
+Retrieval budgets are stopping rules for search. They tell the model when enough evidence is enough.
+
+```text
+For ordinary Q&A, start with one broad search using short, discriminative keywords. If the top results contain enough citable support for the core request, answer from those results instead of searching again.
+
+Make another retrieval call only when:
+- The top results do not answer the core question.
+- A required fact, parameter, owner, date, ID, or source is missing.
+- The user asked for exhaustive coverage, a comparison, or a comprehensive list.
+- A specific document, URL, email, meeting, record, or code artifact must be read.
+- The answer would otherwise contain an important unsupported factual claim.
+
+Do not search again to improve phrasing, add examples, cite nonessential details, or support wording that can safely be made more generic.
+```
+
+## Creative drafting guardrails
+
+For drafting tasks, tell the model which claims must come from sources and which parts may be creatively written. This is especially important for slides, launch copy, customer summaries, talk tracks, leadership blurbs, and narrative framing.
+
+```text
+For creative or generative requests such as slides, leadership blurbs, outbound copy, summaries for sharing, talk tracks, or narrative framing, distinguish source-backed facts from creative wording.
+
+- Use retrieved or provided facts for concrete product, customer, metric, roadmap, date, capability, and competitive claims, and cite those claims.
+- Do not invent specific names, first-party data claims, metrics, roadmap status, customer outcomes, or product capabilities to make the draft sound stronger.
+- If there is little or no citable support, write a useful generic draft with placeholders or clearly labeled assumptions rather than unsupported specifics.
+```
+
+## Frontend engineering and visual taste
+
+For frontend work, refer to the [example instructions](/api/docs/guides/frontend-prompt) for practical ways to steer UI quality. They cover product and user context, design-system alignment, first-screen usability, familiar controls, expected states, responsive behavior, and common generated-UI defaults to avoid, such as generic heroes, nested cards, decorative gradients, visible instructional text, and broken layouts.
+
+## Prompt the model to check its work
+
+Give GPT-5.5 access to tools that let it check outputs when validation is possible.
+
+For coding agents, ask for concrete validation commands:
+
+```text
+After making changes, run the most relevant validation available:
+- targeted unit tests for changed behavior
+- type checks or lint checks when applicable
+- build checks for affected packages
+- a minimal smoke test when full validation is too expensive
+
+If validation cannot be run, explain why and describe the next best check.
+```
+
+For visual artifacts, ask for inspection after rendering:
+
+```text
+Render the artifact before finalizing. Inspect the rendered output for layout, clipping, spacing, missing content, and visual consistency. Revise until the rendered output matches the requirements.
+```
+
+For engineering and planning tasks, make implementation plans traceable:
+
+```text
+For implementation plans, include:
+- requirements and where each is addressed
+- named resources, files, APIs, or systems involved
+- state transitions or data flow where relevant
+- validation commands or checks
+- failure behavior
+- privacy and security considerations
+- open questions that materially affect implementation
+```
+
+## Phase parameter
+
+Starting with GPT-5.4, long-running or tool-heavy Responses workflows can use assistant-item `phase` values to distinguish intermediate updates from final answers. GPT-5.5 uses the same pattern.
+
+If you use `previous_response_id`, the API preserves prior assistant state automatically. If your application manually replays assistant output items into the next request, preserve each original `phase` value and pass it back unchanged. This matters most when a response includes preambles, repeated tool calls, or a final answer after intermediate assistant updates.
+
+```text
+If manually replaying assistant items:
+- Preserve assistant `phase` values exactly.
+- Use `phase: "commentary"` for intermediate user-visible updates.
+- Use `phase: "final_answer"` for the completed answer.
+- Do not add `phase` to user messages.
+```
+
+## Suggested prompt structure
+
+Use this structure as a starting point for complex prompts. Keep each section short. Add detail only where it changes behavior.
+
+```text
+Role: [1-2 sentences defining the model's function, context, and job]
+
+# Personality
+[tone, demeanor, and collaboration style]
+
+# Goal
+[user-visible outcome]
+
+# Success criteria
+[what must be true before the final answer]
+
+# Constraints
+[policy, safety, business, evidence, and side-effect limits]
+
+# Output
+[sections, length, and tone]
+
+# Stop rules
+[when to retry, fallback, abstain, ask, or stop]
+```
diff --git a/skills/openai-docs/references/upgrade-guide.md b/skills/openai-docs/references/upgrade-guide.md
new file mode 100644
index 0000000..b29f137
--- /dev/null
+++ b/skills/openai-docs/references/upgrade-guide.md
@@ -0,0 +1,181 @@
+# Upgrading to GPT-5.5
+
+Use this guide when the user explicitly asks to upgrade an existing integration to GPT-5.5. Pair it with current OpenAI docs lookups. The default target string is `gpt-5.5`.
+
+## Freshness check
+
+Before applying this bundled guide for a latest/current/default model upgrade, run `node scripts/resolve-latest-model-info.js` from the OpenAI Docs skill directory.
+
+- If the command returns `modelSlug: "gpt-5p5"`, continue with this bundled guide and use `references/prompting-guide.md` when prompt updates are needed.
+- If the command returns a different `modelSlug`, fetch both the returned `migrationGuideUrl` and `promptingGuideUrl` and use them as the current source of truth instead of the bundled references.
+- If the command fails, metadata is missing, or either remote guide cannot be fetched, continue with bundled fallback references and say the remote freshness check was unavailable.
+- If the user explicitly named a target model, preserve that target and use current docs only to check compatibility or caveats.
+
+## Upgrade posture
+
+Upgrade with the narrowest safe change set:
+
+- replace the model string first
+- update only the prompts that are directly tied to that model usage
+- do not automatically upgrade older or ambiguous model usages that may be intentionally pinned, such as historical docs, examples, tests, eval baselines, comparison code, or low-cost fallback/routing paths. Unless the user explicitly asks to upgrade all model usage, leave those sites unchanged and list them as confirmation-needed
+- prefer prompt-only upgrades when possible
+- if the upgrade would require API-surface changes, parameter rewrites, tool rewiring, provider migration, or broader code edits, mark it as blocked instead of stretching the scope
+
+## Upgrade workflow
+
+1. Inventory current model usage.
+   - Search for model strings, client calls, and prompt-bearing files.
+   - Include inline prompts, prompt templates, YAML or JSON configs, Markdown docs, and saved prompts when they are clearly tied to a model usage site.
+2. Pair each model usage with its prompt surface.
+   - Prefer the closest prompt surface first: inline system or developer text, then adjacent prompt files, then shared templates.
+   - If you cannot confidently tie a prompt to the model usage, say so instead of guessing.
+3. Classify the source model family.
+   - Common buckets: GPT-5.4, GPT-5.3-Codex or GPT-5.2-Codex, earlier GPT-5.x, GPT-4o or GPT-4.1, reasoning models such as o1 or o3 or o4-mini, third-party model, or mixed and unclear.
+4. Decide the upgrade class.
+   - `model string only`
+   - `model string + light prompt rewrite`
+   - `blocked` (the upgrade cannot proceed without code changes)
+5. Run the compatibility gate.
+   - Check whether the current integration can accept `gpt-5.5` without API-surface changes or implementation changes.
+   - Check whether structured outputs, tool schemas, function names, and downstream parsers can remain unchanged.
+   - For long-running Responses or tool-heavy agents, check whether `phase` is already preserved or round-tripped when the host replays assistant items or uses preambles.
+   - If compatibility depends on code changes, return `blocked`.
+   - If compatibility is unclear, return `unknown` rather than improvising.
+6. Apply the upgrade when it is in scope.
+   - Default replacement string: `gpt-5.5`.
+   - Keep the intervention small and behavior-preserving.
+   - Start from the current reasoning effort when it is visible unless there is a measured reason to change it.
+   - For in-scope changes, update the model string and directly related prompts.
+   - For blocked or unknown changes, do not edit; report the blocker or uncertainty.
+7. Summarize the result.
+   - `Current model usage`
+   - `Model-string updates`
+   - `Reasoning-effort handling`
+   - `Prompt updates`
+   - `Structured output and formatting assessment`
+   - `Tool-use assessment` when the flow uses tools, retrieval, or terminal actions
+   - `Phase assessment` when the flow is long-running, replayed, or tool-heavy
+   - `Compatibility check`
+   - `Validation performed`
+
+Output rule:
+
+- For each usage site, state the starting reasoning-effort recommendation.
+- If the repo exposes the current reasoning setting, recommend preserving it first unless current OpenAI docs say otherwise.
+- If the repo does not expose the current setting, recommend not adding one unless current OpenAI docs require it.
+
+## Upgrade outcomes
+
+### `model string only`
+
+Choose this when:
+
+- the source model is GPT-5.4
+- the existing prompts are already short, explicit, and task-bounded
+- the workflow does not rely on strict output formats, tool-call behavior, batch completeness, or long-horizon execution that should be validated after the upgrade
+- there are no obvious compatibility blockers
+
+Default action:
+
+- replace the model string with `gpt-5.5`
+- preserve the current reasoning effort
+- keep prompts unchanged
+- validate behavior with existing tests, realistic spot checks, or an existing eval suite when one is already available
+
+### `model string + light prompt rewrite`
+
+Choose this when:
+
+- the task needs stronger completeness, citation discipline, verification, or dependency handling
+- the upgraded model becomes too verbose, too dense, or hard to scan unless formatting is constrained
+- the workflow has strict output shape requirements and lacks an explicit format contract, schema, or parser validation
+- the workflow is research-heavy and needs stronger handling of sparse or empty retrieval results
+- the workflow is coding-oriented, terminal-based, tool-heavy, or multi-agent, but the existing API surface and tool definitions can remain unchanged
+
+Default action:
+
+- replace the model string with `gpt-5.5`
+- preserve the current reasoning effort for the first pass
+- make only the smallest prompt edits needed for the observed workflow risk
+- read the [GPT-5.5 prompting guide](/api/docs/guides/prompt-guidance?model=gpt-5.5) to choose the smallest prompt changes that recover or improve behavior
+- avoid broad prompt cleanup unrelated to the upgrade
+- for research workflows, add citation rules, retrieval budgets, missing-evidence behavior, and validation guidance from the prompting guide
+- for dependency-aware or tool-heavy workflows, add prerequisite checks, missing-context handling, explicit tool budgets, stop conditions, and validation guidance
+- for coding or terminal workflows, add repo-specific constraints, acceptance criteria, and concrete validation commands
+- for multi-agent support or triage workflows, add task ownership, handoff, completeness, and stopping criteria
+- for long-running Responses agents with preambles or multiple assistant messages, explicitly review whether `phase` is already handled; if adding or preserving `phase` would require code edits, mark the path as `blocked`
+- do not classify a coding or tool-using Responses workflow as `blocked` just because the visible snippet is minimal; prefer `model string + light prompt rewrite` unless the repo clearly shows that a safe GPT-5.5 path would require host-side code changes
+
+### `blocked`
+
+Choose this when:
+
+- the upgrade appears to require API-surface changes
+- the upgrade appears to require parameter rewrites or reasoning-setting changes that are not exposed outside implementation code
+- the upgrade would require changing tool definitions, tool handler wiring, or schema contracts
+- the user is asking for a tooling, IDE, plugin, shell, or environment migration rather than a model and prompt migration
+- the integration depends on provider-specific APIs that do not map to the current OpenAI API surface without implementation work
+- you cannot confidently identify the prompt surface tied to the model usage
+
+Default action:
+
+- do not improvise a broader upgrade
+- report the blocker and explain that the fix is out of scope for this guide
+- if useful, describe the smallest follow-up implementation task that would unblock the migration
+
+## Compatibility checklist
+
+Before applying or recommending a model-and-prompt-only upgrade, check:
+
+1. Can the current host accept the `gpt-5.5` model string without changing client code or API surface?
+2. Are the related prompts identifiable and editable?
+3. Does the host depend on behavior that likely needs API-surface changes, parameter rewrites, provider migration, or tool rewiring?
+4. Would the likely fix be prompt-only, or would it need implementation changes?
+5. Is the prompt surface close enough to the model usage that you can make a targeted change instead of a broad cleanup?
+6. Do strict structured outputs, schemas, or downstream parsers still have an explicit contract?
+7. For long-running Responses or tool-heavy agents, is `phase` already preserved if the host relies on preambles, replayed assistant items, or multiple assistant messages?
+8. Are latency, token, or price assumptions validated by tests, realistic spot checks, or an existing eval suite rather than inferred from general model positioning?
+
+If item 1 is no, item 3 or item 4 points to implementation work, or item 7 is no and the fix needs code changes, return `blocked`.
+
+If item 2 is no, return `unknown` unless the user can point to the prompt location.
+
+Important:
+
+- Existing use of tools, agents, or multiple usage sites is not by itself a blocker.
+- If the current host can keep the same API surface and the same tool definitions, prefer `model string + light prompt rewrite` over `blocked`.
+- Reserve `blocked` for cases that truly require implementation changes, not cases that only need stronger prompt steering.
+- Do not claim token savings without task-level validation.
+
+## Scope boundaries
+
+This guide may:
+
+- update or recommend updated model strings
+- update or recommend updated prompts
+- inspect code and prompt files to understand where those changes belong
+- inspect whether existing Responses flows already preserve `phase`
+- flag compatibility blockers
+- propose validation with existing tests, realistic spot checks, or existing eval suites
+
+This guide may not:
+
+- move Chat Completions code to Responses
+- move Responses code to another API surface
+- migrate SDKs, APIs, IDE configuration, shell hooks, plugins, or provider-specific tooling
+- rewrite parameter shapes
+- change tool definitions or tool-call handling
+- change structured-output wiring
+- add or retrofit `phase` handling in implementation code
+- edit business logic, orchestration logic, SDK usage, IDE configuration, shell hooks, or plugin integration behavior except for model-string replacements and directly related prompt edits
+
+If a safe GPT-5.5 upgrade requires any of those changes, mark the path as blocked and out of scope.
+
+## Validation plan
+
+- Validate each upgraded usage site with existing tests, realistic spot checks, or an existing eval suite when one is already available.
+- Compare against the current GPT-5.4 baseline when available.
+- Check task success, retry count, tool-call count, total tokens, latency, output shape, and user-visible quality.
+- For specialized workflows, validate the contract that matters most instead of judging only general output quality.
+- If prompt edits were added, confirm each block is doing real work instead of adding noise.
+- If the workflow has downstream impact, add a lightweight verification pass before finalization.
diff --git a/skills/openai-docs/scripts/fetch-codex-manual.mjs b/skills/openai-docs/scripts/fetch-codex-manual.mjs
new file mode 100644
index 0000000..b260552
--- /dev/null
+++ b/skills/openai-docs/scripts/fetch-codex-manual.mjs
@@ -0,0 +1,598 @@
+#!/usr/bin/env node
+import {
+  access,
+  mkdir,
+  readFile,
+  rename,
+  rm,
+  stat,
+  writeFile,
+} from "node:fs/promises";
+import { constants as fsConstants } from "node:fs";
+import { execFile } from "node:child_process";
+import { createHash } from "node:crypto";
+import path from "node:path";
+import process from "node:process";
+import { pathToFileURL } from "node:url";
+import { inspect, promisify } from "node:util";
+
+const DEFAULT_MANUAL_URL = "https://developers.openai.com/codex/codex-manual.md";
+const DEFAULT_CACHE_DIR_NAME = "openai-docs-cache";
+const CACHE_FILE_NAME = "codex-manual.md";
+const OUTLINE_FILE_NAME = "codex-manual.outline.md";
+const HASH_HEADER = "x-content-sha256";
+const USER_AGENT = "codex-openai-docs";
+const execFileAsync = promisify(execFile);
+
+class ManualFetchError extends Error {
+  constructor(message, options) {
+    super(message, options);
+    this.name = "ManualFetchError";
+  }
+}
+
+const sha256 = (value) => createHash("sha256").update(value).digest("hex");
+
+const withTimeout = async (promiseFactory, timeoutMs) => {
+  const controller = new AbortController();
+  const timeout = setTimeout(() => controller.abort(), timeoutMs);
+  try {
+    return await promiseFactory(controller.signal);
+  } finally {
+    clearTimeout(timeout);
+  }
+};
+
+const proxyConfigured = () =>
+  process.env.HTTP_PROXY ||
+  process.env.HTTPS_PROXY ||
+  process.env.http_proxy ||
+  process.env.https_proxy;
+
+const responseHeaders = (headers) => ({
+  get(name) {
+    return headers.get(name.toLowerCase()) ?? null;
+  },
+});
+
+const makeResponse = ({ body, headers, status }) => ({
+  headers: responseHeaders(headers),
+  ok: status >= 200 && status < 300,
+  status,
+  async text() {
+    return body;
+  },
+});
+
+const parseCurlHeaders = (rawHeaders) => {
+  const normalized = rawHeaders.replace(/\r\n/g, "\n").trim();
+  const blocks = normalized.split(/\n\n+/).filter(Boolean);
+  const headerBlock = [...blocks]
+    .reverse()
+    .find((block) => block.startsWith("HTTP/"));
+
+  if (!headerBlock) {
+    throw new ManualFetchError("curl did not return HTTP response headers.");
+  }
+
+  const [statusLine, ...lines] = headerBlock.split("\n");
+  const statusMatch = /^HTTP\/\S+\s+(\d{3})/.exec(statusLine);
+  if (!statusMatch) {
+    throw new ManualFetchError(
+      `Could not parse HTTP status from curl response: ${statusLine}`
+    );
+  }
+
+  const headers = new Map();
+  lines.forEach((line) => {
+    const separator = line.indexOf(":");
+    if (separator === -1) return;
+    const name = line.slice(0, separator).trim().toLowerCase();
+    const value = line.slice(separator + 1).trim();
+    headers.set(name, value);
+  });
+
+  return {
+    headers,
+    status: Number(statusMatch[1]),
+  };
+};
+
+const tempFilePath = (cacheDir, suffix) =>
+  path.join(
+    cacheDir,
+    `.fetch-codex-manual-${process.pid}-${Date.now()}-${Math.random()
+      .toString(16)
+      .slice(2)}${suffix}`
+  );
+
+const requestManualWithCurl = async (url, { cacheDir, method, timeoutMs }) => { // curl-based transport
+  const headerPath = tempFilePath(cacheDir, ".headers"); // scratch file for --dump-header
+  const bodyPath = tempFilePath(cacheDir, ".body"); // scratch file for --output
+  const curlNames =
+    process.platform === "win32" ? ["curl.exe", "curl"] : ["curl"];
+  const args = [
+    "--silent",
+    "--show-error",
+    "--location",
+    "--dump-header",
+    headerPath,
+    "--output",
+    bodyPath,
+    "--user-agent",
+    USER_AGENT,
+    "--max-time",
+    String(Math.max(1, Math.ceil(timeoutMs / 1000))), // whole seconds, rounded up, at least 1
+  ];
+  // HEAD uses curl's dedicated --head flag; every other method goes through --request.
+  if (method === "HEAD") {
+    args.push("--head");
+  } else {
+    args.push("--request", method);
+  }
+  args.push(url);
+  // Try each candidate name; an ENOENT error moves on to the next, any other error stops the loop.
+  let lastError;
+  for (const curlName of curlNames) {
+    try {
+      await execFileAsync(curlName, args, { windowsHide: true });
+      const [rawHeaders, body] = await Promise.all([
+        readFile(headerPath, "utf8"),
+        readFile(bodyPath, "utf8"),
+      ]);
+      const { headers, status } = parseCurlHeaders(rawHeaders);
+      return makeResponse({ body, headers, status });
+    } catch (error) {
+      lastError = error;
+      // NOTE(review): an ENOENT from readFile would also match here and later be reported as curl missing - confirm.
+      if (error?.code !== "ENOENT") break;
+    } finally {
+      await Promise.all([ // scratch files are removed after every attempt, success or failure
+        rm(headerPath, { force: true }),
+        rm(bodyPath, { force: true }),
+      ]);
+    }
+  }
+  // A final ENOENT is reported as curl being unavailable; anything else as a generic fetch failure.
+  if (lastError?.code === "ENOENT") {
+    throw new ManualFetchError("curl is unavailable in this environment.", {
+      cause: lastError,
+    });
+  }
+  throw new ManualFetchError(`${method} ${url} could not be fetched.`, {
+    cause: lastError,
+  });
+};
+
+const requestManualWithFetch = async (url, { method, timeoutMs }) => {
+  if (typeof fetch !== "function") {
+    throw new ManualFetchError(
+      "Native fetch is unavailable in this Node runtime."
+    );
+  }
+
+  return withTimeout(
+    (signal) =>
+      fetch(url, {
+        method,
+        headers: { "User-Agent": USER_AGENT },
+        signal,
+      }),
+    timeoutMs
+  );
+};
+
+const requestManual = async (url, { cacheDir, method, timeoutMs }) => {
+  const preferCurl = Boolean(proxyConfigured()) || typeof fetch !== "function";
+  const transports = preferCurl
+    ? [
+        () => requestManualWithCurl(url, { cacheDir, method, timeoutMs }),
+        () => requestManualWithFetch(url, { method, timeoutMs }),
+      ]
+    : [
+        () => requestManualWithFetch(url, { method, timeoutMs }),
+        () => requestManualWithCurl(url, { cacheDir, method, timeoutMs }),
+      ];
+
+  let lastError;
+  for (const transport of transports) {
+    try {
+      const response = await transport();
+      if (!response.ok) {
+        throw new ManualFetchError(
+          `${method} ${url} failed with HTTP ${response.status}.`
+        );
+      }
+      return response;
+    } catch (error) {
+      lastError = error;
+    }
+  }
+
+  throw new ManualFetchError(`${method} ${url} could not be fetched.`, {
+    cause: lastError,
+  });
+};
+
+const readHeaderSha = (response) => {
+  const value = response.headers.get(HASH_HEADER);
+  if (!value || !/^[a-f0-9]{64}$/i.test(value)) {
+    throw new ManualFetchError(`Manual response is missing ${HASH_HEADER}.`);
+  }
+  return value.toLowerCase();
+};
+
+const nearestExistingParent = async (target) => {
+  let current = target;
+  while (true) {
+    try {
+      const info = await stat(current);
+      return info.isDirectory() ? current : null;
+    } catch (error) {
+      if (error?.code !== "ENOENT") return null;
+    }
+
+    const parent = path.dirname(current);
+    if (parent === current) return null;
+    current = parent;
+  }
+};
+
+const usableCacheDir = async (cacheDir) => {
+  if (!cacheDir) return null;
+  const resolved = path.resolve(cacheDir);
+
+  try {
+    const info = await stat(resolved);
+    if (!info.isDirectory()) return null;
+  } catch (error) {
+    if (error?.code !== "ENOENT") return null;
+  }
+
+  const parent = await nearestExistingParent(resolved);
+  if (!parent) return null;
+
+  try {
+    await access(parent, fsConstants.W_OK | fsConstants.X_OK);
+  } catch {
+    return null;
+  }
+
+  return resolved;
+};
+
+const defaultCacheDirCandidates = () => {
+  const candidates = [];
+  const seen = new Set();
+  const pushCandidate = (candidate) => {
+    if (!candidate || seen.has(candidate)) return;
+    seen.add(candidate);
+    candidates.push(candidate);
+  };
+
+  [process.env.TMPDIR, process.env.TEMP, process.env.TMP].forEach((baseDir) => {
+    if (baseDir) {
+      pushCandidate(path.join(baseDir, DEFAULT_CACHE_DIR_NAME));
+    }
+  });
+
+  if (process.platform !== "win32") {
+    pushCandidate(`/private/tmp/${DEFAULT_CACHE_DIR_NAME}`);
+    pushCandidate(`/tmp/${DEFAULT_CACHE_DIR_NAME}`);
+  }
+
+  return candidates;
+};
+
+const resolveCacheDir = async (cacheDir) => {
+  if (cacheDir) {
+    return usableCacheDir(cacheDir);
+  }
+
+  for (const candidate of defaultCacheDirCandidates()) {
+    const usable = await usableCacheDir(candidate);
+    if (usable) return usable;
+  }
+
+  return null;
+};
+
+const cacheFilePath = (cacheDir) => path.join(cacheDir, CACHE_FILE_NAME);
+
+const outlineFilePath = (cacheDir) => path.join(cacheDir, OUTLINE_FILE_NAME);
+
+const manualLines = (manual) => {
+  const lines = manual.replace(/\r\n/g, "\n").split("\n");
+  if (lines[lines.length - 1] === "") lines.pop();
+  return lines;
+};
+
+const sectionTitle = (rawTitle) => // strips a closing "#" run, then collapses whitespace: "A   B ##" -> "A B"
+  rawTitle.replace(/\s+#+\s*$/, "").replace(/\s+/g, " ").trim();
+
+const buildOutline = (manual) => {
+  const lines = manualLines(manual);
+  const headings = [];
+  let inFence = false;
+
+  lines.forEach((line, index) => {
+    if (/^\s*(```|~~~)/.test(line)) {
+      inFence = !inFence;
+      return;
+    }
+    if (inFence) return;
+
+    const match = /^(#{1,6})\s+(.+?)\s*$/.exec(line);
+    if (!match) return;
+
+    const level = match[1].length;
+    if (level < 2 || level > 3) return;
+
+    headings.push({
+      level,
+      title: sectionTitle(match[2]),
+      startLine: index + 1,
+      endLine: lines.length,
+    });
+  });
+
+  for (let index = 0; index < headings.length; index += 1) {
+    const heading = headings[index];
+    const nextPeer = headings
+      .slice(index + 1)
+      .find((candidate) => candidate.level <= heading.level);
+    if (nextPeer) {
+      heading.endLine = nextPeer.startLine - 1;
+    }
+  }
+
+  if (headings.length === 0) {
+    return {
+      headingCount: 0,
+      lineCount: lines.length,
+      text: "No markdown headings found.",
+    };
+  }
+
+  const minLevel = Math.min(...headings.map((heading) => heading.level));
+  return {
+    headingCount: headings.length,
+    lineCount: lines.length,
+    text: headings
+      .map((heading) => {
+        const indent = "  ".repeat(heading.level - minLevel);
+        return `${indent}- ${heading.title} (lines ${heading.startLine}-${heading.endLine})`;
+      })
+      .join("\n"),
+  };
+};
+
+const outlineMarkdown = (outline) => `# Codex Manual Outline\n\n${outline.text}\n`;
+
+const manualStatusLine = (status) =>
+  status.cacheStatus === "hit"
+    ? "Manual status: local manual was already current."
+    : "Manual status: local manual was updated.";
+
+const formatResult = ({ status, outlineText }) =>
+  [
+    `Manual path: ${status.manualPath}`,
+    `Outline path: ${status.outlinePath}`,
+    manualStatusLine(status),
+    "",
+    outlineText,
+  ].join("\n");
+
+const readCachedManual = async (cacheDir, expectedSha256) => {
+  try {
+    const manual = await readFile(cacheFilePath(cacheDir), "utf8");
+    return sha256(manual) === expectedSha256 ? manual : null;
+  } catch {
+    return null;
+  }
+};
+
+const writeCachedManual = async (cacheDir, manual) => {
+  await mkdir(cacheDir, { recursive: true });
+  const tmpPath = tempFilePath(cacheDir, `.${CACHE_FILE_NAME}.tmp`);
+  await writeFile(tmpPath, manual, "utf8");
+  await rename(tmpPath, cacheFilePath(cacheDir));
+};
+
+const writeOutline = async (cacheDir, outlineText) => {
+  await mkdir(cacheDir, { recursive: true });
+  const tmpPath = tempFilePath(cacheDir, `.${OUTLINE_FILE_NAME}.tmp`);
+  await writeFile(tmpPath, outlineText, "utf8");
+  await rename(tmpPath, outlineFilePath(cacheDir));
+};
+
+const fetchCodexManual = async ({
+  manualUrl = DEFAULT_MANUAL_URL,
+  cacheDir,
+  timeoutMs = 30000,
+} = {}) => {
+  const resolvedCacheDir = await resolveCacheDir(cacheDir);
+  if (!resolvedCacheDir) {
+    throw new ManualFetchError(
+      "Manual cache directory is unavailable; pass --cache-dir to override or use OpenAI Docs MCP fallback."
+    );
+  }
+  await mkdir(resolvedCacheDir, { recursive: true });
+
+  const headResponse = await requestManual(manualUrl, {
+    cacheDir: resolvedCacheDir,
+    method: "HEAD",
+    timeoutMs,
+  });
+  const expectedSha256 = readHeaderSha(headResponse);
+  const manualPath = cacheFilePath(resolvedCacheDir);
+  const outlinePath = outlineFilePath(resolvedCacheDir);
+  const checkedAt = new Date().toISOString();
+
+  const cachedManual = await readCachedManual(resolvedCacheDir, expectedSha256);
+  if (cachedManual !== null) {
+    const outline = buildOutline(cachedManual);
+    const outlineText = outlineMarkdown(outline);
+    await writeOutline(resolvedCacheDir, outlineText);
+
+    return {
+      outlineText,
+      status: {
+        manualUrl,
+        headerSha256: expectedSha256,
+        fetchedManualSha256: expectedSha256,
+        manualHashMatches: true,
+        cacheStatus: "hit",
+        cacheDir: resolvedCacheDir,
+        manualPath,
+        outlinePath,
+        checkedAt,
+        lineCount: outline.lineCount,
+        headingCount: outline.headingCount,
+      },
+    };
+  }
+
+  const getResponse = await requestManual(manualUrl, {
+    cacheDir: resolvedCacheDir,
+    method: "GET",
+    timeoutMs,
+  });
+  const getHeaderSha256 = readHeaderSha(getResponse);
+  if (getHeaderSha256 !== expectedSha256) {
+    throw new ManualFetchError(
+      `${HASH_HEADER} changed between HEAD and GET for ${manualUrl}.`
+    );
+  }
+
+  const manualText = await getResponse.text();
+  const actualSha256 = sha256(manualText);
+  const manualHashMatches = actualSha256 === expectedSha256;
+  if (!manualHashMatches) {
+    throw new ManualFetchError(
+      `${HASH_HEADER} did not match the fetched manual body for ${manualUrl}.`
+    );
+  }
+
+  await writeCachedManual(resolvedCacheDir, manualText);
+  const outline = buildOutline(manualText);
+  const outlineText = outlineMarkdown(outline);
+  await writeOutline(resolvedCacheDir, outlineText);
+
+  return {
+    outlineText,
+    status: {
+      manualUrl,
+      headerSha256: expectedSha256,
+      fetchedManualSha256: actualSha256,
+      manualHashMatches,
+      cacheStatus: "updated",
+      cacheDir: resolvedCacheDir,
+      manualPath,
+      outlinePath,
+      checkedAt,
+      lineCount: outline.lineCount,
+      headingCount: outline.headingCount,
+    },
+  };
+};
+
+const parseArgs = (argv) => {
+  const args = {
+    manualUrl: DEFAULT_MANUAL_URL,
+    cacheDir: undefined,
+    timeoutMs: 30000,
+    statusJson: false,
+  };
+
+  for (let index = 0; index < argv.length; index += 1) {
+    const arg = argv[index];
+    if (arg === "--manual-url") {
+      args.manualUrl = argv[++index];
+    } else if (arg === "--cache-dir") {
+      args.cacheDir = argv[++index];
+    } else if (arg === "--timeout-ms") {
+      args.timeoutMs = Number(argv[++index]);
+    } else if (arg === "--status-json") {
+      args.statusJson = true;
+    } else {
+      throw new ManualFetchError(`Unknown argument: ${arg}`);
+    }
+  }
+
+  if (!args.manualUrl) {
+    throw new ManualFetchError("--manual-url cannot be empty.");
+  }
+  if (!Number.isFinite(args.timeoutMs) || args.timeoutMs <= 0) {
+    throw new ManualFetchError("--timeout-ms must be a positive number.");
+  }
+
+  return args;
+};
+
+const main = async () => {
+  const args = parseArgs(process.argv.slice(2));
+  const { outlineText, status } = await fetchCodexManual(args);
+
+  process.stdout.write(formatResult({ status, outlineText }));
+
+  if (args.statusJson) {
+    console.error(JSON.stringify(status));
+  }
+};
+
+const envProxyHint = () => {
+  if (proxyConfigured()) {
+    return "Hint: proxy env vars are present. This helper prefers `curl` in proxied sessions; if requests still fail, verify `curl` is installed and the proxy configuration is valid.";
+  }
+  if (typeof fetch !== "function") {
+    return "Hint: native fetch is unavailable in this Node runtime. Install `curl` or use a newer Node version to fetch the manual.";
+  }
+  if (process.platform === "win32") {
+    return "Hint: on Windows, pass a cache dir under `%TEMP%` or `%TMP%`.";
+  }
+  return null;
+};
+
+// Renders `error` with util.inspect (no colours, depth 8). When the error has a
+// truthy `cause`, the cause is rendered with the same options and appended
+// under a "Cause:" heading.
+const formatErrorDetails = (error) => {
+  const render = (value) =>
+    inspect(value, {
+      breakLength: 120,
+      colors: false,
+      compact: false,
+      depth: 8,
+    });
+
+  const details = render(error);
+  if (!error?.cause) {
+    return details;
+  }
+  return `${details}\n\nCause:\n${render(error.cause)}`;
+};
+
+const isCliEntrypoint = () => {
+  const entrypoint = process.argv[1];
+  if (!entrypoint) {
+    return false;
+  }
+
+  return pathToFileURL(entrypoint).href === import.meta.url;
+};
+
+if (isCliEntrypoint()) {
+  main().catch((error) => {
+    console.error(`Error: ${error.message}`);
+    const hint = envProxyHint();
+    if (hint) {
+      console.error(hint);
+    }
+    console.error("");
+    console.error("Details:");
+    console.error(formatErrorDetails(error));
+    process.exitCode = 1;
+  });
+}
+
+export { DEFAULT_MANUAL_URL, fetchCodexManual };
diff --git a/skills/openai-docs/scripts/resolve-latest-model-info.js b/skills/openai-docs/scripts/resolve-latest-model-info.js
new file mode 100644
index 0000000..1bd16ac
--- /dev/null
+++ b/skills/openai-docs/scripts/resolve-latest-model-info.js
@@ -0,0 +1,147 @@
+#!/usr/bin/env node
+
+const fs = require("node:fs/promises");
+const path = require("node:path");
+
+const DEFAULT_URL =
+  "https://developers.openai.com/api/docs/guides/latest-model.md";
+const DEFAULT_BASE_URL = "https://developers.openai.com";
+
+function parseArgs(argv) {
+  const args = {
+    source: process.env.LATEST_MODEL_URL || DEFAULT_URL,
+    baseUrl: process.env.LATEST_MODEL_BASE_URL || DEFAULT_BASE_URL,
+  };
+
+  for (let i = 2; i < argv.length; i += 1) {
+    const arg = argv[i];
+    if (arg === "--source" || arg === "--url") {
+      args.source = argv[i + 1];
+      i += 1;
+    } else if (arg === "--base-url") {
+      args.baseUrl = argv[i + 1];
+      i += 1;
+    }
+  }
+
+  return args;
+}
+
+async function readSource(source) {
+  if (source.startsWith("file://")) {
+    return fs.readFile(new URL(source), "utf8");
+  }
+
+  if (!/^https?:\/\//.test(source)) {
+    return fs.readFile(path.resolve(source), "utf8");
+  }
+
+  const response = await fetch(source, {
+    headers: { accept: "text/markdown,text/plain,*/*" },
+  });
+
+  if (!response.ok) {
+    throw new Error(`failed to fetch ${source}: ${response.status}`);
+  }
+
+  return response.text();
+}
+
+function parseIndentedInfo(lines, startIndex) {
+  const info = {};
+
+  for (let i = startIndex + 1; i < lines.length; i += 1) {
+    const line = lines[i];
+    if (!line.trim()) {
+      continue;
+    }
+
+    const match = line.match(/^ {2}([A-Za-z][A-Za-z0-9_-]*):\s*(.+?)\s*$/);
+    if (!match) {
+      break;
+    }
+
+    info[match[1]] = match[2].replace(/^["']|["']$/g, "");
+  }
+
+  return info;
+}
+
+function parseFlatInfo(block) {
+  const info = {};
+
+  for (const line of block.split(/\r?\n/)) {
+    const match = line.match(/^\s*([A-Za-z][A-Za-z0-9_-]*):\s*(.+?)\s*$/);
+    if (match) {
+      info[match[1]] = match[2].replace(/^["']|["']$/g, "");
+    }
+  }
+
+  return info;
+}
+
+function extractLatestModelInfo(markdown) {
+  const lines = markdown.split(/\r?\n/);
+  const latestModelInfoIndex = lines.findIndex((line) =>
+    /^latestModelInfo:\s*$/.test(line)
+  );
+
+  if (latestModelInfoIndex >= 0) {
+    return parseIndentedInfo(lines, latestModelInfoIndex);
+  }
+
+  const commentMatch = markdown.match(
+    /<!--\s*latestModelInfo\s*\n([\s\S]*?)\n\s*-->/m
+  );
+  if (commentMatch) {
+    return parseFlatInfo(commentMatch[1]);
+  }
+
+  return undefined;
+}
+
+function modelToSkillSlug(model) {
+  return model.trim().replace(/\./g, "p");
+}
+
+function absoluteUrl(baseUrl, value) {
+  return new URL(value, baseUrl).toString();
+}
+
+function normalizeInfo(info, baseUrl) {
+  const model = info?.model?.trim();
+  const migrationGuide = info?.migrationGuide?.trim();
+  const promptingGuide = info?.promptingGuide?.trim();
+
+  if (!model || !migrationGuide || !promptingGuide) {
+    throw new Error(
+      "latestModelInfo must include model, migrationGuide, and promptingGuide"
+    );
+  }
+
+  return {
+    model,
+    modelSlug: modelToSkillSlug(model),
+    migrationGuideUrl: absoluteUrl(baseUrl, migrationGuide),
+    promptingGuideUrl: absoluteUrl(baseUrl, promptingGuide),
+  };
+}
+
+async function main() {
+  const { source, baseUrl } = parseArgs(process.argv);
+  const markdown = await readSource(source);
+  const info = extractLatestModelInfo(markdown);
+
+  if (!info) {
+    throw new Error(`latestModelInfo block not found in ${source}`);
+  }
+
+  process.stdout.write(
+    `${JSON.stringify(normalizeInfo(info, baseUrl), null, 2)}\n`
+  );
+}
+
+main().catch((error) => {
+  console.error(error.message); // only the message is printed, not the stack
+  process.exit(1); // exit with status 1 on any failure
+});
diff --git a/skills/plugin-creator/SKILL.md b/skills/plugin-creator/SKILL.md
new file mode 100644
index 0000000..af960ec
--- /dev/null
+++ b/skills/plugin-creator/SKILL.md
@@ -0,0 +1,243 @@
+---
+name: plugin-creator
+description: Create and scaffold plugin directories for Codex with a required `.codex-plugin/plugin.json`, optional plugin folders/files, valid manifest defaults, and personal-marketplace entries by default. Use when Codex needs to create a new personal plugin, add optional plugin structure, generate or update marketplace entries for plugin ordering and availability metadata, or update an existing local plugin during development with the CLI-driven cachebuster and reinstall flow.
+---
+
+# Plugin Creator
+
+## Quick Start
+
+1. Run the scaffold script:
+
+```bash
+# Plugin names are normalized to lower-case hyphen-case and must be <= 64 chars.
+# The generated folder and plugin.json name are always the same.
+# Run from the skill root (the directory containing this `SKILL.md`).
+# By default creates in `~/plugins/<plugin-name>`.
+python3 scripts/create_basic_plugin.py <plugin-name>
+```
+
+2. Edit `<plugin-path>/.codex-plugin/plugin.json` when the request gives specific metadata.
+   The scaffold starts with valid defaults and must not contain `[TODO: ...]` placeholders.
+
+3. Generate or update the personal marketplace entry when the plugin should appear in Codex UI ordering:
+
+```bash
+# Personal marketplace entries default to `~/.agents/plugins/marketplace.json`.
+python3 scripts/create_basic_plugin.py my-plugin --with-marketplace
+```
+
+Only specify `--marketplace-name <name>` when the default `personal` marketplace name is already
+taken or installed and you need to seed a different new marketplace file:
+
+```bash
+python3 scripts/create_basic_plugin.py my-plugin \
+  --with-marketplace \
+  --marketplace-name team-local
+```
+
+Only use a repo/team marketplace when the user specifically asks for that destination:
+
+```bash
+python3 scripts/create_basic_plugin.py my-plugin \
+  --path <repo-root>/plugins \
+  --marketplace-path <repo-root>/.agents/plugins/marketplace.json \
+  --with-marketplace
+```
+
+When the user specifies a marketplace path, make sure that marketplace is actually installed before
+telling the user to reinstall from it. The default personal marketplace file at
+`~/.agents/plugins/marketplace.json` is discovered implicitly, but other marketplace paths are not.
+On Windows, use the equivalent path under the user profile.
+
+4. Generate/adjust optional companion folders as needed:
+
+```bash
+python3 scripts/create_basic_plugin.py my-plugin \
+  --path <parent-plugin-directory> \
+  --marketplace-path <marketplace-json-path> \
+  --with-skills --with-hooks --with-scripts --with-assets --with-mcp --with-apps --with-marketplace
+```
+
+`<parent-plugin-directory>` is the directory where the plugin folder `<plugin-name>` will be
+created (for example `~/plugins`).
+
+5. Before handing back a generated plugin, run:
+
+```bash
+python3 scripts/validate_plugin.py <plugin-path>
+```
+
+For updates to an existing local plugin during development, keep the scaffold flow as-is and run the
+cachebuster helper instead of hand-editing marketplace files:
+
+```bash
+python3 scripts/update_plugin_cachebuster.py <plugin-path>
+```
+
+Prefer the helper default cachebuster unless the user explicitly asks for a specific override.
+See `references/installing-and-updating.md` for the expected cachebuster and reinstall flow while iterating on an existing local plugin.
+
+## What this skill creates
+
+- Default marketplace-backed scaffolds use the personal marketplace file at
+  `~/.agents/plugins/marketplace.json`, with plugins generally being stored in
+  `~/plugins/<plugin-name>/`.
+- Creates plugin root at `<parent-plugin-directory>/<plugin-name>/`.
+- Always creates `<parent-plugin-directory>/<plugin-name>/.codex-plugin/plugin.json`.
+- Fills the manifest with the validated schema shape that the ingestion path accepts.
+- Creates or updates `~/.agents/plugins/marketplace.json` when `--with-marketplace` is set.
+  - If the marketplace file does not exist yet, seed a personal marketplace root before adding the first plugin entry.
+- `<plugin-name>` is normalized using skill-creator naming rules:
+  - `My Plugin` → `my-plugin`
+  - `My--Plugin` → `my-plugin`
+  - underscores, spaces, and punctuation are converted to `-`
+  - result is lower-case hyphen-delimited with consecutive hyphens collapsed
+- Supports optional creation of:
+  - `skills/`
+  - `hooks/`
+  - `scripts/`
+  - `assets/`
+  - `.mcp.json`
+  - `.app.json`
+
+## Marketplace workflow
+
+- Personal-marketplace creation defaults to `~/.agents/plugins/marketplace.json`. Here,
+  "personal marketplace" means the marketplace whose file is at that path.
+- Repo/team marketplace creation is opt-in through both `--path` and `--marketplace-path`, only
+  when the user specifically requests it.
+- `--marketplace-name` is an exception path. Use it only when the default `personal` marketplace
+  name is already taken and you need to seed a different new marketplace file.
+- Do not use `--marketplace-name` to rename an existing marketplace file in place. If the file
+  already exists, its top-level `name` must already match.
+- If the user specifies a different marketplace path, treat that marketplace as needing explicit installation via `codex plugin marketplace add`.
+- Prefer `scripts/read_marketplace_name.py` when you need the marketplace name from any
+  `marketplace.json` file. With no argument it reads the default personal marketplace; with an
+  explicit path it works for repo/team marketplaces too.
+- In either location, the generated source path remains `./plugins/<plugin-name>`.
+- Marketplace root metadata supports top-level `name` plus optional `interface.displayName`.
+- Treat plugin order in `plugins[]` as render order in Codex. Append new entries unless a user explicitly asks to reorder the list.
+- `displayName` belongs inside the marketplace `interface` object, not individual `plugins[]` entries.
+- Each generated marketplace entry must include all of:
+  - `policy.installation`
+  - `policy.authentication`
+  - `category`
+- Default new entries to:
+  - `policy.installation: "AVAILABLE"`
+  - `policy.authentication: "ON_INSTALL"`
+- Override defaults only when the user explicitly specifies another allowed value.
+- Allowed `policy.installation` values:
+  - `NOT_AVAILABLE`
+  - `AVAILABLE`
+  - `INSTALLED_BY_DEFAULT`
+- Allowed `policy.authentication` values:
+  - `ON_INSTALL`
+  - `ON_USE`
+- Treat `policy.products` as an override. Omit it unless the user explicitly requests product gating.
+- The generated plugin entry shape is:
+
+```json
+{
+  "name": "plugin-name",
+  "source": {
+    "source": "local",
+    "path": "./plugins/plugin-name"
+  },
+  "policy": {
+    "installation": "AVAILABLE",
+    "authentication": "ON_INSTALL"
+  },
+  "category": "Productivity"
+}
+```
+
+- Use `--force` only when intentionally replacing an existing marketplace entry for the same plugin name.
+- If the target marketplace file does not exist yet, create it with top-level `"name"`, an `"interface"` object containing `"displayName"`, and a `plugins` array, then add the new entry.
+
+- For a brand-new marketplace file, the root object should look like:
+
+```json
+{
+  "name": "personal",
+  "interface": {
+    "displayName": "Personal"
+  },
+  "plugins": [
+    {
+      "name": "plugin-name",
+      "source": {
+        "source": "local",
+        "path": "./plugins/plugin-name"
+      },
+      "policy": {
+        "installation": "AVAILABLE",
+        "authentication": "ON_INSTALL"
+      },
+      "category": "Productivity"
+    }
+  ]
+}
+```
+
+## Required behavior
+
+- Outer folder name and `plugin.json` `"name"` are always the same normalized plugin name.
+- Do not remove required structure; keep `.codex-plugin/plugin.json` present.
+- Do not leave `[TODO: ...]` placeholders in plugin manifests.
+- Keep `apps` and `mcpServers` out of `plugin.json` unless their companion files are actually created.
+- Omit unsupported plugin manifest fields that validation rejects, including `hooks`.
+- If creating files inside an existing plugin path, use `--force` only when overwrite is intentional.
+- Preserve any existing marketplace `interface.displayName`.
+- When generating marketplace entries, always write `policy.installation`, `policy.authentication`, and `category` even if their values are defaults.
+- Add `policy.products` only when the user explicitly asks for that override.
+- Keep marketplace `source.path` relative to the selected marketplace root as `./plugins/<plugin-name>`.
+- Only use `--marketplace-name` when creating a new marketplace file whose name should not be
+  `personal` because that name is already taken or installed elsewhere.
+- If Codex would need approval to write the marketplace file, ask for that approval before
+  proceeding. If the user prefers to run the write themselves, provide the exact scaffold command
+  and then continue from validation or subsequent plugin edits instead of leaving the workflow
+  vague.
+- For updates to an existing local plugin during development, do not hand-edit marketplace config
+  or `marketplace.json`. Use the update flow documented in
+  `references/installing-and-updating.md` and `scripts/update_plugin_cachebuster.py`.
+- Do not tell the user to run `codex plugin marketplace add` for the default personal-marketplace
+  flow. That command is for explicit non-default marketplace configuration, not for the standard
+  `~/.agents/plugins/marketplace.json` path.
+- If the user provided a non-default `--marketplace-path`, make sure that marketplace is installed
+  before giving reinstall instructions. Use `codex plugin marketplace add <path-to-marketplace-root>`
+  when that explicit marketplace has not been configured yet.
+- When the workflow created or updated a marketplace-backed plugin, end the final user-facing
+  response with a short Codex app handoff. Say `To view this in the Codex app:` and write
+  `View <normalized plugin name>` and `Share <normalized plugin name>` as Markdown links, not raw
+  URLs or code spans.
+- The View deeplink uses `codex://plugins/<normalized plugin name>?marketplacePath=<absolute marketplace.json path>`.
+  The Share deeplink uses the same URL with `&mode=share`.
+- Replace the placeholders with the real normalized plugin name and absolute `marketplace.json`
+  path from the scaffolded plugin. URL-encode the path segment and query value when needed.
+- Do not add `pluginName` or `hostId` query parameters to these deeplinks. Codex derives both after
+  the user clicks the link.
+- Do not emit the `View <normalized plugin name>` or `Share <normalized plugin name>` links when no marketplace entry was
+  created or updated.
+
+## Reference to exact spec sample
+
+For the exact canonical sample JSON for both plugin manifests and marketplace entries, use:
+
+- `references/plugin-json-spec.md`
+- `references/installing-and-updating.md` for update/reinstall guidance while
+  iterating on an existing local plugin, plus the new-thread pickup behavior after reinstall
+
+## Validation
+
+After editing `SKILL.md`, run:
+
+```bash
+python3 ../skill-creator/scripts/quick_validate.py .
+```
+
+Before handing back a generated plugin, run:
+
+```bash
+python3 scripts/validate_plugin.py <plugin-path>
+```
diff --git a/skills/plugin-creator/agents/openai.yaml b/skills/plugin-creator/agents/openai.yaml
new file mode 100644
index 0000000..19a9a6f
--- /dev/null
+++ b/skills/plugin-creator/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "Plugin Creator"
+  short_description: "Scaffold plugins and marketplace entries"
+  default_prompt: "Use $plugin-creator to scaffold a valid plugin in the personal marketplace, then validate it before handing it back."
+  icon_small: "./assets/plugin-creator-small.svg"
+  icon_large: "./assets/plugin-creator.png"
diff --git a/skills/plugin-creator/assets/plugin-creator-small.svg b/skills/plugin-creator/assets/plugin-creator-small.svg
new file mode 100644
index 0000000..c6e4f67
--- /dev/null
+++ b/skills/plugin-creator/assets/plugin-creator-small.svg
@@ -0,0 +1,3 @@
+<svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" fill="currentColor" viewBox="0 0 20 20">
+  <path fill="#0D0D0D" d="M12.03 4.113a3.612 3.612 0 0 1 5.108 5.108l-6.292 6.29c-.324.324-.56.561-.791.752l-.235.176c-.205.14-.422.261-.65.36l-.229.093a4.136 4.136 0 0 1-.586.16l-.764.134-2.394.4c-.142.024-.294.05-.423.06-.098.007-.232.01-.378-.026l-.149-.05a1.081 1.081 0 0 1-.521-.474l-.046-.093a1.104 1.104 0 0 1-.075-.527c.01-.129.035-.28.06-.422l.398-2.394c.1-.602.162-.987.295-1.35l.093-.23c.1-.228.22-.445.36-.65l.176-.235c.19-.232.428-.467.751-.79l6.292-6.292Zm-5.35 7.232c-.35.35-.534.535-.66.688l-.11.147a2.67 2.67 0 0 0-.24.433l-.062.154c-.08.22-.124.462-.232 1.112l-.398 2.394-.001.001h.003l2.393-.399.717-.126a2.63 2.63 0 0 0 .394-.105l.154-.063a2.65 2.65 0 0 0 .433-.24l.147-.11c.153-.126.339-.31.688-.66l4.988-4.988-3.227-3.226-4.987 4.988Zm9.517-6.291a2.281 2.281 0 0 0-3.225 0l-.364.362 3.226 3.227.363-.364c.89-.89.89-2.334 0-3.225ZM4.583 1.783a.3.3 0 0 1 .294.241c.117.585.347 1.092.707 1.48.357.385.859.668 1.549.783a.3.3 0 0 1 0 .592c-.69.115-1.192.398-1.549.783-.315.34-.53.77-.657 1.265l-.05.215a.3.3 0 0 1-.588 0c-.117-.585-.347-1.092-.707-1.48-.357-.384-.859-.668-1.549-.783a.3.3 0 0 1 0-.592c.69-.115 1.192-.398 1.549-.783.36-.388.59-.895.707-1.48l.015-.05a.3.3 0 0 1 .279-.19Z"/>
+</svg>
diff --git a/skills/plugin-creator/assets/plugin-creator.png b/skills/plugin-creator/assets/plugin-creator.png
new file mode 100644
index 0000000000000000000000000000000000000000..4f3d6d82fa78fbdce97af3c17f6a25c683aa3290
GIT binary patch
literal 1563
zcmV+$2ITpPP)<h;3K|Lk000e1NJLTq003kF003kN1^@s6aN?Cz00009a7bBm000XU
z000XU0RWnu7ytkO0drDELIAGL9O(c600d`2O+f$vv5yP<VFdsH1+Ym(K~#7F?cH5#
z99100@!y%5ZPPYs)~0PjXk@GQA{H?sLh4NusZb$>1#i4F!Dtb@FnH%p6OalPi4TDy
zMcTdqNqhk%K`*Qbx>_X{K4hvjHd<=hH0fq{Gsiib9J_g*IrFfyGygA?&1Rp<e)!Lv
z&F&-sMNt$*Q4~c{6h%=KMNyPO4AlSe^Y3O*N_Bv<bom=~{{V|kChCnG>l>Iw2qhkb
ze|)YB#{A1DHe~H{=}oVwFPPA*37~O^y*^+fpb`thKY1$)zGE1LrVQMsu}jdkKwuIF
z!Y>Y|aer<UrQKcdlAZ^Q{2)91&JcVoQ6T*Ma0W$d-2N&9zp9%V!;uSptb5j%eT;^L
z6bObW-<-wIr$^yai2w-<LzX|##Yf)12p@_)$mHZ?=J%(Mjaw-rgCMhbFaPM=oA6ky
z_aOp9(=>ZBkl8tR2W{Vc1+7>_fXyPMKjmfh7264^#1Q8f8yfM)Gsj@1QV6g#maH@I
zP%I~8Ek<RbOv;k}5F1c?Wgoi<*$P7x%A{x|<$X!4K(@n>1&*Sz<4`O%n=C#xm?`ka
z@f*eCnG*Imx=o;)FU8GPEG9%?fE(jGa4*wlOu)drquT{LDa8yFs(BEJAz$>R*gPVE
zqU#+{sHQ>IV#p$cqEO9(Y=$ALItt^-S@v#+A*(J*LO`5i$f|}?GICI;ra;_c$ihcq
zX6#?7t76DPMwx(OH38xkLlzp!uBppVEb<_JVaNhUVVGdAj!ZzYNQ3x|AuFRSya%H+
z?dbZhQ0jjifQKRr5)?-HzW@Ca#_cg2y7h{`C>$TMzDr80D_JB#g2uq?7v-;0HimyF
z%!H*6!ecrjR#+G^-I_yvejNAeo`a<|Y<nL|JL@pN{{Z&hoCdS3mG9aZOIo+R)V&Fh
zMG7Qr44F3+E-_5_P-H-=g&|WxS=iTPHeUbJHw;lE-k_>BMrB2#6*u;OYX9V;b-SyY
zmSuIfx3`<{v8qo<lrTgNCnXS!^5dh5MGZr?4N71b<;O;qiYkU|6O=$P%8!dG6m<;Q
z8kE2>M4|80YXzgSg7L69b@21RF+`z))FOtR$uxAc?!1W*3JruXoD~WPVK^^v5W;X*
zpdf_dzQ8~TL#;qS2tz&JK?uWJzP@9~zdK179`pAt+{P25gyAjUK={;^Ves}2U?==6
zNf;tu_96V2E4^TR<-qwx`(A%qKJ|LP3BwTiGa(EWhXUIZ!jHo1q$CkT<Qb$q9qaZR
z-cXW?A@V*UtEQteHIyV{h&+Mtsqv1jS5@v%l8zzrHX()S?Dki3hC&$2c>~d#9UdUR
zH40%o$QuZQi$i}mMj?#VDT6HUKah5JtJNrku|D+)DV1De$d*y~ogWBegVa9;v@4x`
z{E^m^dv>Y3)-b^IHelgvz;bpZlf!BnL!=DS*wpgU)oZ_Yc0Tbalu)#Ku-%=0qSQQw
zNPQo|`ICR&zKgd<K7%+_%4h~_Ia@yUSS&C^${>uf@(L>gD6zp1DQ&W{*=*XftU-Bx
z{{AAaUi%GI*nGtbL!>kzrBZ3#>yIi-O6)L1N+5D`wYCsZVu>MA1<7o7SqLbx#Skfh
zh!xgWmj{RvYYdUEo2<$LK#4tu$n`2~?FwtF{91jn{I@yA@4gUs43X;z*=U8eRh}nB
zZ@!E}7h*pdGS?vX=F0UC71dDKEG$029y`&?4tIz02f3n9Xus>kIZ7E~2%2`79eMr(
zBrMmT%M$w#UDy9A6bf}v=-|G+IQzzn<<ph_!YmliS%q8QYkJd|jWB@(r}RO&{{H^K
znVFe0E^lVq|8n+{`TD76Tg=x^9nGP>BbTJjk&~1^x!BXwGidKmHbOD6^2FPh=j>?`
zzdy<x8yll1-a(!|N-8#Aa@A!RhIqp1iKi%vq9}@@D2k#eilV55^dCV<^wOW~YLEZ`
N002ovPDHLkV1k6v&87eV

literal 0
HcmV?d00001

diff --git a/skills/plugin-creator/references/installing-and-updating.md b/skills/plugin-creator/references/installing-and-updating.md
new file mode 100644
index 0000000..28b3b88
--- /dev/null
+++ b/skills/plugin-creator/references/installing-and-updating.md
@@ -0,0 +1,143 @@
+# Updating Existing Local Plugins
+
+Use this reference when a plugin already exists and the request is about updating the plugin during 
+local development.
+
+All scripts here are specified relative to the skill root. Update the path for running the scripts
+depending on your current working directory.
+
+## When To Use This Flow
+
+Use this flow when all of the following are true:
+
+- the plugin already exists locally
+- the marketplace entry already points at the plugin source you are editing
+- the user wants Codex to see the updated plugin without manually editing marketplace files
+
+If the user still needs the initial plugin entry or marketplace structure created, use the scaffold
+flow first and only then switch to this reinstall flow.
+
+## Update Loop
+
+1. Rewrite the plugin manifest version so it carries exactly one Codex cachebuster suffix:
+
+```bash
+python3 scripts/update_plugin_cachebuster.py \
+  <plugin-path>
+```
+
+Prefer the default helper behavior here. If you omit `--cachebuster`, the helper uses a UTC
+timestamp down to seconds, which is the recommended path for routine local iteration.
+
+Only use a manual cachebuster override when the user explicitly asks for one or when a workflow
+outside Codex depends on a specific token:
+
+```bash
+python3 scripts/update_plugin_cachebuster.py \
+  <plugin-path> \
+  --cachebuster local-20260519-184516
+```
+
+2. For the default scaffolded flow, read the marketplace name from the personal marketplace file:
+
+```bash
+python3 scripts/read_marketplace_name.py
+```
+
+Here, "personal marketplace" means the marketplace whose file is at
+`~/.agents/plugins/marketplace.json`. On Windows, use the equivalent path under the user profile.
+The helper uses Python's home-directory resolution and prints the marketplace name to use when
+constructing the install command.
+
+To read the name from a different marketplace file, pass the path directly:
+
+```bash
+python3 scripts/read_marketplace_name.py --marketplace-path <path-to-marketplace.json>
+```
+
+3. Reinstall from that marketplace name:
+
+```bash
+codex plugin add <plugin-name>@<marketplace-name-from-marketplace-json>
+```
+
+The default personal marketplace is discovered implicitly from
+`~/.agents/plugins/marketplace.json`. You do not need `codex plugin marketplace add` for that
+path, and `codex plugin marketplace list` is not the right check for whether that default
+marketplace exists.
+
+4. If the plugin is not using the personal marketplace file, check which configured local
+   marketplace is actually surfacing that plugin:
+
+```bash
+codex plugin list
+```
+
+If the plugin is not in the personal marketplace file, confirm which marketplace entry points at
+the plugin source you are editing and make sure that marketplace is still local. If it is a
+different local marketplace, reinstall from that marketplace name instead of forcing the personal
+marketplace flow. If it is not local, stop and help the user resolve the mismatch before
+continuing.
+
+5. If the plugin lives in a different confirmed local marketplace, substitute that marketplace
+   name:
+
+```bash
+codex plugin add <plugin-name>@<local-marketplace>
+```
+
+6. Prompt the user to use a new thread to try the updated plugin, so that Codex picks up new skills
+   and tools.
+
+## Cachebuster Policy
+
+- Preserve the existing version prefix and replace only the suffix.
+- Treat the preserved prefix as everything before `+`.
+- Use the format:
+
+```text
+<base-version>+codex.<cachebuster>
+```
+
+Examples:
+
+- `0.1.0` → `0.1.0+codex.local-20260519-184516`
+- `0.1.0+codex.old-token` → `0.1.0+codex.local-20260519-184516`
+- `1.2.3-beta.1+codex.prev` → `1.2.3-beta.1+codex.local-20260519-184516`
+- `dev-build+other-tag` → `dev-build+codex.local-20260519-184516`
+
+Replace the existing Codex cachebuster instead of appending another one. Do not keep incrementing
+numeric version components just to trigger reinstall behavior.
+
+## Marketplace Rules
+
+- Marketplace manipulation should happen through commands, not by hand-editing `marketplace.json`
+  or `config.toml` during this update/reinstall flow.
+- Prefer the personal marketplace file for the default scaffolded flow.
+- Read the personal marketplace name with
+  `python3 scripts/read_marketplace_name.py` and use the printed value when constructing
+  `codex plugin add <plugin-name>@<marketplace-name>`.
+- For non-default marketplace files, use
+  `python3 scripts/read_marketplace_name.py --marketplace-path <path-to-marketplace.json>` to read
+  the name before constructing reinstall commands.
+- Do not tell the user to run `codex plugin marketplace add` for the default personal-marketplace
+  flow. That marketplace is discovered implicitly by Codex.
+- If the user specified a different marketplace path, make sure that marketplace is installed
+  before giving install or reinstall instructions. Non-default marketplace paths are not
+  discovered implicitly.
+- Use `codex plugin list` when the plugin lives in a different configured marketplace and you need
+  to confirm which marketplace is surfacing that plugin.
+- If a non-default local marketplace has not been configured yet, install it with
+  `codex plugin marketplace add <path-to-marketplace-root>` before telling the user to run
+  `codex plugin add <plugin-name>@<marketplace-name>`.
+- If the plugin is not in the personal marketplace file, confirm that the selected marketplace is
+  local before telling the user to reinstall from it.
+- If the selected marketplace is not local, stop and help the user resolve that mismatch rather
+  than pretending the normal local reinstall flow applies.
+- If the plugin source is not already the source referenced by the chosen marketplace entry, stop
+  and fix that first. This update flow does not rewrite marketplace entries.
+
+## After Reinstall
+
+After reinstalling, prompt the user to start a new thread for testing. That is the safe boundary for
+picking up the updated plugin and its MCP tools.
diff --git a/skills/plugin-creator/references/plugin-json-spec.md b/skills/plugin-creator/references/plugin-json-spec.md
new file mode 100644
index 0000000..5eb2251
--- /dev/null
+++ b/skills/plugin-creator/references/plugin-json-spec.md
@@ -0,0 +1,194 @@
+# Plugin JSON sample spec
+
+```json
+{
+  "name": "plugin-name",
+  "version": "1.2.0",
+  "description": "Brief plugin description",
+  "author": {
+    "name": "Author Name",
+    "email": "author@example.com",
+    "url": "https://github.com/author"
+  },
+  "homepage": "https://docs.example.com/plugin",
+  "repository": "https://github.com/author/plugin",
+  "license": "MIT",
+  "keywords": ["keyword1", "keyword2"],
+  "skills": "./skills/",
+  "hooks": "./hooks.json",
+  "mcpServers": "./.mcp.json",
+  "apps": "./.app.json",
+  "interface": {
+    "displayName": "Plugin Display Name",
+    "shortDescription": "Short description for subtitle",
+    "longDescription": "Long description for details page",
+    "developerName": "OpenAI",
+    "category": "Productivity",
+    "capabilities": ["Interactive", "Write"],
+    "websiteURL": "https://openai.com/",
+    "privacyPolicyURL": "https://openai.com/policies/row-privacy-policy/",
+    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
+    "defaultPrompt": [
+      "Summarize my inbox and draft replies for me.",
+      "Find open bugs and turn them into Linear tickets.",
+      "Review today's meetings and flag scheduling gaps."
+    ],
+    "brandColor": "#3B82F6",
+    "composerIcon": "./assets/icon.png",
+    "logo": "./assets/logo.png",
+    "screenshots": [
+      "./assets/screenshot1.png",
+      "./assets/screenshot2.png",
+      "./assets/screenshot3.png"
+    ]
+  }
+}
+```
+
+## Field guide
+
+### Top-level fields
+
+- `name` (`string`): Plugin identifier (kebab-case, no spaces). Required if `plugin.json` is provided; it is used as the manifest name and component namespace.
+- `version` (`string`): Plugin semantic version.
+- `description` (`string`): Short purpose summary.
+- `author` (`object`): Publisher identity.
+  - `name` (`string`): Author or team name.
+  - `email` (`string`): Contact email.
+  - `url` (`string`): Author/team homepage or profile URL.
+- `homepage` (`string`): Documentation URL for plugin usage.
+- `repository` (`string`): Source code URL.
+- `license` (`string`): License identifier (for example `MIT`, `Apache-2.0`).
+- `keywords` (`array` of `string`): Search/discovery tags.
+- `skills` (`string`): Relative path to skill directories/files.
+- `hooks` (`string`): Hook config path.
+- `mcpServers` (`string`): MCP config path.
+- `apps` (`string`): App manifest path for plugin integrations.
+- `interface` (`object`): Interface/UX metadata block for plugin presentation.
+
+### `interface` fields
+
+- `displayName` (`string`): User-facing title shown for the plugin.
+- `shortDescription` (`string`): Brief subtitle used in compact views.
+- `longDescription` (`string`): Longer description used on details screens.
+- `developerName` (`string`): Human-readable publisher name.
+- `category` (`string`): Plugin category bucket.
+- `capabilities` (`array` of `string`): Capability list from implementation.
+- `websiteURL` (`string`): Public website for the plugin.
+- `privacyPolicyURL` (`string`): Privacy policy URL.
+- `termsOfServiceURL` (`string`): Terms of service URL.
+- `defaultPrompt` (`array` of `string`): Starter prompts shown in composer/UX context.
+  - Include at most 3 strings. Entries after the first 3 are ignored and will not be included.
+  - Each string is capped at 128 characters. Longer entries are truncated.
+  - Prefer short starter prompts around 50 characters so they scan well in the UI.
+- `brandColor` (`string`): Theme color for the plugin card.
+- `composerIcon` (`string`): Path to icon asset.
+- `logo` (`string`): Path to logo asset.
+- `screenshots` (`array` of `string`): List of screenshot asset paths.
+  - Screenshot entries must be PNG filenames and stored under `./assets/`.
+  - Keep file paths relative to plugin root.
+
+### Path conventions and defaults
+
+- Path values should be relative and begin with `./`.
+- `skills`, `hooks`, and `mcpServers` paths supplement default component discovery; they do not replace the defaults.
+- Custom path values must follow the plugin root convention and naming/namespacing rules.
+- This repo’s scaffold writes `.codex-plugin/plugin.json`; treat that as the manifest location this skill generates.
+
+# Marketplace JSON sample spec
+
+`marketplace.json` depends on where the plugin should live. New plugin creation defaults to the
+personal marketplace unless the caller explicitly requests a repo-local destination:
+
+- Personal plugin: `~/.agents/plugins/marketplace.json`
+- Repo/team plugin: `<repo-root>/.agents/plugins/marketplace.json`
+
+```json
+{
+  "name": "openai-curated",
+  "interface": {
+    "displayName": "ChatGPT Official"
+  },
+  "plugins": [
+    {
+      "name": "linear",
+      "source": {
+        "source": "local",
+        "path": "./plugins/linear"
+      },
+      "policy": {
+        "installation": "AVAILABLE",
+        "authentication": "ON_INSTALL"
+      },
+      "category": "Productivity"
+    }
+  ]
+}
+```
+
+## Marketplace field guide
+
+### Top-level fields
+
+- `name` (`string`): Marketplace identifier or catalog name.
+- `interface` (`object`, optional): Marketplace presentation metadata.
+- `plugins` (`array`): Ordered plugin entries. This order determines how Codex renders plugins.
+
+### `interface` fields
+
+- `displayName` (`string`, optional): User-facing marketplace title.
+
+### Plugin entry fields
+
+- `name` (`string`): Plugin identifier. Match the plugin folder name and `plugin.json` `name`.
+- `source` (`object`): Plugin source descriptor.
+  - `source` (`string`): Use `local` for this repo workflow.
+  - `path` (`string`): Relative plugin path based on the marketplace root.
+    - Personal plugin in `~/.agents/plugins/marketplace.json`: `./plugins/<plugin-name>`
+    - Repo/team plugin: `./plugins/<plugin-name>`
+  - The same relative path convention is used for both personal and repo/team marketplaces.
+    - Example: with `~/.agents/plugins/marketplace.json`, `./plugins/<plugin-name>` resolves to
+      `~/plugins/<plugin-name>`.
+- `policy` (`object`): Marketplace policy block. Always include it.
+  - `installation` (`string`): Availability policy.
+    - Allowed values: `NOT_AVAILABLE`, `AVAILABLE`, `INSTALLED_BY_DEFAULT`
+    - Default for new entries: `AVAILABLE`
+  - `authentication` (`string`): Authentication timing policy.
+    - Allowed values: `ON_INSTALL`, `ON_USE`
+    - Default for new entries: `ON_INSTALL`
+  - `products` (`array` of `string`, optional): Product override for this plugin entry. Omit it unless product gating is explicitly requested.
+- `category` (`string`): Display category bucket. Always include it.
+
+### Marketplace generation rules
+
+- `displayName` belongs under the top-level `interface` object, not individual plugin entries.
+- When creating a new marketplace file from scratch, seed `interface.displayName` alongside top-level `name`.
+- Always include `policy.installation`, `policy.authentication`, and `category` on every generated or updated plugin entry.
+- Treat `policy.products` as an override and omit it unless explicitly requested.
+- Append new entries unless the user explicitly requests reordering.
+- Replace an existing entry for the same plugin only when overwrite is intentional.
+- Default new plugin creation to the personal marketplace.
+- Use a repo/team marketplace only when the user specifically requests that destination.
+- Only override the marketplace `name` when the default `personal` name is already taken or
+  installed and you need to seed a different new marketplace file.
+- Choose marketplace location to match the selected destination:
+  - Personal plugin: `~/.agents/plugins/marketplace.json`
+  - Repo/team plugin: `<repo-root>/.agents/plugins/marketplace.json`
+
+### Plugin validation notes
+
+- The validator mirrors the workspace plugin ingestion schema so generated plugins follow the same
+  manifest contract from the start.
+- Plugin manifests must include real values for `name`, `version`, `description`,
+  `author.name`, and the required `interface` fields.
+- `version` must use strict semver.
+- `websiteURL`, `privacyPolicyURL`, and `termsOfServiceURL` must be absolute `https://` URLs when
+  present.
+- `composerIcon`, `logo`, and `screenshots` must point to real files inside the plugin archive when
+  present.
+- `apps` and `mcpServers` should appear in `plugin.json` only when `.app.json` and `.mcp.json`
+  actually exist.
+- Validation rejects unsupported manifest fields such as `hooks`, so the scaffold keeps them out of
+  generated manifests.
+- Run `scripts/validate_plugin.py <plugin-path>` before handing back a generated plugin. It adds one
+  intentional preflight check that rejects leftover `[TODO: ...]` placeholders.
diff --git a/skills/plugin-creator/scripts/create_basic_plugin.py b/skills/plugin-creator/scripts/create_basic_plugin.py
new file mode 100644
index 0000000..78b9fca
--- /dev/null
+++ b/skills/plugin-creator/scripts/create_basic_plugin.py
@@ -0,0 +1,324 @@
+#!/usr/bin/env python3
+"""Scaffold a plugin directory and optionally update marketplace.json."""
+
+from __future__ import annotations
+
+import argparse
+import json
+import re
+from pathlib import Path
+from typing import Any
+
+
+MAX_PLUGIN_NAME_LENGTH = 64
+DEFAULT_INSTALL_POLICY = "AVAILABLE"
+DEFAULT_AUTH_POLICY = "ON_INSTALL"
+DEFAULT_CATEGORY = "Productivity"
+DEFAULT_MARKETPLACE_NAME = "personal"
+VALID_INSTALL_POLICIES = {"NOT_AVAILABLE", "AVAILABLE", "INSTALLED_BY_DEFAULT"}
+VALID_AUTH_POLICIES = {"ON_INSTALL", "ON_USE"}
+DEFAULT_PLUGIN_PARENT = Path.home() / "plugins"
+DEFAULT_MARKETPLACE_PATH = Path.home() / ".agents" / "plugins" / "marketplace.json"
+
+
+def normalize_plugin_name(plugin_name: str) -> str:
+    """Lowercase `plugin_name` and turn each non-alphanumeric run into one hyphen."""
+    lowered = plugin_name.strip().lower()
+    # Each maximal run outside [a-z0-9] (hyphens included) becomes a single "-",
+    # so doubled hyphens cannot occur and only the two ends need trimming.
+    hyphenated = re.sub(r"[^a-z0-9]+", "-", lowered)
+    return hyphenated.strip("-")
+
+
+def validate_plugin_name(plugin_name: str) -> None:
+    """Raise ValueError when the normalized name is empty or exceeds the length limit."""
+    if not plugin_name:
+        raise ValueError("Plugin name must include at least one letter or digit.")
+    length = len(plugin_name)
+    if length > MAX_PLUGIN_NAME_LENGTH:
+        too_long = f"Plugin name '{plugin_name}' is too long ({length} characters). "
+        raise ValueError(too_long + f"Maximum is {MAX_PLUGIN_NAME_LENGTH} characters.")
+
+
+def validate_marketplace_name(marketplace_name: str) -> None:
+    """Raise ValueError unless the name is non-empty and matches [A-Za-z0-9_-]+."""
+    if not marketplace_name:
+        raise ValueError("Marketplace name must include at least one letter or digit.")
+    allowed = re.compile(r"[A-Za-z0-9_-]+")
+    if not allowed.fullmatch(marketplace_name):
+        raise ValueError("Marketplace name may only contain ASCII letters, digits, `_`, and `-`.")
+
+
+def display_name_from_plugin_name(plugin_name: str) -> str:  # "my-plugin" -> "My Plugin"
+    return " ".join(map(str.capitalize, re.split(r"[-_]+", plugin_name)))
+
+
+def build_plugin_json(plugin_name: str, *, with_mcp: bool, with_apps: bool) -> dict[str, Any]:
+    """Build the plugin.json payload for a new scaffold, keyed off the plugin name."""
+    title = display_name_from_plugin_name(plugin_name)
+    interface: dict[str, Any] = {
+        "displayName": title,
+        "shortDescription": f"Use {title} in Codex.",
+        "longDescription": f"{title} adds a local Codex plugin scaffold.",
+        "developerName": "Local developer",
+        "category": DEFAULT_CATEGORY,
+        "capabilities": [],
+        "defaultPrompt": f"Help me use {title}.",
+    }
+    manifest: dict[str, Any] = {
+        "name": plugin_name,
+        "version": "0.1.0",
+        "description": f"{title} plugin",
+        "author": {"name": "Local developer"},
+        "skills": "./skills/",
+        "interface": interface,
+    }
+    if with_mcp:
+        manifest["mcpServers"] = "./.mcp.json"
+    if with_apps:
+        manifest["apps"] = "./.app.json"
+    return manifest
+
+
+def build_marketplace_entry(
+    plugin_name: str,
+    install_policy: str,
+    auth_policy: str,
+    category: str,
+) -> dict[str, Any]:
+    """Build the marketplace.json entry for a locally sourced plugin.
+
+    The source path is always ./plugins/<plugin_name>.
+    """
+    source = {"source": "local", "path": f"./plugins/{plugin_name}"}
+    policy = {"installation": install_policy, "authentication": auth_policy}
+    return {
+        "name": plugin_name,
+        "source": source,
+        "policy": policy,
+        "category": category,
+    }
+
+
+def load_json(path: Path) -> dict[str, Any]:
+    """Parse `path` as UTF-8 JSON; explicit encoding avoids locale-dependent decoding."""
+    return json.loads(path.read_text(encoding="utf-8"))
+
+
+def build_default_marketplace(marketplace_name: str) -> dict[str, Any]:
+    """Return a new, plugin-less marketplace payload named `marketplace_name`."""
+    title = display_name_from_plugin_name(marketplace_name)
+    return {
+        "name": marketplace_name,
+        "interface": {"displayName": title},
+        "plugins": [],
+    }
+
+
+def validate_marketplace_interface(payload: dict[str, Any]) -> None:
+    """Raise ValueError when an `interface` field is present but is not an object."""
+    if not isinstance(payload.get("interface"), (dict, type(None))):
+        raise ValueError("marketplace.json field 'interface' must be an object.")
+
+
+def update_marketplace_json(  # Add or replace one plugin entry in marketplace.json.
+    marketplace_path: Path,
+    marketplace_name: str | None,
+    plugin_name: str,
+    install_policy: str,
+    auth_policy: str,
+    category: str,
+    force: bool,
+) -> None:
+    if marketplace_path.exists():
+        payload = load_json(marketplace_path)
+    else:
+        payload = build_default_marketplace(marketplace_name or DEFAULT_MARKETPLACE_NAME)
+    # load_json can return any JSON value, so reject a non-object top level here.
+    if not isinstance(payload, dict):
+        raise ValueError(f"{marketplace_path} must contain a JSON object.")
+
+    validate_marketplace_interface(payload)
+    # The name check below runs only when the caller passed an explicit marketplace name.
+    existing_marketplace_name = payload.get("name")
+    if marketplace_name is not None:
+        if not isinstance(existing_marketplace_name, str) or not existing_marketplace_name.strip():
+            raise ValueError(f"{marketplace_path} must contain a non-empty string 'name'.")
+        if existing_marketplace_name != marketplace_name:
+            raise ValueError(
+                f"{marketplace_path} already uses marketplace name "
+                f"'{existing_marketplace_name}'. Create a new marketplace file to use "
+                f"'{marketplace_name}' instead."
+            )
+    # setdefault inserts an empty list into the payload when `plugins` is missing.
+    plugins = payload.setdefault("plugins", [])
+    if not isinstance(plugins, list):
+        raise ValueError(f"{marketplace_path} field 'plugins' must be an array.")
+
+    new_entry = build_marketplace_entry(plugin_name, install_policy, auth_policy, category)
+    # Replace the first entry with this plugin name (only with force); otherwise append.
+    for index, entry in enumerate(plugins):
+        if isinstance(entry, dict) and entry.get("name") == plugin_name:
+            if not force:
+                raise FileExistsError(
+                    f"Marketplace entry '{plugin_name}' already exists in {marketplace_path}. "
+                    "Use --force to overwrite that entry."
+                )
+            plugins[index] = new_entry
+            break
+    else:
+        plugins.append(new_entry)
+    # force=True lets write_json overwrite the file; entry-level overwrite was gated above.
+    write_json(marketplace_path, payload, force=True)
+
+
+def write_json(path: Path, data: dict, force: bool) -> None:
+    """Write `data` to `path` as indented UTF-8 JSON; refuse to overwrite unless `force`."""
+    if path.exists() and not force:
+        raise FileExistsError(f"{path} already exists. Use --force to overwrite.")
+    path.parent.mkdir(parents=True, exist_ok=True)
+    # Serialize before opening so a failed dump cannot truncate an existing file.
+    path.write_text(json.dumps(data, indent=2) + "\n", encoding="utf-8")
+
+
+def create_stub_file(path: Path, payload: dict, force: bool) -> None:
+    """Write a placeholder JSON file; an existing file is kept unless `force` is set."""
+    keep_existing = path.exists() and not force
+    if keep_existing:
+        return
+    # Same write sequence as write_json once the existence check has been settled here.
+    write_json(path, payload, force=True)
+
+
+def parse_args() -> argparse.Namespace:
+    parser = argparse.ArgumentParser(
+        description="Create a plugin skeleton with a validation-ready plugin.json."
+    )
+    parser.add_argument("plugin_name")
+    parser.add_argument(
+        "--path",
+        default=str(DEFAULT_PLUGIN_PARENT),
+        help=(
+            "Parent directory for plugin creation (defaults to <home>/plugins). "
+            "Pass an explicit repo path only when a repo/team plugin is intended."
+        ),
+    )
+    parser.add_argument("--with-skills", action="store_true", help="Create skills/ directory")
+    parser.add_argument("--with-hooks", action="store_true", help="Create hooks/ directory")
+    parser.add_argument("--with-scripts", action="store_true", help="Create scripts/ directory")
+    parser.add_argument("--with-assets", action="store_true", help="Create assets/ directory")
+    parser.add_argument("--with-mcp", action="store_true", help="Create .mcp.json placeholder")
+    parser.add_argument("--with-apps", action="store_true", help="Create .app.json placeholder")
+    parser.add_argument(
+        "--with-marketplace",
+        action="store_true",
+        help=(
+            "Create or update <home>/.agents/plugins/marketplace.json by default. "
+            "Marketplace entries always point to ./plugins/<plugin-name> relative to the "
+            "marketplace root."
+        ),
+    )
+    parser.add_argument(
+        "--marketplace-path",
+        default=str(DEFAULT_MARKETPLACE_PATH),
+        help=(
+            "Path to marketplace.json (defaults to <home>/.agents/plugins/marketplace.json). "
+            "Pass a repo-rooted marketplace path only when a repo/team plugin is intended."
+        ),
+    )
+    parser.add_argument(
+        "--marketplace-name",
+        help=(
+            "Marketplace name to seed into a new marketplace.json. Use this only when the default "
+            "'personal' marketplace name is already taken and you need a different new marketplace."
+        ),
+    )
+    parser.add_argument(
+        "--install-policy",
+        default=DEFAULT_INSTALL_POLICY,
+        choices=sorted(VALID_INSTALL_POLICIES),
+        help="Marketplace policy.installation value",
+    )
+    parser.add_argument(
+        "--auth-policy",
+        default=DEFAULT_AUTH_POLICY,
+        choices=sorted(VALID_AUTH_POLICIES),
+        help="Marketplace policy.authentication value",
+    )
+    parser.add_argument(
+        "--category",
+        default=DEFAULT_CATEGORY,
+        help="Marketplace category value",
+    )
+    parser.add_argument("--force", action="store_true", help="Overwrite existing files")
+    return parser.parse_args()
+
+
+def main() -> None:  # CLI entry point: scaffold the plugin, then optionally register it.
+    args = parse_args()
+    raw_plugin_name = args.plugin_name
+    plugin_name = normalize_plugin_name(raw_plugin_name)
+    if plugin_name != raw_plugin_name:
+        print(f"Note: Normalized plugin name from '{raw_plugin_name}' to '{plugin_name}'.")
+    validate_plugin_name(plugin_name)
+    marketplace_name = None
+    if args.marketplace_name is not None:
+        marketplace_name = args.marketplace_name.strip()
+        validate_marketplace_name(marketplace_name)
+    # exist_ok=True: an already-present plugin directory is reused rather than rejected.
+    plugin_root = (Path(args.path).expanduser().resolve() / plugin_name)
+    plugin_root.mkdir(parents=True, exist_ok=True)
+    # write_json raises FileExistsError when plugin.json exists and --force was not passed.
+    plugin_json_path = plugin_root / ".codex-plugin" / "plugin.json"
+    write_json(
+        plugin_json_path,
+        build_plugin_json(plugin_name, with_mcp=args.with_mcp, with_apps=args.with_apps),
+        args.force,
+    )
+
+    optional_directories = {
+        "skills": args.with_skills,
+        "hooks": args.with_hooks,
+        "scripts": args.with_scripts,
+        "assets": args.with_assets,
+    }
+    for folder, enabled in optional_directories.items():
+        if enabled:
+            (plugin_root / folder).mkdir(parents=True, exist_ok=True)
+    # create_stub_file leaves an existing stub untouched unless --force was passed.
+    if args.with_mcp:
+        create_stub_file(
+            plugin_root / ".mcp.json",
+            {"mcpServers": {}},
+            args.force,
+        )
+
+    if args.with_apps:
+        create_stub_file(
+            plugin_root / ".app.json",
+            {
+                "apps": {},
+            },
+            args.force,
+        )
+    # marketplace_path is bound only in this branch; the final print is guarded the same way.
+    if args.with_marketplace:
+        marketplace_path = Path(args.marketplace_path).expanduser().resolve()
+        update_marketplace_json(
+            marketplace_path,
+            marketplace_name,
+            plugin_name,
+            args.install_policy,
+            args.auth_policy,
+            args.category,
+            args.force,
+        )
+
+    print(f"Created plugin scaffold: {plugin_root}")
+    print(f"plugin manifest: {plugin_json_path}")
+    if args.with_marketplace:
+        print(f"marketplace manifest: {marketplace_path}")
+
+
+if __name__ == "__main__":
+    main()
diff --git a/skills/plugin-creator/scripts/read_marketplace_name.py b/skills/plugin-creator/scripts/read_marketplace_name.py
new file mode 100644
index 0000000..597e9f7
--- /dev/null
+++ b/skills/plugin-creator/scripts/read_marketplace_name.py
@@ -0,0 +1,48 @@
+#!/usr/bin/env python3
+"""Print the top-level marketplace name from any marketplace.json file."""
+
+from __future__ import annotations
+
+import argparse
+import json
+import sys
+from pathlib import Path
+
+
+def default_marketplace_path() -> Path:  # <home>/.agents/plugins/marketplace.json
+    return Path.home().joinpath(".agents", "plugins", "marketplace.json")
+
+
+def parse_args() -> argparse.Namespace:
+    """Parse CLI options; `--marketplace-path` defaults to the personal marketplace file."""
+    summary = (
+        "Print the top-level marketplace name from marketplace.json. Defaults to the personal "
+        "marketplace path under the current home directory."
+    )
+    cli = argparse.ArgumentParser(description=summary)
+    cli.add_argument(
+        "--marketplace-path",
+        default=str(default_marketplace_path()),
+        help="Path to marketplace.json",
+    )
+    return cli.parse_args()
+
+
+def main() -> None:
+    """Print the stripped top-level `name` from the selected marketplace.json."""
+    marketplace_path = Path(parse_args().marketplace_path).expanduser().resolve()
+    document = json.loads(marketplace_path.read_text(encoding="utf-8"))
+    if not isinstance(document, dict):
+        raise ValueError(f"{marketplace_path} must contain a JSON object.")
+    raw_name = document.get("name")
+    if not (isinstance(raw_name, str) and raw_name.strip()):
+        raise ValueError(f"{marketplace_path} must contain a non-empty string 'name'.")
+    print(raw_name.strip())
+
+
+if __name__ == "__main__":
+    try:
+        main()
+    except Exception as err:  # noqa: BLE001 - CLI should surface a single clear message.
+        print(str(err), file=sys.stderr)  # only the message is shown, on stderr
+        raise SystemExit(1) from err  # exit status 1, with the original error as __cause__
diff --git a/skills/plugin-creator/scripts/update_plugin_cachebuster.py b/skills/plugin-creator/scripts/update_plugin_cachebuster.py
new file mode 100644
index 0000000..82d19e5
--- /dev/null
+++ b/skills/plugin-creator/scripts/update_plugin_cachebuster.py
@@ -0,0 +1,78 @@
+#!/usr/bin/env python3
+"""Rewrite a local plugin version to a single Codex cachebuster suffix."""
+
+from __future__ import annotations
+
+import argparse
+import json
+import re
+import sys
+from datetime import datetime, timezone
+from pathlib import Path
+
+
+CACHEBUSTER_PREFIX = "codex"  # label placed right after "+" by with_cachebuster()
+
+
+def parse_args() -> argparse.Namespace:
+    """Parse the plugin root argument and the optional `--cachebuster` token."""
+    summary = (
+        "Rewrite a local plugin's version so it preserves everything before '+' and uses "
+        "a single +codex.<cachebuster> suffix."
+    )
+    cli = argparse.ArgumentParser(description=summary)
+    cli.add_argument("plugin_path", help="Path to the plugin root directory")
+    cli.add_argument(
+        "--cachebuster",
+        help="Optional cachebuster token to embed in the plugin version",
+    )
+    return cli.parse_args()
+
+
+def main() -> None:
+    """Rewrite the manifest `version` in place so it ends in one cachebuster suffix."""
+    args = parse_args()
+    manifest_path = Path(args.plugin_path).expanduser().resolve() / ".codex-plugin" / "plugin.json"
+    manifest = load_manifest(manifest_path)
+    version = manifest.get("version")
+    if not isinstance(version, str) or not version.strip():
+        raise ValueError(f"{manifest_path} must contain a non-empty string 'version'.")
+    cachebuster = sanitize_cachebuster(args.cachebuster or default_cachebuster())
+    next_version = with_cachebuster(version, cachebuster)
+    manifest["version"] = next_version
+    # ensure_ascii=False keeps non-ASCII manifest text as written instead of \uXXXX escapes.
+    serialized = json.dumps(manifest, indent=2, ensure_ascii=False) + "\n"
+    manifest_path.write_text(serialized, encoding="utf-8")
+    print(f"Updated plugin version: {version} -> {next_version}")
+
+
+def load_manifest(manifest_path: Path) -> dict[str, object]:  # returns the parsed JSON object
+    if not manifest_path.is_file():  # checked first so a missing file gets its own message
+        raise FileNotFoundError(f"missing manifest: {manifest_path}")
+    payload = json.loads(manifest_path.read_text(encoding="utf-8"))  # may raise JSONDecodeError
+    if not isinstance(payload, dict):  # arrays and scalars parse as JSON but are rejected
+        raise ValueError(f"{manifest_path} must contain a JSON object.")
+    return payload
+def sanitize_cachebuster(value: str) -> str:
+    """Lowercase *value* and reduce it to `[a-z0-9]` runs joined by single hyphens."""
+    token = re.sub(r"-{2,}", "-", re.sub(r"[^a-z0-9-]+", "-", value.strip().lower())).strip("-")
+    if token:
+        return token
+    raise ValueError("Cachebuster must contain at least one letter or digit.")
+
+
+def default_cachebuster() -> str:  # current UTC time formatted as YYYYMMDDHHMMSS
+    return format(datetime.now(tz=timezone.utc), "%Y%m%d%H%M%S")
+
+
+def with_cachebuster(version: str, cachebuster: str) -> str:
+    """Replace any `+...` tail of *version* with `+<CACHEBUSTER_PREFIX>.<cachebuster>`."""
+    return f"{version.partition('+')[0]}+{CACHEBUSTER_PREFIX}.{cachebuster}"
+
+
+if __name__ == "__main__":
+    try:
+        main()
+    except Exception as err:  # noqa: BLE001 - CLI should surface a single clear message.
+        print(str(err), file=sys.stderr)  # only the message is shown, on stderr
+        raise SystemExit(1) from err  # exit status 1, with the original error as __cause__
diff --git a/skills/plugin-creator/scripts/validate_plugin.py b/skills/plugin-creator/scripts/validate_plugin.py
new file mode 100644
index 0000000..6f49cb0
--- /dev/null
+++ b/skills/plugin-creator/scripts/validate_plugin.py
@@ -0,0 +1,593 @@
+#!/usr/bin/env python3
+"""Validate a generated plugin against the plugin ingestion contract."""
+
+from __future__ import annotations
+
+import argparse
+import json
+import re
+from pathlib import Path, PurePosixPath
+from typing import Any
+from urllib.parse import urlparse
+
+import yaml
+
+
+TODO_MARKER = "[TODO:"  # substring that reject_todo_markers() looks for in manifest strings
+SEMVER_RE = re.compile(
+    r"^(0|[1-9]\d*)\."  # major: no leading zeros
+    r"(0|[1-9]\d*)\."  # minor
+    r"(0|[1-9]\d*)"  # patch
+    r"(?:-(?:0|[1-9]\d*|\d*[A-Za-z-][0-9A-Za-z-]*)(?:\."
+    r"(?:0|[1-9]\d*|\d*[A-Za-z-][0-9A-Za-z-]*))*)?"  # optional "-" dot-separated pre-release
+    r"(?:\+[0-9A-Za-z-]+(?:\.[0-9A-Za-z-]+)*)?$"  # optional "+" dot-separated build metadata
+)
+HEX_COLOR_RE = re.compile(r"^#[0-9A-F]{6}$", re.IGNORECASE)  # "#RRGGBB", either letter case
+
+
+def parse_args() -> argparse.Namespace:  # the CLI takes one positional: plugin_path
+    cli = argparse.ArgumentParser(description="Validate a local Codex plugin.")
+    cli.add_argument("plugin_path", help="Path to the plugin root directory")
+    return cli.parse_args()
+
+
+def main() -> None:
+    """Validate the plugin given on the command line; list errors and exit 1 if any."""
+    args = parse_args()
+    plugin_root = Path(args.plugin_path).expanduser().resolve()
+    problems = validate_plugin(plugin_root)
+    if problems:
+        print("Plugin validation failed:")
+        print("\n".join(f"- {problem}" for problem in problems))
+        raise SystemExit(1)
+    print(f"Plugin validation passed: {plugin_root}")
+
+
+def validate_plugin(plugin_root: Path) -> list[str]:
+    """Return every validation error found for the plugin rooted at *plugin_root*."""
+    problems: list[str] = []
+    manifest_path = plugin_root / ".codex-plugin" / "plugin.json"
+    manifest = load_json_object(manifest_path, problems)
+    if manifest is not None:
+        # The remaining checks need a parsed manifest object to inspect.
+        reject_todo_markers(manifest, "$", problems)
+        validate_manifest_shape(plugin_root, manifest, problems)
+    return problems
+
+
+def load_json_object(path: Path, errors: list[str]) -> dict[str, Any] | None:
+    """Return the manifest object at *path*, or record one error and return None."""
+    if not path.is_file():
+        errors.append("missing `.codex-plugin/plugin.json`")
+        return None
+    try:
+        payload = json.loads(path.read_text(encoding="utf-8"))
+    except json.JSONDecodeError:
+        errors.append("`.codex-plugin/plugin.json` must be valid JSON")
+        return None
+    except (OSError, UnicodeDecodeError):  # non-UTF-8 bytes: report as unreadable, do not crash
+        errors.append("unable to read `.codex-plugin/plugin.json`")
+        return None
+    if not isinstance(payload, dict):
+        errors.append("`.codex-plugin/plugin.json` must contain a JSON object")
+    return payload if isinstance(payload, dict) else None
+
+
+def reject_todo_markers(value: Any, path: str, errors: list[str]) -> None:
+    """Recursively report every string under *value* that still contains TODO_MARKER."""
+    if isinstance(value, str):
+        if TODO_MARKER in value:
+            errors.append(f"{path} still contains a `[TODO: ...]` placeholder")
+    elif isinstance(value, list):
+        for position, element in enumerate(value):
+            reject_todo_markers(element, f"{path}[{position}]", errors)
+    elif isinstance(value, dict):
+        for name, element in value.items():
+            reject_todo_markers(element, f"{path}.{name}", errors)
+    # Any other value (number, boolean, null) cannot contain the marker and is skipped.
+
+
+def validate_manifest_shape(  # schema checks for the parsed plugin.json; appends to `errors`
+    plugin_root: Path,
+    manifest: dict[str, Any],
+    errors: list[str],
+) -> None:
+    allowed_keys = {
+        "id",
+        "name",
+        "version",
+        "description",
+        "skills",
+        "apps",
+        "mcpServers",
+        "interface",
+        "author",
+        "homepage",
+        "repository",
+        "license",
+        "keywords",
+    }
+    for key in sorted(set(manifest) - allowed_keys):
+        errors.append(f"plugin.json field `{key}` is not accepted by plugin validation")
+    # Top-level scalars: `id` is optional; `name`, `version` and `description` are required.
+    validate_optional_non_empty_string(manifest, "id", errors)
+    require_non_empty_string(manifest, "name", errors)
+    version = require_non_empty_string(manifest, "version", errors)
+    if version is not None and SEMVER_RE.fullmatch(version) is None:
+        errors.append("plugin.json field `version` must be strict semver")
+    require_non_empty_string(manifest, "description", errors)
+    # `author` must be an object with a required `name`; `email` and `url` are optional.
+    author = require_object(manifest, "author", errors)
+    if author is not None:
+        reject_unknown_fields(author, {"name", "email", "url"}, "author", errors)
+        require_non_empty_string(author, "name", errors, prefix="author")
+        validate_optional_non_empty_string(author, "email", errors, prefix="author")
+        validate_optional_https_url(author, "url", errors, prefix="author")
+    # Component pointers, when present, must normalize to these exact relative paths.
+    validate_optional_contract_path(manifest, "skills", "skills", errors)
+    validate_optional_contract_path(manifest, "apps", ".app.json", errors)
+    validate_optional_contract_path(manifest, "mcpServers", ".mcp.json", errors)
+    # A companion file is only validated when plugin.json declares the matching field.
+    if manifest.get("apps") is not None:
+        validate_app_manifest(
+            plugin_root / ".app.json",
+            errors,
+        )
+    if manifest.get("mcpServers") is not None:
+        validate_mcp_manifest(
+            plugin_root / ".mcp.json",
+            errors,
+        )
+    validate_skill_manifests(plugin_root, errors)  # runs whether or not `skills` is declared
+    # Everything below inspects `interface`; without that object there is nothing to check.
+    interface = require_object(manifest, "interface", errors)
+    if interface is None:
+        return
+    reject_unknown_fields(
+        interface,
+        {
+            "displayName",
+            "shortDescription",
+            "longDescription",
+            "developerName",
+            "category",
+            "capabilities",
+            "websiteURL",
+            "privacyPolicyURL",
+            "termsOfServiceURL",
+            "brandColor",
+            "composerIcon",
+            "logo",
+            "screenshots",
+            "defaultPrompt",
+            "default_prompt",
+        },
+        "interface",
+        errors,
+    )
+    for field in (  # required display strings
+        "displayName",
+        "shortDescription",
+        "longDescription",
+        "developerName",
+        "category",
+    ):
+        require_non_empty_string(interface, field, errors, prefix="interface")
+    if "defaultPrompt" not in interface and "default_prompt" not in interface:
+        errors.append(  # only the key's presence is checked here, not the value's type
+            "plugin.json field `interface.defaultPrompt` or `interface.default_prompt` is required"
+        )
+    capabilities = interface.get("capabilities")  # required: a missing key fails the list check
+    if not isinstance(capabilities, list) or not all(
+        isinstance(value, str) and value.strip() for value in capabilities
+    ):
+        errors.append("plugin.json field `interface.capabilities` must be an array of strings")
+    for field in ("websiteURL", "privacyPolicyURL", "termsOfServiceURL"):
+        validate_optional_https_url(interface, field, errors, prefix="interface")
+    brand_color = interface.get("brandColor")  # optional
+    if brand_color is not None and (
+        not isinstance(brand_color, str) or HEX_COLOR_RE.fullmatch(brand_color) is None
+    ):
+        errors.append("plugin.json field `interface.brandColor` must use `#RRGGBB`")
+    for field in ("composerIcon", "logo"):  # resolved against, and confined to, plugin_root
+        validate_optional_asset_path(plugin_root, plugin_root, interface, field, errors)
+    screenshots = interface.get("screenshots", [])  # an absent key means no screenshots
+    if not isinstance(screenshots, list):
+        errors.append("plugin.json field `interface.screenshots` must be an array")
+    else:
+        for index, raw_path in enumerate(screenshots):
+            validate_asset_path(
+                plugin_root,
+                plugin_root,
+                raw_path,
+                f"interface.screenshots[{index}]",
+                errors,
+            )
+
+
+def require_object(payload: dict[str, Any], key: str, errors: list[str]) -> dict[str, Any] | None:
+    """Return `payload[key]` when it is an object; otherwise record an error and return None.
+
+    A missing key is reported the same way as a value of the wrong type.
+    """
+    candidate = payload.get(key)
+    if isinstance(candidate, dict):
+        return candidate
+    errors.append(f"plugin.json field `{key}` must be an object")
+    return None
+
+
+def require_non_empty_string(
+    payload: dict[str, Any], key: str, errors: list[str], *, prefix: str | None = None
+) -> str | None:
+    """Return `payload[key]` unchanged if it is a non-blank string; else record an error.
+
+    The error names the field as `prefix.key` when *prefix* is given, and None is returned.
+    """
+    text = payload.get(key)
+    if isinstance(text, str) and text.strip():
+        return text
+    label = key if prefix is None else f"{prefix}.{key}"
+    errors.append(f"plugin.json field `{label}` must be a non-empty string")
+    return None
+
+
+def validate_optional_non_empty_string(
+    payload: dict[str, Any], key: str, errors: list[str], *, prefix: str | None = None
+) -> None:
+    """Record an error when `payload[key]` is present but is not a non-blank string.
+
+    A missing key and an explicit null are both accepted without an error.
+    """
+    text = payload.get(key)
+    if text is None or (isinstance(text, str) and text.strip()):
+        return
+    # Only reached for a present value that has the wrong type or is blank.
+    label = key if prefix is None else f"{prefix}.{key}"
+    errors.append(f"plugin.json field `{label}` must be a non-empty string")
+
+
+def reject_unknown_fields(
+    payload: dict[str, Any], allowed_keys: set[str], prefix: str, errors: list[str]
+) -> None:
+    """Record one error, labelled `prefix.key`, for each key outside *allowed_keys*."""
+    unexpected = sorted(payload.keys() - allowed_keys)
+    # Sorted so the reported order does not depend on key order in the file.
+    for name in unexpected:
+        errors.append(f"plugin.json field `{prefix}.{name}` is not accepted by plugin validation")
+
+
+def validate_optional_https_url(
+    payload: dict[str, Any], key: str, errors: list[str], *, prefix: str
+) -> None:
+    """Record an error unless `payload[key]` is absent, null, or an absolute `https://` URL."""
+    value = payload.get(key)
+    if value is None:
+        return
+    try:
+        parsed = urlparse(value) if isinstance(value, str) else None
+    except ValueError:  # urlparse raises, e.g. "Invalid IPv6 URL" for an unbalanced "["
+        parsed = None
+    if parsed is None or parsed.scheme != "https" or not parsed.netloc:
+        errors.append(f"plugin.json field `{prefix}.{key}` must be an absolute `https://` URL")
+
+
+def validate_optional_contract_path(
+    payload: dict[str, Any], key: str, expected: str, errors: list[str]
+) -> None:
+    """Record an error when `payload[key]` is set but does not normalize to *expected*.
+
+    Absent and null values are accepted; a non-string value always fails.
+    """
+    raw = payload.get(key)
+    if raw is None:
+        return
+    if not isinstance(raw, str) or normalize_contract_path(raw) != expected:
+        errors.append(f"plugin.json field `{key}` must resolve to `{expected}`")
+
+
+def normalize_contract_path(raw_path: str) -> str | None:
+    """Return *raw_path* in POSIX form without trailing slashes; None if absolute or empty."""
+    candidate = Path(raw_path)
+    if candidate.is_absolute():
+        return None
+    return candidate.as_posix().rstrip("/") or None
+
+
+def validate_app_manifest(path: Path, errors: list[str]) -> None:
+    """Validate the `.app.json` companion: an `apps` object whose entries carry an `id`."""
+    document = load_companion_json_object(path, "`.app.json`", errors)
+    if document is None:
+        return
+    reject_companion_unknown_fields(document, {"apps"}, "`.app.json`", errors)
+    apps = document.get("apps")
+    if not isinstance(apps, dict):
+        errors.append("`.app.json` field `apps` must be an object")
+        return
+    # Each entry is checked on its own, so one malformed app does not hide the others.
+    for app_key, entry in apps.items():
+        where = f"`.app.json` app `{app_key}`"
+        if not isinstance(entry, dict):
+            errors.append(f"{where} must be an object")
+            continue
+        reject_companion_unknown_fields(entry, {"id", "category"}, where, errors)
+        app_id = entry.get("id")
+        if not (isinstance(app_id, str) and app_id.strip()):
+            errors.append(f"{where} field `id` must be a non-empty string")
+        category = entry.get("category")
+        # `category` is optional, but when present it must be a non-blank string.
+        if category is not None and not (isinstance(category, str) and category.strip()):
+            errors.append(f"{where} field `category` must be a non-empty string")
+
+
+def validate_mcp_manifest(path: Path, errors: list[str]) -> None:  # checks `.mcp.json` shape
+    payload = load_companion_json_object(path, "`.mcp.json`", errors)
+    if payload is None:  # the loader has already recorded why the file is unusable
+        return
+    reject_companion_unknown_fields(payload, {"mcpServers"}, "`.mcp.json`", errors)
+    servers = payload.get("mcpServers")
+    if not isinstance(servers, dict):
+        errors.append("`.mcp.json` field `mcpServers` must be an object")
+        return
+    for key, value in servers.items():
+        if not isinstance(key, str) or not key.strip():  # rejects "" and whitespace-only names
+            errors.append("`.mcp.json` server names must be non-empty strings")
+        if not isinstance(value, dict):  # only the container type is checked, not its contents
+            errors.append(f"`.mcp.json` server `{key}` must be an object")
+
+
+def load_companion_json_object(path: Path, label: str, errors: list[str]) -> dict[str, Any] | None:
+    """Load a companion manifest file as a JSON object.
+
+    Returns the parsed dict, or None after recording one error that starts with *label*.
+    """
+    if not path.is_file():
+        errors.append(f"{label} is required when its plugin.json field is present")
+        return None
+    try:
+        payload = json.loads(path.read_text(encoding="utf-8"))
+    except (OSError, ValueError):  # ValueError covers bad JSON and non-UTF-8 bytes alike
+        errors.append(f"{label} must contain valid JSON")
+        return None
+    if not isinstance(payload, dict):
+        errors.append(f"{label} must contain a JSON object")
+        return None
+    return payload
+
+
+def reject_companion_unknown_fields(
+    payload: dict[str, Any], allowed_keys: set[str], prefix: str, errors: list[str]
+) -> None:
+    """Record one error, introduced by *prefix*, for each key outside *allowed_keys*."""
+    unexpected = sorted(payload.keys() - allowed_keys)
+    # Sorted so the reported order does not depend on key order in the file.
+    for name in unexpected:
+        errors.append(f"{prefix} field `{name}` is not accepted by plugin validation")
+
+
+def validate_skill_manifests(plugin_root: Path, errors: list[str]) -> None:
+    """Validate each non-hidden directory under `<plugin_root>/skills`, in name order."""
+    skills_dir = plugin_root / "skills"
+    if not skills_dir.is_dir():
+        return
+    for entry in sorted(skills_dir.iterdir(), key=lambda item: item.name):
+        if not entry.name.startswith(".") and entry.is_dir():
+            validate_skill_manifest(entry, errors)
+
+
+def validate_skill_manifest(skill_root: Path, errors: list[str]) -> None:
+    """Validate one skill directory: `SKILL.md` frontmatter and, if present, its agent YAML."""
+    skill = skill_root.name
+    skill_md_path = skill_root / "SKILL.md"
+    if not skill_md_path.is_file():
+        errors.append(f"skill `{skill}` is missing `SKILL.md`")
+        return
+    try:
+        contents = skill_md_path.read_text(encoding="utf-8")
+    except (OSError, UnicodeDecodeError):  # non-UTF-8 bytes: report, do not crash
+        errors.append(f"unable to read skill `{skill}`")
+        return
+    # Frontmatter must open on the very first line with a bare "---".
+    if not contents.startswith("---\n"):
+        errors.append(f"skill `{skill}` must start with YAML frontmatter")
+        return
+    frontmatter_end = contents.find("\n---", 4)
+    if frontmatter_end == -1:
+        errors.append(f"skill `{skill}` frontmatter is not closed")
+        return
+    try:
+        frontmatter = yaml.safe_load(contents[4:frontmatter_end])
+    except yaml.YAMLError:
+        errors.append(f"skill `{skill}` frontmatter must be valid YAML")
+        return
+    if not isinstance(frontmatter, dict):
+        errors.append(f"skill `{skill}` frontmatter must be an object")
+        return
+    skill_name = frontmatter.get("name")
+    if not isinstance(skill_name, str) or not skill_name.strip():
+        errors.append(f"skill `{skill}` frontmatter field `name` must be non-empty")
+    description = frontmatter.get("description")
+    if not isinstance(description, str) or not description.strip():
+        errors.append(f"skill `{skill}` frontmatter field `description` must be non-empty")
+    # Both spellings of the flag are honoured; the hyphenated one wins when it is set.
+    disable_model_invocation = frontmatter.get("disable-model-invocation")
+    if disable_model_invocation is None:
+        disable_model_invocation = frontmatter.get("disable_model_invocation")
+    if disable_model_invocation not in (None, False):
+        errors.append(f"skill `{skill}` frontmatter field `disable-model-invocation` must be false")
+    agent_yaml_path = skill_root / "agents" / "openai.yaml"
+    if agent_yaml_path.is_file():
+        validate_skill_agent_manifest(
+            plugin_root=skill_root.parent.parent,
+            skill_root=skill_root,
+            agent_yaml_path=agent_yaml_path,
+            errors=errors,
+        )
+
+
+def validate_skill_agent_manifest(
+    *, plugin_root: Path, skill_root: Path, agent_yaml_path: Path, errors: list[str]
+) -> None:
+    """Validate a skill's agent YAML: `interface`, plus optional `policy` and `dependencies`.
+
+    Icon paths are resolved against *skill_root* and must stay inside *plugin_root*.
+    """
+    try:
+        payload = yaml.safe_load(agent_yaml_path.read_text(encoding="utf-8"))
+    except (OSError, UnicodeDecodeError):  # non-UTF-8 bytes: report, do not crash
+        errors.append(f"unable to read skill `{skill_root.name}` agent YAML")
+        return
+    except yaml.YAMLError:
+        errors.append(f"skill `{skill_root.name}` agent YAML must be valid YAML")
+        return
+    if not isinstance(payload, dict):
+        errors.append(f"skill `{skill_root.name}` agent YAML must be an object")
+        return
+
+    reject_skill_agent_unknown_fields(
+        payload,
+        {"interface", "policy", "dependencies"},
+        skill_root,
+        errors,
+    )
+    interface = payload.get("interface")
+    if not isinstance(interface, dict):  # `interface` is the only required section
+        errors.append(f"skill `{skill_root.name}` agent field `interface` must be an object")
+        return
+    reject_skill_agent_unknown_fields(
+        interface,
+        {
+            "display_name",
+            "short_description",
+            "icon_small",
+            "icon_large",
+            "brand_color",
+            "default_prompt",
+        },
+        skill_root,
+        errors,
+        prefix="interface",
+    )
+    for field in ("display_name", "short_description"):  # required strings
+        value = interface.get(field)
+        if not isinstance(value, str) or not value.strip():
+            errors.append(
+                f"skill `{skill_root.name}` agent field `interface.{field}` must be non-empty"
+            )
+    for field in ("icon_small", "icon_large"):  # optional asset paths
+        validate_optional_asset_path(
+            skill_root,
+            plugin_root,
+            interface,
+            field,
+            errors,
+            prefix=f"skill `{skill_root.name}` agent field `interface",  # ".<key>" is appended
+        )
+    brand_color = interface.get("brand_color")
+    if brand_color is not None and (
+        not isinstance(brand_color, str) or HEX_COLOR_RE.fullmatch(brand_color) is None
+    ):
+        errors.append(
+            f"skill `{skill_root.name}` agent field `interface.brand_color` must use `#RRGGBB`"
+        )
+    default_prompt = interface.get("default_prompt")
+    if default_prompt is not None and (
+        not isinstance(default_prompt, str) or not default_prompt.strip()
+    ):
+        errors.append(
+            f"skill `{skill_root.name}` agent field `interface.default_prompt` must be non-empty"
+        )
+
+    policy = payload.get("policy")
+    if policy is not None:
+        if not isinstance(policy, dict):
+            errors.append(f"skill `{skill_root.name}` agent field `policy` must be an object")
+        else:
+            reject_skill_agent_unknown_fields(
+                policy,
+                {"allow_implicit_invocation"},
+                skill_root,
+                errors,
+                prefix="policy",
+            )
+            allow_implicit_invocation = policy.get("allow_implicit_invocation")
+            if allow_implicit_invocation is not None and not isinstance(
+                allow_implicit_invocation,
+                bool,
+            ):
+                errors.append(
+                    f"skill `{skill_root.name}` agent field "
+                    "`policy.allow_implicit_invocation` must be a boolean"
+                )
+
+    dependencies = payload.get("dependencies")
+    if dependencies is not None:
+        if not isinstance(dependencies, dict):
+            errors.append(
+                f"skill `{skill_root.name}` agent field `dependencies` must be an object"
+            )
+        else:
+            reject_skill_agent_unknown_fields(  # only the key set is checked, not `tools` itself
+                dependencies,
+                {"tools"},
+                skill_root,
+                errors,
+                prefix="dependencies",
+            )
+
+
+def reject_skill_agent_unknown_fields(
+    payload: dict[str, Any],
+    allowed_keys: set[str],
+    skill_root: Path,
+    errors: list[str],
+    *,
+    prefix: str | None = None,
+) -> None:
+    """Record one error per key outside *allowed_keys*, labelled `prefix.key` when given."""
+    skill = skill_root.name
+    for name in sorted(payload.keys() - allowed_keys):
+        label = name if prefix is None else f"{prefix}.{name}"
+        errors.append(f"skill `{skill}` agent field `{label}` is not accepted by plugin validation")
+
+
+def validate_optional_asset_path(
+    base_dir: Path,
+    allowed_root: Path,
+    payload: dict[str, Any],
+    key: str,
+    errors: list[str],
+    *,
+    prefix: str = "interface",
+) -> None:
+    """Validate `payload[key]` as an asset path named `prefix.key`; absent or null is fine."""
+    candidate = payload.get(key)
+    if candidate is not None:
+        validate_asset_path(base_dir, allowed_root, candidate, f"{prefix}.{key}", errors)
+
+
+def validate_asset_path(
+    base_dir: Path, allowed_root: Path, raw_path: Any, field: str, errors: list[str]
+) -> None:
+    """Check that *raw_path* names an existing file under *allowed_root*, relative to *base_dir*."""
+    label = field if field.startswith("skill `") else f"plugin.json field `{field}`"
+    # Skill-agent labels arrive as "... `interface.<key>" with the backtick still open.
+    label += "`" * (label.count("`") % 2)
+    if not isinstance(raw_path, str) or not raw_path.strip():
+        errors.append(f"{label} must be a non-empty relative path")
+        return
+    candidate = PurePosixPath(raw_path.replace("\\", "/"))
+    if candidate.is_absolute() or any(part in {"", ".", ".."} for part in candidate.parts):
+        errors.append(f"{label} must stay inside the plugin archive")
+        return
+    # Resolve symlinks first so a link that points outside the root is rejected as well.
+    resolved_path = (base_dir / candidate.as_posix()).resolve()
+    if not resolved_path.is_relative_to(allowed_root.resolve()):
+        errors.append(f"{label} must stay inside the plugin archive")
+        return
+    if not resolved_path.is_file():
+        errors.append(f"{label} points to a missing file")
+
+
+if __name__ == "__main__":  # run main() only when executed as a script, not on import
+    main()
diff --git a/skills/prompt-0ca565e9-3d44-45f1-832d-caa438aceddb/SKILL.md b/skills/prompt-0ca565e9-3d44-45f1-832d-caa438aceddb/SKILL.md
new file mode 100644
index 0000000..859b6e9
--- /dev/null
+++ b/skills/prompt-0ca565e9-3d44-45f1-832d-caa438aceddb/SKILL.md
@@ -0,0 +1,11 @@
+---
+name: "prompt-0ca565e9-3d44-45f1-832d-caa438aceddb"
+description: "文档编辑"
+metadata:
+  short-description: "文档编辑"
+---
+
+# 文档编辑
+
+**规约：定义型修改先找单一权威，禁止外挂补丁。**
+当修改 prompt/schema/状态机/协议语义时，先定位“唯一权威定义区”，优先直接重写该定义；如果改动只是往附近追加说明、例外或补充规则，而没有收束原定义，默认视为错误方案。提交前必须自问：我是在降低信息熵，还是在制造第二套语义。
diff --git a/skills/prompt-0ca565e9-3d44-45f1-832d-caa438aceddb/agents/openai.yaml b/skills/prompt-0ca565e9-3d44-45f1-832d-caa438aceddb/agents/openai.yaml
new file mode 100644
index 0000000..80922d4
--- /dev/null
+++ b/skills/prompt-0ca565e9-3d44-45f1-832d-caa438aceddb/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "文档编辑"
+  short_description: "文档编辑"
+  default_prompt: "Use $prompt-0ca565e9-3d44-45f1-832d-caa438aceddb."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971/SKILL.md b/skills/prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971/SKILL.md
new file mode 100644
index 0000000..3cf610f
--- /dev/null
+++ b/skills/prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971"
+description: "始终批判自己"
+metadata:
+  short-description: "始终批判自己"
+---
+
+# 始终批判自己
+
+始终批判自己，保持批判性思维：做出若干决策后，它们会综合作用产生效果，需要逐项批判其中每一项，最终按优先级和最终预期收益决定是否保留。
diff --git a/skills/prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971/agents/openai.yaml b/skills/prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971/agents/openai.yaml
new file mode 100644
index 0000000..26b71cf
--- /dev/null
+++ b/skills/prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "始终批判自己"
+  short_description: "始终批判自己"
+  default_prompt: "Use $prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-1323c8c8-88a0-40d2-89df-14fc9533a122/SKILL.md b/skills/prompt-1323c8c8-88a0-40d2-89df-14fc9533a122/SKILL.md
new file mode 100644
index 0000000..ef1315d
--- /dev/null
+++ b/skills/prompt-1323c8c8-88a0-40d2-89df-14fc9533a122/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "prompt-1323c8c8-88a0-40d2-89df-14fc9533a122"
+description: "尽量减少确认项"
+metadata:
+  short-description: "尽量减少确认项"
+---
+
+# 尽量减少确认项
+
+实现情况不要找用户确认，因为看代码就可以知道了，得自己看
diff --git a/skills/prompt-1323c8c8-88a0-40d2-89df-14fc9533a122/agents/openai.yaml b/skills/prompt-1323c8c8-88a0-40d2-89df-14fc9533a122/agents/openai.yaml
new file mode 100644
index 0000000..2010a57
--- /dev/null
+++ b/skills/prompt-1323c8c8-88a0-40d2-89df-14fc9533a122/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "尽量减少确认项"
+  short_description: "尽量减少确认项"
+  default_prompt: "Use $prompt-1323c8c8-88a0-40d2-89df-14fc9533a122."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-144929a0-ae69-404b-9f58-a8696378e4e3/SKILL.md b/skills/prompt-144929a0-ae69-404b-9f58-a8696378e4e3/SKILL.md
new file mode 100644
index 0000000..dc879e8
--- /dev/null
+++ b/skills/prompt-144929a0-ae69-404b-9f58-a8696378e4e3/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "prompt-144929a0-ae69-404b-9f58-a8696378e4e3"
+description: "Patch 式改动审阅"
+metadata:
+  short-description: "Patch 式改动审阅"
+---
+
+# Patch 式改动审阅
+
+对于代码改动，在我最终同意“落盘 diff”之前，你只能告知我改动位置以及代码 diff 详情，并按 hunk 粒度为我解释其修改动机和服务对象；最终落盘时还要检查与最新代码状态的一致性。
diff --git a/skills/prompt-144929a0-ae69-404b-9f58-a8696378e4e3/agents/openai.yaml b/skills/prompt-144929a0-ae69-404b-9f58-a8696378e4e3/agents/openai.yaml
new file mode 100644
index 0000000..2d610b2
--- /dev/null
+++ b/skills/prompt-144929a0-ae69-404b-9f58-a8696378e4e3/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "Patch 式改动审阅"
+  short_description: "Patch 式改动审阅"
+  default_prompt: "Use $prompt-144929a0-ae69-404b-9f58-a8696378e4e3."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-15d9a907-a363-4ec7-81ad-806f9418ad72/SKILL.md b/skills/prompt-15d9a907-a363-4ec7-81ad-806f9418ad72/SKILL.md
new file mode 100644
index 0000000..3c935ad
--- /dev/null
+++ b/skills/prompt-15d9a907-a363-4ec7-81ad-806f9418ad72/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "prompt-15d9a907-a363-4ec7-81ad-806f9418ad72"
+description: "pua严肃设计"
+metadata:
+  short-description: "pua严肃设计"
+---
+
+# pua严肃设计
+
+请严肃设计，我们在设计一套精密仪器，跨时代产品
diff --git a/skills/prompt-15d9a907-a363-4ec7-81ad-806f9418ad72/agents/openai.yaml b/skills/prompt-15d9a907-a363-4ec7-81ad-806f9418ad72/agents/openai.yaml
new file mode 100644
index 0000000..d6bc16b
--- /dev/null
+++ b/skills/prompt-15d9a907-a363-4ec7-81ad-806f9418ad72/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "pua严肃设计"
+  short_description: "pua严肃设计"
+  default_prompt: "Use $prompt-15d9a907-a363-4ec7-81ad-806f9418ad72."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-193dd3cd-2722-413b-b88c-12c2af645f80/SKILL.md b/skills/prompt-193dd3cd-2722-413b-b88c-12c2af645f80/SKILL.md
new file mode 100644
index 0000000..6b7f96d
--- /dev/null
+++ b/skills/prompt-193dd3cd-2722-413b-b88c-12c2af645f80/SKILL.md
@@ -0,0 +1,16 @@
+---
+name: "prompt-193dd3cd-2722-413b-b88c-12c2af645f80"
+description: "使用 agent-browser 排查运行时状态"
+metadata:
+  short-description: "使用 agent-browser 排查运行时状态"
+---
+
+# 使用 agent-browser 排查运行时状态
+
+使用 agent-browser 排查运行时状态，
+# 业务指引
+请你 操作 agent-browser 打开 https://10.126.126.231:8111/ 然后通过侧栏进入 HY workspace， 打开 dever_for_dev 项目
+## 运行时 worknote 目录 
+- 我给予你 /opt/store_team_dev/zyc/dever_for_dev/attic/.agent-browser-runtime-workdir 这个工作目录 ，在每个 节点 把你 阶段性 的 操作截图 给我检查，截图 请 前缀 添加时间轴，格式为 <date>-<time>-<截图名称>.<图片文件格式>
+## 开发日常情况适应
+- 请记住这个情况：我们在不断迭代界面，所以界面有时会突然崩掉，原因是其他组件正在热更新。你要适应这种情况：当你感觉遇到了这个问题时，先向我确认刚刚是否出现了热更新，我往往会回答“对，是的”或者“我不确定”；这种情况下请不要被之前的状态误导，重新排查我们关注的问题。
diff --git a/skills/prompt-193dd3cd-2722-413b-b88c-12c2af645f80/agents/openai.yaml b/skills/prompt-193dd3cd-2722-413b-b88c-12c2af645f80/agents/openai.yaml
new file mode 100644
index 0000000..fa510bd
--- /dev/null
+++ b/skills/prompt-193dd3cd-2722-413b-b88c-12c2af645f80/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "使用 agent-browser 排查运行时状态"
+  short_description: "使用 agent-browser 排查运行时状态"
+  default_prompt: "Use $prompt-193dd3cd-2722-413b-b88c-12c2af645f80."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7/SKILL.md b/skills/prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7/SKILL.md
new file mode 100644
index 0000000..c380b4c
--- /dev/null
+++ b/skills/prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7/SKILL.md
@@ -0,0 +1,27 @@
+---
+name: "prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7"
+description: "状态机正确性"
+metadata:
+  short-description: "状态机正确性"
+---
+
+# 状态机正确性
+
+高度抽象规约（公式级）
+任何副作用（发请求/写缓存/写 store/patch UI）都必须是一个纯函数式映射：Effect = f(ActorIdentity, IntentId, TargetIdentity, Payload)
+禁止让 Effect 依赖任何隐式上下文：currentXxx/globalXxx/数组下标对齐/默认回退对象/闭包里过期的 selectedXxx；因为这些在“列表重排 + 异步回写 + 流式并发”下会漂移，导致“写对了 payload，但写错了容器”。
+落地要点（必须同时满足）
+ActorIdentity（我是谁/谁在做）：谁发起这次 effect（组件/Hook/Stream/Workspace），用于界定权限与并发域（如 workspaceId、agentKey/machineKey）。
+IntentId（我这次想做什么）：一次用户意图/事务的稳定编号（如 click/open 的 seq），用于丢弃过期回写。
+TargetIdentity（我对谁做）：被操作对象的最小不可歧义闭包（按场景至少包含：machineKey/agentId + projectId + bucket/filterKey + sessionId/cursor）。
+写入前校验：在真正 setQueryData/setState 前，二次校验 Actor/Intent/Target 仍匹配当前上下文；不匹配就丢弃/重取，不能“凑合写”。
+具体例子（对照）
+1) TanStack Query 列表/分页
+正确：queryKey 与返回数据都绑定 machineKey+projectId+bucket+filterKey(+cursor)；渲染/回写前校验这些字段一致。
+错误：useQueries 用 i * buckets + j 取结果，projects 列表一重排就把 A 项目的结果读成 B 项目的。
+2) SSE/Stream patch
+正确：patch 必须携带 agentId/machineKey + projectId + sessionId，并且只允许更新对应 identity 的 queryKey 容器。
+错误：只带 sessionId 就去更新“当前项目的 sessions 列表”（TargetIdentity 缺失）。
+3) UI 选择态（跨 await）
+正确：点击会话生成 intentSeq，await 返回后如果 intentSeq 已变化则不写入（IntentId 防过期回写）；并且写入的目标必须是同一个 agentId+projectId+sessionId。
+错误：await 回来直接 setSelectedSession(x)，同时依赖“当前 selectedProject”作为目标（隐式 current 指针）。
diff --git a/skills/prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7/agents/openai.yaml b/skills/prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7/agents/openai.yaml
new file mode 100644
index 0000000..2d1858c
--- /dev/null
+++ b/skills/prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "状态机正确性"
+  short_description: "状态机正确性"
+  default_prompt: "Use $prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-2d53cebd-afd4-4d35-94e9-74436da3148a/SKILL.md b/skills/prompt-2d53cebd-afd4-4d35-94e9-74436da3148a/SKILL.md
new file mode 100644
index 0000000..a8dad69
--- /dev/null
+++ b/skills/prompt-2d53cebd-afd4-4d35-94e9-74436da3148a/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "prompt-2d53cebd-afd4-4d35-94e9-74436da3148a"
+description: "关注收束"
+metadata:
+  short-description: "关注收束"
+---
+
+# 关注收束
+
+关注收束，如果当前实现可以复用一些东西，优先复用
diff --git a/skills/prompt-2d53cebd-afd4-4d35-94e9-74436da3148a/agents/openai.yaml b/skills/prompt-2d53cebd-afd4-4d35-94e9-74436da3148a/agents/openai.yaml
new file mode 100644
index 0000000..e95a2ae
--- /dev/null
+++ b/skills/prompt-2d53cebd-afd4-4d35-94e9-74436da3148a/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "关注收束"
+  short_description: "关注收束"
+  default_prompt: "Use $prompt-2d53cebd-afd4-4d35-94e9-74436da3148a."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-2eaed145-d789-4b27-93b9-8ea990830b3a/SKILL.md b/skills/prompt-2eaed145-d789-4b27-93b9-8ea990830b3a/SKILL.md
new file mode 100644
index 0000000..d381fe9
--- /dev/null
+++ b/skills/prompt-2eaed145-d789-4b27-93b9-8ea990830b3a/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "prompt-2eaed145-d789-4b27-93b9-8ea990830b3a"
+description: "提示词模板位置"
+metadata:
+  short-description: "提示词模板位置"
+---
+
+# 提示词模板位置
+
+dever项目所有提示词模板都应该放在独立的ts源码文件中，这样分离的更清楚，更好做提示词版本管理
diff --git a/skills/prompt-2eaed145-d789-4b27-93b9-8ea990830b3a/agents/openai.yaml b/skills/prompt-2eaed145-d789-4b27-93b9-8ea990830b3a/agents/openai.yaml
new file mode 100644
index 0000000..15fea0c
--- /dev/null
+++ b/skills/prompt-2eaed145-d789-4b27-93b9-8ea990830b3a/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "提示词模板位置"
+  short_description: "提示词模板位置"
+  default_prompt: "Use $prompt-2eaed145-d789-4b27-93b9-8ea990830b3a."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb/SKILL.md b/skills/prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb/SKILL.md
new file mode 100644
index 0000000..b8f8bf8
--- /dev/null
+++ b/skills/prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb"
+description: "长期主义"
+metadata:
+  short-description: "长期主义"
+---
+
+# 长期主义
+
+长期主义：解决一个问题时，要往上递归思考根因，想一下能不能做让未来更复利的事情；宁愿早期做 breaking change，也不要长期埋雷、只做简单的缝缝补补
diff --git a/skills/prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb/agents/openai.yaml b/skills/prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb/agents/openai.yaml
new file mode 100644
index 0000000..7237bab
--- /dev/null
+++ b/skills/prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "长期主义"
+  short_description: "长期主义"
+  default_prompt: "Use $prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca/SKILL.md b/skills/prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca/SKILL.md
new file mode 100644
index 0000000..b9417ca
--- /dev/null
+++ b/skills/prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca"
+description: "更改前需要用户 review"
+metadata:
+  short-description: "更改前需要用户 review"
+---
+
+# 更改前需要用户 review
+
+要执行内容改动，需要先输出计划，待用户 review 并回复后执行
diff --git a/skills/prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca/agents/openai.yaml b/skills/prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca/agents/openai.yaml
new file mode 100644
index 0000000..10dda57
--- /dev/null
+++ b/skills/prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "更改前需要用户 review"
+  short_description: "更改前需要用户 review"
+  default_prompt: "Use $prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8/SKILL.md b/skills/prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8/SKILL.md
new file mode 100644
index 0000000..c699703
--- /dev/null
+++ b/skills/prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8"
+description: "变更简洁重设计"
+metadata:
+  short-description: "变更简洁重设计"
+---
+
+# 变更简洁重设计
+
+变更不要像打补丁一样每次补一块地增量修改；要尽量考虑复用，必要时重新设计，以达到更简洁的结构。让变化比较少只是次要目标：我们宁愿做 breaking change，也不要留下丑陋冗余的代码结构
diff --git a/skills/prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8/agents/openai.yaml b/skills/prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8/agents/openai.yaml
new file mode 100644
index 0000000..291eaad
--- /dev/null
+++ b/skills/prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "变更简洁重设计"
+  short_description: "变更简洁重设计"
+  default_prompt: "Use $prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-615e1231-fe33-47f8-bf35-29fdf3766d98/SKILL.md b/skills/prompt-615e1231-fe33-47f8-bf35-29fdf3766d98/SKILL.md
new file mode 100644
index 0000000..63fbb03
--- /dev/null
+++ b/skills/prompt-615e1231-fe33-47f8-bf35-29fdf3766d98/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "prompt-615e1231-fe33-47f8-bf35-29fdf3766d98"
+description: "悬浮菜单组件复用"
+metadata:
+  short-description: "悬浮菜单组件复用"
+---
+
+# 悬浮菜单组件复用
+
+组件复用，悬浮菜单，我觉得是完全可以复用一个的，现在出现在 右键菜单，会话选择模型，等地方，其他的你也得找，得收束成一套原始组件，这样代码冗余就小很多；决策者请定位已有核心组件，并逐步把大家收束到一起
diff --git a/skills/prompt-615e1231-fe33-47f8-bf35-29fdf3766d98/agents/openai.yaml b/skills/prompt-615e1231-fe33-47f8-bf35-29fdf3766d98/agents/openai.yaml
new file mode 100644
index 0000000..aea2244
--- /dev/null
+++ b/skills/prompt-615e1231-fe33-47f8-bf35-29fdf3766d98/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "悬浮菜单组件复用"
+  short_description: "悬浮菜单组件复用"
+  default_prompt: "Use $prompt-615e1231-fe33-47f8-bf35-29fdf3766d98."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2/SKILL.md b/skills/prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2/SKILL.md
new file mode 100644
index 0000000..561a4f6
--- /dev/null
+++ b/skills/prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2"
+description: "dever_canvas仅做参考"
+metadata:
+  short-description: "dever_canvas仅做参考"
+---
+
+# dever_canvas仅做参考
+
+dever_canvas 那一套是给你参考的，不是拿来直接用的
diff --git a/skills/prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2/agents/openai.yaml b/skills/prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2/agents/openai.yaml
new file mode 100644
index 0000000..4b8c732
--- /dev/null
+++ b/skills/prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "dever_canvas仅做参考"
+  short_description: "dever_canvas仅做参考"
+  default_prompt: "Use $prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-8c5cc431-635c-4c94-9deb-a502e77160eb/SKILL.md b/skills/prompt-8c5cc431-635c-4c94-9deb-a502e77160eb/SKILL.md
new file mode 100644
index 0000000..f2b1ec4
--- /dev/null
+++ b/skills/prompt-8c5cc431-635c-4c94-9deb-a502e77160eb/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "prompt-8c5cc431-635c-4c94-9deb-a502e77160eb"
+description: "关注 dever_yew 开发"
+metadata:
+  short-description: "关注 dever_yew 开发"
+---
+
+# 关注 dever_yew 开发
+
+目前 dever 项目 使用和开发的 UI 界面是由 dever_yew 提供的，原 react 实现 dever_ui 目前是历史工程，不要改动，仅做参考
diff --git a/skills/prompt-8c5cc431-635c-4c94-9deb-a502e77160eb/agents/openai.yaml b/skills/prompt-8c5cc431-635c-4c94-9deb-a502e77160eb/agents/openai.yaml
new file mode 100644
index 0000000..8d3b586
--- /dev/null
+++ b/skills/prompt-8c5cc431-635c-4c94-9deb-a502e77160eb/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "关注 dever_yew 开发"
+  short_description: "关注 dever_yew 开发"
+  default_prompt: "Use $prompt-8c5cc431-635c-4c94-9deb-a502e77160eb."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c/SKILL.md b/skills/prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c/SKILL.md
new file mode 100644
index 0000000..6464ddb
--- /dev/null
+++ b/skills/prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c"
+description: "对话信息对接参考 codex 源码"
+metadata:
+  short-description: "对话信息对接参考 codex 源码"
+---
+
+# 对话信息对接参考 codex 源码
+
+对话信息对接参考 codex 源码：工程内 attic/codex 存放了 codex cli 的源码，对接 codex app-server 等提供的能力时，请参考该工程代码
diff --git a/skills/prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c/agents/openai.yaml b/skills/prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c/agents/openai.yaml
new file mode 100644
index 0000000..a8ca1af
--- /dev/null
+++ b/skills/prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "对话信息对接参考 codex 源码"
+  short_description: "对话信息对接参考 codex 源码"
+  default_prompt: "Use $prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-ac42abf9-6df8-4539-99c7-e402e905a03b/SKILL.md b/skills/prompt-ac42abf9-6df8-4539-99c7-e402e905a03b/SKILL.md
new file mode 100644
index 0000000..6f96d9c
--- /dev/null
+++ b/skills/prompt-ac42abf9-6df8-4539-99c7-e402e905a03b/SKILL.md
@@ -0,0 +1,15 @@
+---
+name: "prompt-ac42abf9-6df8-4539-99c7-e402e905a03b"
+description: "逻辑收束到agent"
+metadata:
+  short-description: "逻辑收束到agent"
+---
+
+# 逻辑收束到agent
+
+规约：Manager/Agent 边界（强制收束）
+
+前端只允许访问 manager：所有 API 必须走 /api/router/:agentId/...（local 也一样）。
+manager 只负责：请求转发（router）、agent registry、（未来）登录鉴权、（可选）静态资源托管；严禁在 manager 实现任何业务能力与持久化。
+大部分“后端能力 + 数据落盘”（projects/sessions/chat/fs/git/terminal/notifications/uiState/uiWorkspaces/uiDock/uiScroll 等）必须在 agent 内实现与持久化；manager 不得读写 .dever/agent_data.json 或任何业务数据文件。
+发现 manager 出现新增 /api/* 实现模块或 store/JSON 持久化代码，一律视为架构违规：要么迁到 agent，要么删除并改为转发。
diff --git a/skills/prompt-ac42abf9-6df8-4539-99c7-e402e905a03b/agents/openai.yaml b/skills/prompt-ac42abf9-6df8-4539-99c7-e402e905a03b/agents/openai.yaml
new file mode 100644
index 0000000..1d669e7
--- /dev/null
+++ b/skills/prompt-ac42abf9-6df8-4539-99c7-e402e905a03b/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "逻辑收束到agent"
+  short_description: "逻辑收束到agent"
+  default_prompt: "Use $prompt-ac42abf9-6df8-4539-99c7-e402e905a03b."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315/SKILL.md b/skills/prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315/SKILL.md
new file mode 100644
index 0000000..b0743b2
--- /dev/null
+++ b/skills/prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315"
+description: "mvp"
+metadata:
+  short-description: "mvp"
+---
+
+# mvp
+
+dever_doc/mvp/target.md  我移动到了这里，作为我们的工作目标，现在我们就开始工作，过程记录按照步骤记录在 mvp文件夹里就行，合理拆分成文件
diff --git a/skills/prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315/agents/openai.yaml b/skills/prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315/agents/openai.yaml
new file mode 100644
index 0000000..86a71f3
--- /dev/null
+++ b/skills/prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "mvp"
+  short_description: "mvp"
+  default_prompt: "Use $prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/prompt-f118ab91-390b-48e2-a962-3abe4d54211e/SKILL.md b/skills/prompt-f118ab91-390b-48e2-a962-3abe4d54211e/SKILL.md
new file mode 100644
index 0000000..8901c6e
--- /dev/null
+++ b/skills/prompt-f118ab91-390b-48e2-a962-3abe4d54211e/SKILL.md
@@ -0,0 +1,10 @@
+---
+name: "prompt-f118ab91-390b-48e2-a962-3abe4d54211e"
+description: "完美主义"
+metadata:
+  short-description: "完美主义"
+---
+
+# 完美主义
+
+完成之前，核对下有没有问题，设计上有没有不完善，尽量一次性做到完美；完美不代表复杂，完美是刚好在简单和复杂之间达到平衡
diff --git a/skills/prompt-f118ab91-390b-48e2-a962-3abe4d54211e/agents/openai.yaml b/skills/prompt-f118ab91-390b-48e2-a962-3abe4d54211e/agents/openai.yaml
new file mode 100644
index 0000000..9600439
--- /dev/null
+++ b/skills/prompt-f118ab91-390b-48e2-a962-3abe4d54211e/agents/openai.yaml
@@ -0,0 +1,6 @@
+interface:
+  display_name: "完美主义"
+  short_description: "完美主义"
+  default_prompt: "Use $prompt-f118ab91-390b-48e2-a962-3abe4d54211e."
+policy:
+  allow_implicit_invocation: false
diff --git a/skills/rs-skill-smoke-09e1daf7/SKILL.md b/skills/rs-skill-smoke-09e1daf7/SKILL.md
new file mode 100644
index 0000000..eb9b22f
--- /dev/null
+++ b/skills/rs-skill-smoke-09e1daf7/SKILL.md
@@ -0,0 +1,8 @@
+---
+name: rs-skill-smoke-09e1daf7
+description: Used by project_contract_smoke.
+---
+
+# RS Skill Smoke
+
+Used by project_contract_smoke.
diff --git a/skills/rs-skill-smoke-529efbc9/SKILL.md b/skills/rs-skill-smoke-529efbc9/SKILL.md
new file mode 100644
index 0000000..85c8a95
--- /dev/null
+++ b/skills/rs-skill-smoke-529efbc9/SKILL.md
@@ -0,0 +1,8 @@
+---
+name: rs-skill-smoke-529efbc9
+description: Used by project_contract_smoke.
+---
+
+# rs-skill-smoke-529efbc9
+
+Used by project_contract_smoke.
diff --git a/skills/rs-skill-smoke-cde1029f/SKILL.md b/skills/rs-skill-smoke-cde1029f/SKILL.md
new file mode 100644
index 0000000..4611722
--- /dev/null
+++ b/skills/rs-skill-smoke-cde1029f/SKILL.md
@@ -0,0 +1,8 @@
+---
+name: rs-skill-smoke-cde1029f
+description: Used by project_contract_smoke.
+---
+
+# RS Skill Smoke
+
+Used by project_contract_smoke.
diff --git a/skills/skill-creator/SKILL.md b/skills/skill-creator/SKILL.md
new file mode 100644
index 0000000..57f4e58
--- /dev/null
+++ b/skills/skill-creator/SKILL.md
@@ -0,0 +1,416 @@
+---
+name: skill-creator
+description: Guide for creating effective skills. This skill should be used when users want to create a new skill (or update an existing skill) that extends Codex's capabilities with specialized knowledge, workflows, or tool integrations.
+metadata:
+  short-description: Create or update a skill
+---
+
+# Skill Creator
+
+This skill provides guidance for creating effective skills.
+
+## About Skills
+
+Skills are modular, self-contained folders that extend Codex's capabilities by providing
+specialized knowledge, workflows, and tools. Think of them as "onboarding guides" for specific
+domains or tasks—they transform Codex from a general-purpose agent into a specialized agent
+equipped with procedural knowledge that no model can fully possess.
+
+### What Skills Provide
+
+1. Specialized workflows - Multi-step procedures for specific domains
+2. Tool integrations - Instructions for working with specific file formats or APIs
+3. Domain expertise - Company-specific knowledge, schemas, business logic
+4. Bundled resources - Scripts, references, and assets for complex and repetitive tasks
+
+## Core Principles
+
+### Concise is Key
+
+The context window is a public good. Skills share the context window with everything else Codex needs: system prompt, conversation history, other Skills' metadata, and the actual user request.
+
+**Default assumption: Codex is already very smart.** Only add context Codex doesn't already have. Challenge each piece of information: "Does Codex really need this explanation?" and "Does this paragraph justify its token cost?"
+
+Prefer concise examples over verbose explanations.
+
+### Set Appropriate Degrees of Freedom
+
+Match the level of specificity to the task's fragility and variability:
+
+**High freedom (text-based instructions)**: Use when multiple approaches are valid, decisions depend on context, or heuristics guide the approach.
+
+**Medium freedom (pseudocode or scripts with parameters)**: Use when a preferred pattern exists, some variation is acceptable, or configuration affects behavior.
+
+**Low freedom (specific scripts, few parameters)**: Use when operations are fragile and error-prone, consistency is critical, or a specific sequence must be followed.
+
+Think of Codex as exploring a path: a narrow bridge with cliffs needs specific guardrails (low freedom), while an open field allows many routes (high freedom).
+
+### Protect Validation Integrity
+
+You may use subagents during iteration to validate whether a skill works on realistic tasks or whether a suspected problem is real. This is most useful when you want an independent pass on the skill's behavior, outputs, or failure modes after a revision. Only do this when it is possible to start new subagents.
+
+When using subagents for validation, treat that as an evaluation surface. The goal is to learn whether the skill generalizes, not whether another agent can reconstruct the answer from leaked context.
+
+Prefer raw artifacts such as example prompts, outputs, diffs, logs, or traces. Give the minimum task-local context needed to perform the validation. Avoid passing the intended answer, suspected bug, intended fix, or your prior conclusions unless the validation explicitly requires them.
+
+### Anatomy of a Skill
+
+Every skill consists of a required SKILL.md file and optional bundled resources:
+
+```
+skill-name/
+├── SKILL.md (required)
+│   ├── YAML frontmatter metadata (required)
+│   │   ├── name: (required)
+│   │   └── description: (required)
+│   └── Markdown instructions (required)
+├── agents/ (recommended)
+│   └── openai.yaml - UI metadata for skill lists and chips
+└── Bundled Resources (optional)
+    ├── scripts/          - Executable code (Python/Bash/etc.)
+    ├── references/       - Documentation intended to be loaded into context as needed
+    └── assets/           - Files used in output (templates, icons, fonts, etc.)
+```
+
+#### SKILL.md (required)
+
+Every SKILL.md consists of:
+
+- **Frontmatter** (YAML): Contains `name` and `description` fields. These are the only fields that Codex reads to determine when the skill gets used, so it is very important to describe clearly and comprehensively what the skill is and when it should be used.
+- **Body** (Markdown): Instructions and guidance for using the skill. Only loaded AFTER the skill triggers (if at all).
+
+#### Agents metadata (recommended)
+
+- UI-facing metadata for skill lists and chips
+- Read references/openai_yaml.md before generating values and follow its descriptions and constraints
+- Create: human-facing `display_name`, `short_description`, and `default_prompt` by reading the skill
+- Generate deterministically by passing the values as `--interface key=value` to `scripts/generate_openai_yaml.py` or `scripts/init_skill.py`
+- On updates: validate `agents/openai.yaml` still matches SKILL.md; regenerate if stale
+- Only include other optional interface fields (icons, brand color) if explicitly provided
+- See references/openai_yaml.md for field definitions and examples
+
+#### Bundled Resources (optional)
+
+##### Scripts (`scripts/`)
+
+Executable code (Python/Bash/etc.) for tasks that require deterministic reliability or are repeatedly rewritten.
+
+- **When to include**: When the same code is being rewritten repeatedly or deterministic reliability is needed
+- **Example**: `scripts/rotate_pdf.py` for PDF rotation tasks
+- **Benefits**: Token efficient, deterministic, may be executed without loading into context
+- **Note**: Scripts may still need to be read by Codex for patching or environment-specific adjustments
+
+##### References (`references/`)
+
+Documentation and reference material intended to be loaded as needed into context to inform Codex's process and thinking.
+
+- **When to include**: For documentation that Codex should reference while working
+- **Examples**: `references/finance.md` for financial schemas, `references/mnda.md` for company NDA template, `references/policies.md` for company policies, `references/api_docs.md` for API specifications
+- **Use cases**: Database schemas, API documentation, domain knowledge, company policies, detailed workflow guides
+- **Benefits**: Keeps SKILL.md lean, loaded only when Codex determines it's needed
+- **Best practice**: If files are large (>10k words), include grep search patterns in SKILL.md
+- **Avoid duplication**: Information should live in either SKILL.md or references files, not both. Prefer references files for detailed information unless it's truly core to the skill—this keeps SKILL.md lean while making information discoverable without hogging the context window. Keep only essential procedural instructions and workflow guidance in SKILL.md; move detailed reference material, schemas, and examples to references files.
+
+##### Assets (`assets/`)
+
+Files not intended to be loaded into context, but rather used within the output Codex produces.
+
+- **When to include**: When the skill needs files that will be used in the final output
+- **Examples**: `assets/logo.png` for brand assets, `assets/slides.pptx` for PowerPoint templates, `assets/frontend-template/` for HTML/React boilerplate, `assets/font.ttf` for typography
+- **Use cases**: Templates, images, icons, boilerplate code, fonts, sample documents that get copied or modified
+- **Benefits**: Separates output resources from documentation, enables Codex to use files without loading them into context
+
+#### What Not to Include in a Skill
+
+A skill should only contain essential files that directly support its functionality. Do NOT create extraneous documentation or auxiliary files, including:
+
+- README.md
+- INSTALLATION_GUIDE.md
+- QUICK_REFERENCE.md
+- CHANGELOG.md
+- etc.
+
+The skill should only contain the information needed for an AI agent to do the job at hand. It should not contain auxiliary context about the process that went into creating it, setup and testing procedures, user-facing documentation, etc. Creating additional documentation files just adds clutter and confusion.
+
+### Progressive Disclosure Design Principle
+
+Skills use a three-level loading system to manage context efficiently:
+
+1. **Metadata (name + description)** - Always in context (~100 words)
+2. **SKILL.md body** - When skill triggers (<5k words)
+3. **Bundled resources** - As needed by Codex (Unlimited because scripts can be executed without reading into context window)
+
+#### Progressive Disclosure Patterns
+
+Keep SKILL.md body to the essentials and under 500 lines to minimize context bloat. Split content into separate files when approaching this limit. When splitting out content into other files, it is very important to reference them from SKILL.md and describe clearly when to read them, to ensure the reader of the skill knows they exist and when to use them.
+
+**Key principle:** When a skill supports multiple variations, frameworks, or options, keep only the core workflow and selection guidance in SKILL.md. Move variant-specific details (patterns, examples, configuration) into separate reference files.
+
+**Pattern 1: High-level guide with references**
+
+```markdown
+# PDF Processing
+
+## Quick start
+
+Extract text with pdfplumber:
+[code example]
+
+## Advanced features
+
+- **Form filling**: See [FORMS.md](FORMS.md) for complete guide
+- **API reference**: See [REFERENCE.md](REFERENCE.md) for all methods
+- **Examples**: See [EXAMPLES.md](EXAMPLES.md) for common patterns
+```
+
+Codex loads FORMS.md, REFERENCE.md, or EXAMPLES.md only when needed.
+
+**Pattern 2: Domain-specific organization**
+
+For Skills with multiple domains, organize content by domain to avoid loading irrelevant context:
+
+```
+bigquery-skill/
+├── SKILL.md (overview and navigation)
+└── reference/
+    ├── finance.md (revenue, billing metrics)
+    ├── sales.md (opportunities, pipeline)
+    ├── product.md (API usage, features)
+    └── marketing.md (campaigns, attribution)
+```
+
+When a user asks about sales metrics, Codex only reads sales.md.
+
+Similarly, for skills supporting multiple frameworks or variants, organize by variant:
+
+```
+cloud-deploy/
+├── SKILL.md (workflow + provider selection)
+└── references/
+    ├── aws.md (AWS deployment patterns)
+    ├── gcp.md (GCP deployment patterns)
+    └── azure.md (Azure deployment patterns)
+```
+
+When the user chooses AWS, Codex only reads aws.md.
+
+**Pattern 3: Conditional details**
+
+Show basic content, link to advanced content:
+
+```markdown
+# DOCX Processing
+
+## Creating documents
+
+Use docx-js for new documents. See [DOCX-JS.md](DOCX-JS.md).
+
+## Editing documents
+
+For simple edits, modify the XML directly.
+
+**For tracked changes**: See [REDLINING.md](REDLINING.md)
+**For OOXML details**: See [OOXML.md](OOXML.md)
+```
+
+Codex reads REDLINING.md or OOXML.md only when the user needs those features.
+
+**Important guidelines:**
+
+- **Avoid deeply nested references** - Keep references one level deep from SKILL.md. All reference files should link directly from SKILL.md.
+- **Structure longer reference files** - For files longer than 100 lines, include a table of contents at the top so Codex can see the full scope when previewing.
+
+## Skill Creation Process
+
+Skill creation involves these steps:
+
+1. Understand the skill with concrete examples
+2. Plan reusable skill contents (scripts, references, assets)
+3. Initialize the skill (run init_skill.py)
+4. Edit the skill (implement resources and write SKILL.md)
+5. Validate the skill (run quick_validate.py)
+6. Iterate based on real usage and forward-test complex skills.
+
+Follow these steps in order, skipping only if there is a clear reason why they are not applicable.
+
+### Skill Naming
+
+- Use lowercase letters, digits, and hyphens only; normalize user-provided titles to hyphen-case (e.g., "Plan Mode" -> `plan-mode`).
+- When generating names, generate a name under 64 characters (letters, digits, hyphens).
+- Prefer short, verb-led phrases that describe the action.
+- Namespace by tool when it improves clarity or triggering (e.g., `gh-address-comments`, `linear-address-issue`).
+- Name the skill folder exactly after the skill name.
+
+### Step 1: Understanding the Skill with Concrete Examples
+
+Skip this step only when the skill's usage patterns are already clearly understood. It remains valuable even when working with an existing skill.
+
+To create an effective skill, clearly understand concrete examples of how the skill will be used. This understanding can come from either direct user examples or generated examples that are validated with user feedback.
+
+For example, when building an image-editor skill, relevant questions include:
+
+- "What functionality should the image-editor skill support? Editing, rotating, anything else?"
+- "Can you give some examples of how this skill would be used?"
+- "I can imagine users asking for things like 'Remove the red-eye from this image' or 'Rotate this image'. Are there other ways you imagine this skill being used?"
+- "What would a user say that should trigger this skill?"
+- "Where should I create this skill? If you do not have a preference, I will place it in `$CODEX_HOME/skills` (or `~/.codex/skills` when `CODEX_HOME` is unset) so Codex can discover it automatically."
+
+To avoid overwhelming users, avoid asking too many questions in a single message. Start with the most important questions and follow up as needed for better effectiveness.
+
+Conclude this step when there is a clear sense of the functionality the skill should support.
+
+### Step 2: Planning the Reusable Skill Contents
+
+To turn concrete examples into an effective skill, analyze each example by:
+
+1. Considering how to execute on the example from scratch
+2. Identifying what scripts, references, and assets would be helpful when executing these workflows repeatedly
+
+Example: When building a `pdf-editor` skill to handle queries like "Help me rotate this PDF," the analysis shows:
+
+1. Rotating a PDF requires re-writing the same code each time
+2. A `scripts/rotate_pdf.py` script would be helpful to store in the skill
+
+Example: When designing a `frontend-webapp-builder` skill for queries like "Build me a todo app" or "Build me a dashboard to track my steps," the analysis shows:
+
+1. Writing a frontend webapp requires the same boilerplate HTML/React each time
+2. An `assets/hello-world/` template containing the boilerplate HTML/React project files would be helpful to store in the skill
+
+Example: When building a `big-query` skill to handle queries like "How many users have logged in today?" the analysis shows:
+
+1. Querying BigQuery requires re-discovering the table schemas and relationships each time
+2. A `references/schema.md` file documenting the table schemas would be helpful to store in the skill
+
+To establish the skill's contents, analyze each concrete example to create a list of the reusable resources to include: scripts, references, and assets.
+
+### Step 3: Initializing the Skill
+
+At this point, it is time to actually create the skill.
+
+Skip this step only if the skill being developed already exists. In this case, continue to the next step.
+
+Before running `init_skill.py`, ask where the user wants the skill created. If they do not specify a location, default to `$CODEX_HOME/skills`; when `CODEX_HOME` is unset, fall back to `~/.codex/skills` so the skill is auto-discovered.
+
+When creating a new skill from scratch, always run the `init_skill.py` script. The script conveniently generates a new template skill directory that automatically includes everything a skill requires, making the skill creation process much more efficient and reliable.
+
+Usage:
+
+```bash
+scripts/init_skill.py <skill-name> --path <output-directory> [--resources scripts,references,assets] [--examples]
+```
+
+Examples:
+
+```bash
+scripts/init_skill.py my-skill --path "${CODEX_HOME:-$HOME/.codex}/skills"
+scripts/init_skill.py my-skill --path "${CODEX_HOME:-$HOME/.codex}/skills" --resources scripts,references
+scripts/init_skill.py my-skill --path ~/work/skills --resources scripts --examples
+```
+
+The script:
+
+- Creates the skill directory at the specified path
+- Generates a SKILL.md template with proper frontmatter and TODO placeholders
+- Creates `agents/openai.yaml` using agent-generated `display_name`, `short_description`, and `default_prompt` passed via `--interface key=value`
+- Optionally creates resource directories based on `--resources`
+- Optionally adds example files when `--examples` is set
+
+After initialization, customize the SKILL.md and add resources as needed. If you used `--examples`, replace or delete placeholder files.
+
+Generate `display_name`, `short_description`, and `default_prompt` by reading the skill, then pass them as `--interface key=value` to `init_skill.py` or regenerate with:
+
+```bash
+scripts/generate_openai_yaml.py <path/to/skill-folder> --interface key=value
+```
+
+Only include other optional interface fields when the user explicitly provides them. For full field descriptions and examples, see references/openai_yaml.md.
+
+### Step 4: Edit the Skill
+
+When editing the (newly-generated or existing) skill, remember that the skill is being created for another instance of Codex to use. Include information that would be beneficial and non-obvious to Codex. Consider what procedural knowledge, domain-specific details, or reusable assets would help another Codex instance execute these tasks more effectively.
+
+After substantial revisions, or if the skill is particularly tricky, you should use subagents to forward-test the skill on realistic tasks or artifacts. When doing so, pass the artifact under validation rather than your diagnosis of what is wrong, and keep the prompt generic enough that success depends on transferable reasoning rather than hidden ground truth.
+
+#### Start with Reusable Skill Contents
+
+To begin implementation, start with the reusable resources identified above: `scripts/`, `references/`, and `assets/` files. Note that this step may require user input. For example, when implementing a `brand-guidelines` skill, the user may need to provide brand assets or templates to store in `assets/`, or documentation to store in `references/`.
+
+Added scripts must be tested by actually running them to ensure there are no bugs and that the output matches what is expected. If there are many similar scripts, only a representative sample needs to be tested to ensure confidence that they all work while balancing time to completion.
+
+If you used `--examples`, delete any placeholder files that are not needed for the skill. Only create resource directories that are actually required.
+
+#### Update SKILL.md
+
+**Writing Guidelines:** Always use imperative/infinitive form.
+
+##### Frontmatter
+
+Write the YAML frontmatter with `name` and `description`:
+
+- `name`: The skill name
+- `description`: This is the primary triggering mechanism for your skill, and helps Codex understand when to use the skill.
+  - Include both what the Skill does and specific triggers/contexts for when to use it.
+  - Include all "when to use" information here, not in the body. The body is only loaded after triggering, so "When to Use This Skill" sections in the body are not helpful to Codex.
+  - Example description for a `docx` skill: "Comprehensive document creation, editing, and analysis with support for tracked changes, comments, formatting preservation, and text extraction. Use when Codex needs to work with professional documents (.docx files) for: (1) Creating new documents, (2) Modifying or editing content, (3) Working with tracked changes, (4) Adding comments, or any other document tasks"
+
+Do not include any other fields in YAML frontmatter.
+
+##### Body
+
+Write instructions for using the skill and its bundled resources.
+
+### Step 5: Validate the Skill
+
+Once development of the skill is complete, validate the skill folder to catch basic issues early:
+
+```bash
+scripts/quick_validate.py <path/to/skill-folder>
+```
+
+The validation script checks YAML frontmatter format, required fields, and naming rules. If validation fails, fix the reported issues and run the command again.
+
+### Step 6: Iterate
+
+After testing the skill, you may detect the skill is complex enough that it requires forward-testing; or users may request improvements.
+
+User testing often happens right after using the skill, with fresh context of how the skill performed.
+
+**Forward-testing and iteration workflow:**
+
+1. Use the skill on real tasks
+2. Notice struggles or inefficiencies
+3. Identify how SKILL.md or bundled resources should be updated
+4. Implement changes and test again
+5. Forward-test if it is reasonable and appropriate
+
+## Forward-testing
+
+To forward-test, launch subagents as a way to stress test the skill with minimal context.
+Subagents should *not* know that they are being asked to test the skill.  They should be treated as
+an agent asked to perform a task by the user.  Prompts to subagents should look like:
+  `Use $skill-x at /path/to/skill-x to solve problem y`
+Not:
+  `Review the skill at /path/to/skill-x; pretend a user asks you to...`
+
+Decision rule for forward-testing:
+  - Err on the side of forward-testing
+  - Ask for approval if you think there's a risk that forward-testing would:
+    * take a long time,
+    * require additional approvals from the user, or
+    * modify live production systems
+
+  In these cases, show the user your proposed prompt and request (1) a yes/no decision, and
+  (2) any suggested modifications.
+
+Considerations when forward-testing:
+   - use fresh threads for independent passes
+   - pass the skill and a request phrased the way a user would
+   - pass raw artifacts, not your conclusions
+   - avoid showing expected answers or intended fixes
+   - rebuild context from source artifacts after each iteration
+   - review the subagent's output and reasoning and emitted artifacts
+   - avoid leaving artifacts the agent can find on disk between iterations;
+     clean up subagents' artifacts to avoid additional contamination.
+
+If forward-testing only succeeds when subagents see leaked context, tighten the skill or the
+forward-testing setup before trusting the result.
diff --git a/skills/skill-creator/agents/openai.yaml b/skills/skill-creator/agents/openai.yaml
new file mode 100644
index 0000000..3095c60
--- /dev/null
+++ b/skills/skill-creator/agents/openai.yaml
@@ -0,0 +1,5 @@
+interface:
+  display_name: "Skill Creator"
+  short_description: "Create or update a skill"
+  icon_small: "./assets/skill-creator-small.svg"
+  icon_large: "./assets/skill-creator.png"
diff --git a/skills/skill-creator/assets/skill-creator-small.svg b/skills/skill-creator/assets/skill-creator-small.svg
new file mode 100644
index 0000000..c6e4f67
--- /dev/null
+++ b/skills/skill-creator/assets/skill-creator-small.svg
@@ -0,0 +1,3 @@
+<svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" fill="currentColor" viewBox="0 0 20 20">
+  <path fill="#0D0D0D" d="M12.03 4.113a3.612 3.612 0 0 1 5.108 5.108l-6.292 6.29c-.324.324-.56.561-.791.752l-.235.176c-.205.14-.422.261-.65.36l-.229.093a4.136 4.136 0 0 1-.586.16l-.764.134-2.394.4c-.142.024-.294.05-.423.06-.098.007-.232.01-.378-.026l-.149-.05a1.081 1.081 0 0 1-.521-.474l-.046-.093a1.104 1.104 0 0 1-.075-.527c.01-.129.035-.28.06-.422l.398-2.394c.1-.602.162-.987.295-1.35l.093-.23c.1-.228.22-.445.36-.65l.176-.235c.19-.232.428-.467.751-.79l6.292-6.292Zm-5.35 7.232c-.35.35-.534.535-.66.688l-.11.147a2.67 2.67 0 0 0-.24.433l-.062.154c-.08.22-.124.462-.232 1.112l-.398 2.394-.001.001h.003l2.393-.399.717-.126a2.63 2.63 0 0 0 .394-.105l.154-.063a2.65 2.65 0 0 0 .433-.24l.147-.11c.153-.126.339-.31.688-.66l4.988-4.988-3.227-3.226-4.987 4.988Zm9.517-6.291a2.281 2.281 0 0 0-3.225 0l-.364.362 3.226 3.227.363-.364c.89-.89.89-2.334 0-3.225ZM4.583 1.783a.3.3 0 0 1 .294.241c.117.585.347 1.092.707 1.48.357.385.859.668 1.549.783a.3.3 0 0 1 0 .592c-.69.115-1.192.398-1.549.783-.315.34-.53.77-.657 1.265l-.05.215a.3.3 0 0 1-.588 0c-.117-.585-.347-1.092-.707-1.48-.357-.384-.859-.668-1.549-.783a.3.3 0 0 1 0-.592c.69-.115 1.192-.398 1.549-.783.36-.388.59-.895.707-1.48l.015-.05a.3.3 0 0 1 .279-.19Z"/>
+</svg>
diff --git a/skills/skill-creator/assets/skill-creator.png b/skills/skill-creator/assets/skill-creator.png
new file mode 100644
index 0000000000000000000000000000000000000000..4f3d6d82fa78fbdce97af3c17f6a25c683aa3290
GIT binary patch
literal 1563
zcmV+$2ITpPP)<h;3K|Lk000e1NJLTq003kF003kN1^@s6aN?Cz00009a7bBm000XU
z000XU0RWnu7ytkO0drDELIAGL9O(c600d`2O+f$vv5yP<VFdsH1+Ym(K~#7F?cH5#
z99100@!y%5ZPPYs)~0PjXk@GQA{H?sLh4NusZb$>1#i4F!Dtb@FnH%p6OalPi4TDy
zMcTdqNqhk%K`*Qbx>_X{K4hvjHd<=hH0fq{Gsiib9J_g*IrFfyGygA?&1Rp<e)!Lv
z&F&-sMNt$*Q4~c{6h%=KMNyPO4AlSe^Y3O*N_Bv<bom=~{{V|kChCnG>l>Iw2qhkb
ze|)YB#{A1DHe~H{=}oVwFPPA*37~O^y*^+fpb`thKY1$)zGE1LrVQMsu}jdkKwuIF
z!Y>Y|aer<UrQKcdlAZ^Q{2)91&JcVoQ6T*Ma0W$d-2N&9zp9%V!;uSptb5j%eT;^L
z6bObW-<-wIr$^yai2w-<LzX|##Yf)12p@_)$mHZ?=J%(Mjaw-rgCMhbFaPM=oA6ky
z_aOp9(=>ZBkl8tR2W{Vc1+7>_fXyPMKjmfh7264^#1Q8f8yfM)Gsj@1QV6g#maH@I
zP%I~8Ek<RbOv;k}5F1c?Wgoi<*$P7x%A{x|<$X!4K(@n>1&*Sz<4`O%n=C#xm?`ka
z@f*eCnG*Imx=o;)FU8GPEG9%?fE(jGa4*wlOu)drquT{LDa8yFs(BEJAz$>R*gPVE
zqU#+{sHQ>IV#p$cqEO9(Y=$ALItt^-S@v#+A*(J*LO`5i$f|}?GICI;ra;_c$ihcq
zX6#?7t76DPMwx(OH38xkLlzp!uBppVEb<_JVaNhUVVGdAj!ZzYNQ3x|AuFRSya%H+
z?dbZhQ0jjifQKRr5)?-HzW@Ca#_cg2y7h{`C>$TMzDr80D_JB#g2uq?7v-;0HimyF
z%!H*6!ecrjR#+G^-I_yvejNAeo`a<|Y<nL|JL@pN{{Z&hoCdS3mG9aZOIo+R)V&Fh
zMG7Qr44F3+E-_5_P-H-=g&|WxS=iTPHeUbJHw;lE-k_>BMrB2#6*u;OYX9V;b-SyY
zmSuIfx3`<{v8qo<lrTgNCnXS!^5dh5MGZr?4N71b<;O;qiYkU|6O=$P%8!dG6m<;Q
z8kE2>M4|80YXzgSg7L69b@21RF+`z))FOtR$uxAc?!1W*3JruXoD~WPVK^^v5W;X*
zpdf_dzQ8~TL#;qS2tz&JK?uWJzP@9~zdK179`pAt+{P25gyAjUK={;^Ves}2U?==6
zNf;tu_96V2E4^TR<-qwx`(A%qKJ|LP3BwTiGa(EWhXUIZ!jHo1q$CkT<Qb$q9qaZR
z-cXW?A@V*UtEQteHIyV{h&+Mtsqv1jS5@v%l8zzrHX()S?Dki3hC&$2c>~d#9UdUR
zH40%o$QuZQi$i}mMj?#VDT6HUKah5JtJNrku|D+)DV1De$d*y~ogWBegVa9;v@4x`
z{E^m^dv>Y3)-b^IHelgvz;bpZlf!BnL!=DS*wpgU)oZ_Yc0Tbalu)#Ku-%=0qSQQw
zNPQo|`ICR&zKgd<K7%+_%4h~_Ia@yUSS&C^${>uf@(L>gD6zp1DQ&W{*=*XftU-Bx
z{{AAaUi%GI*nGtbL!>kzrBZ3#>yIi-O6)L1N+5D`wYCsZVu>MA1<7o7SqLbx#Skfh
zh!xgWmj{RvYYdUEo2<$LK#4tu$n`2~?FwtF{91jn{I@yA@4gUs43X;z*=U8eRh}nB
zZ@!E}7h*pdGS?vX=F0UC71dDKEG$029y`&?4tIz02f3n9Xus>kIZ7E~2%2`79eMr(
zBrMmT%M$w#UDy9A6bf}v=-|G+IQzzn<<ph_!YmliS%q8QYkJd|jWB@(r}RO&{{H^K
znVFe0E^lVq|8n+{`TD76Tg=x^9nGP>BbTJjk&~1^x!BXwGidKmHbOD6^2FPh=j>?`
zzdy<x8yll1-a(!|N-8#Aa@A!RhIqp1iKi%vq9}@@D2k#eilV55^dCV<^wOW~YLEZ`
N002ovPDHLkV1k6v&87eV

literal 0
HcmV?d00001

diff --git a/skills/skill-creator/license.txt b/skills/skill-creator/license.txt
new file mode 100644
index 0000000..d645695
--- /dev/null
+++ b/skills/skill-creator/license.txt
@@ -0,0 +1,202 @@
+
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+   1. Definitions.
+
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+
+      (a) You must give any other recipients of the Work or
+          Derivative Works a copy of this License; and
+
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work,
+          excluding those notices that do not pertain to any part of
+          the Derivative Works; and
+
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+
+   END OF TERMS AND CONDITIONS
+
+   APPENDIX: How to apply the Apache License to your work.
+
+      To apply the Apache License to your work, attach the following
+      boilerplate notice, with the fields enclosed by brackets "[]"
+      replaced with your own identifying information. (Don't include
+      the brackets!)  The text should be enclosed in the appropriate
+      comment syntax for the file format. We also recommend that a
+      file or class name and description of purpose be included on the
+      same "printed page" as the copyright notice for easier
+      identification within third-party archives.
+
+   Copyright [yyyy] [name of copyright owner]
+
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+
+       http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
diff --git a/skills/skill-creator/references/openai_yaml.md b/skills/skill-creator/references/openai_yaml.md
new file mode 100644
index 0000000..90f9e8e
--- /dev/null
+++ b/skills/skill-creator/references/openai_yaml.md
@@ -0,0 +1,49 @@
+# openai.yaml fields (full example + descriptions)
+
+`agents/openai.yaml` is an extended, product-specific config intended for the machine/harness to read, not the agent. Other product-specific config can also live in the `agents/` folder.
+
+## Full example
+
+```yaml
+interface:
+  display_name: "Optional user-facing name"
+  short_description: "Optional user-facing description"
+  icon_small: "./assets/small-400px.png"
+  icon_large: "./assets/large-logo.svg"
+  brand_color: "#3B82F6"
+  default_prompt: "Optional surrounding prompt to use the skill with"
+
+dependencies:
+  tools:
+    - type: "mcp"
+      value: "github"
+      description: "GitHub MCP server"
+      transport: "streamable_http"
+      url: "https://api.githubcopilot.com/mcp/"
+
+policy:
+  allow_implicit_invocation: true
+```
+
+## Field descriptions and constraints
+
+Top-level constraints:
+
+- Quote all string values.
+- Keep keys unquoted.
+- For `interface.default_prompt`: generate a helpful, short (typically 1 sentence) example starting prompt based on the skill. It must explicitly mention the skill as `$skill-name` (e.g., "Use $skill-name-here to draft a concise weekly status update.").
+
+- `interface.display_name`: Human-facing title shown in UI skill lists and chips.
+- `interface.short_description`: Human-facing short UI blurb (25–64 chars) for quick scanning.
+- `interface.icon_small`: Path to a small icon asset (relative to skill dir). Default to `./assets/` and place icons in the skill's `assets/` folder.
+- `interface.icon_large`: Path to a larger logo asset (relative to skill dir). Default to `./assets/` and place icons in the skill's `assets/` folder.
+- `interface.brand_color`: Hex color used for UI accents (e.g., badges).
+- `interface.default_prompt`: Default prompt snippet inserted when invoking the skill.
+- `dependencies.tools[].type`: Dependency category. Only `mcp` is supported for now.
+- `dependencies.tools[].value`: Identifier of the tool or dependency.
+- `dependencies.tools[].description`: Human-readable explanation of the dependency.
+- `dependencies.tools[].transport`: Connection type when `type` is `mcp`.
+- `dependencies.tools[].url`: MCP server URL when `type` is `mcp`.
+- `policy.allow_implicit_invocation`: When false, the skill is not injected into
+  the model context by default, but can still be invoked explicitly via `$skill`.
+  Defaults to true.
diff --git a/skills/skill-creator/scripts/generate_openai_yaml.py b/skills/skill-creator/scripts/generate_openai_yaml.py
new file mode 100644
index 0000000..3fd7405
--- /dev/null
+++ b/skills/skill-creator/scripts/generate_openai_yaml.py
@@ -0,0 +1,226 @@
+#!/usr/bin/env python3
+"""
+OpenAI YAML Generator - Creates agents/openai.yaml for a skill folder.
+
+Usage:
+    generate_openai_yaml.py <skill_dir> [--name <skill_name>] [--interface key=value]
+"""
+
+import argparse
+import re
+import sys
+from pathlib import Path
+
+ACRONYMS = {  # Words that format_display_name emits fully upper-cased.
+    "GH",
+    "MCP",
+    "API",
+    "CI",
+    "CLI",
+    "LLM",
+    "PDF",
+    "PR",
+    "UI",
+    "URL",
+    "SQL",
+}
+
+BRANDS = {  # Lower-cased word -> canonical brand casing, looked up by format_display_name.
+    "openai": "OpenAI",
+    "openapi": "OpenAPI",
+    "github": "GitHub",
+    "pagerduty": "PagerDuty",
+    "datadog": "DataDog",
+    "sqlite": "SQLite",
+    "fastapi": "FastAPI",
+}
+
+SMALL_WORDS = {"and", "or", "to", "up", "with"}  # Kept lower-case by format_display_name unless first.
+
+ALLOWED_INTERFACE_KEYS = {  # The only keys parse_interface_overrides accepts.
+    "display_name",
+    "short_description",
+    "icon_small",
+    "icon_large",
+    "brand_color",
+    "default_prompt",
+}
+
+
+def yaml_quote(value):  # Return value wrapped in double quotes, escaping backslash, double quote and newline.
+    escaped = value.replace("\\", "\\\\").replace('"', '\\"').replace("\n", "\\n")  # backslash is escaped first so the later escapes are not doubled
+    return f'"{escaped}"'
+
+
+def format_display_name(skill_name):  # Turn a hyphen-separated skill name into a space-separated display name.
+    words = [word for word in skill_name.split("-") if word]  # drop empty parts left by leading/trailing/double hyphens
+    formatted = []
+    for index, word in enumerate(words):
+        lower = word.lower()
+        upper = word.upper()
+        if upper in ACRONYMS:  # known acronym: force upper case
+            formatted.append(upper)
+            continue
+        if lower in BRANDS:  # known brand: use its canonical casing
+            formatted.append(BRANDS[lower])
+            continue
+        if index > 0 and lower in SMALL_WORDS:  # small words stay lower-case except in first position
+            formatted.append(lower)
+            continue
+        formatted.append(word.capitalize())
+    return " ".join(formatted)
+
+
+def generate_short_description(display_name):  # Build a default blurb, steering its length toward 25-64 characters.
+    description = f"Help with {display_name} tasks"
+
+    if len(description) < 25:  # too short: try a longer phrasing
+        description = f"Help with {display_name} tasks and workflows"
+    if len(description) < 25:  # NOTE(review): the phrasing above is already >= 30 characters, so this looks unreachable
+        description = f"Help with {display_name} tasks with guidance"
+
+    if len(description) > 64:  # too long: fall through progressively shorter phrasings
+        description = f"Help with {display_name}"
+    if len(description) > 64:
+        description = f"{display_name} helper"
+    if len(description) > 64:
+        description = f"{display_name} tools"
+    if len(description) > 64:  # still too long: truncate the name so that name + suffix fits in 64
+        suffix = " helper"
+        max_name_length = 64 - len(suffix)
+        trimmed = display_name[:max_name_length].rstrip()
+        description = f"{trimmed}{suffix}"
+    if len(description) > 64:
+        description = description[:64].rstrip()
+
+    if len(description) < 25:  # final lower-bound guard after the shortening steps
+        description = f"{description} workflows"
+        if len(description) > 64:
+            description = description[:64].rstrip()
+
+    return description
+
+
+def read_frontmatter_name(skill_dir):
+    skill_md = Path(skill_dir) / "SKILL.md"
+    if not skill_md.exists():
+        print(f"[ERROR] SKILL.md not found in {skill_dir}")
+        return None
+    content = skill_md.read_text()
+    match = re.match(r"^---\n(.*?)\n---", content, re.DOTALL)
+    if not match:
+        print("[ERROR] Invalid SKILL.md frontmatter format.")
+        return None
+    frontmatter_text = match.group(1)
+
+    import yaml
+
+    try:
+        frontmatter = yaml.safe_load(frontmatter_text)
+    except yaml.YAMLError as exc:
+        print(f"[ERROR] Invalid YAML frontmatter: {exc}")
+        return None
+    if not isinstance(frontmatter, dict):
+        print("[ERROR] Frontmatter must be a YAML dictionary.")
+        return None
+    name = frontmatter.get("name", "")
+    if not isinstance(name, str) or not name.strip():
+        print("[ERROR] Frontmatter 'name' is missing or invalid.")
+        return None
+    return name.strip()
+
+
+def parse_interface_overrides(raw_overrides):  # Parse key=value strings into (overrides, optional_order); (None, None) on the first invalid item.
+    overrides = {}
+    optional_order = []  # keys other than display_name/short_description, in first-seen order
+    for item in raw_overrides:
+        if "=" not in item:
+            print(f"[ERROR] Invalid interface override '{item}'. Use key=value.")
+            return None, None
+        key, value = item.split("=", 1)  # split on the first '=' only, so values may contain '='
+        key = key.strip()
+        value = value.strip()
+        if not key:
+            print(f"[ERROR] Invalid interface override '{item}'. Key is empty.")
+            return None, None
+        if key not in ALLOWED_INTERFACE_KEYS:
+            allowed = ", ".join(sorted(ALLOWED_INTERFACE_KEYS))
+            print(f"[ERROR] Unknown interface field '{key}'. Allowed: {allowed}")
+            return None, None
+        overrides[key] = value  # a repeated key keeps the last value given
+        if key not in ("display_name", "short_description") and key not in optional_order:
+            optional_order.append(key)
+    return overrides, optional_order
+
+
+def write_openai_yaml(skill_dir, skill_name, raw_overrides):
+    overrides, optional_order = parse_interface_overrides(raw_overrides)
+    if overrides is None:
+        return None
+
+    display_name = overrides.get("display_name") or format_display_name(skill_name)
+    short_description = overrides.get("short_description") or generate_short_description(display_name)
+
+    if not (25 <= len(short_description) <= 64):
+        print(
+            "[ERROR] short_description must be 25-64 characters "
+            f"(got {len(short_description)})."
+        )
+        return None
+
+    interface_lines = [
+        "interface:",
+        f"  display_name: {yaml_quote(display_name)}",
+        f"  short_description: {yaml_quote(short_description)}",
+    ]
+
+    for key in optional_order:
+        value = overrides.get(key)
+        if value is not None:
+            interface_lines.append(f"  {key}: {yaml_quote(value)}")
+
+    agents_dir = Path(skill_dir) / "agents"
+    agents_dir.mkdir(parents=True, exist_ok=True)
+    output_path = agents_dir / "openai.yaml"
+    output_path.write_text("\n".join(interface_lines) + "\n")
+    print(f"[OK] Created agents/openai.yaml")
+    return output_path
+
+
+def main():  # CLI entry point: exits 0 when openai.yaml is written, 1 on any error.
+    parser = argparse.ArgumentParser(
+        description="Create agents/openai.yaml for a skill directory.",
+    )
+    parser.add_argument("skill_dir", help="Path to the skill directory")
+    parser.add_argument(
+        "--name",
+        help="Skill name override (defaults to SKILL.md frontmatter)",
+    )
+    parser.add_argument(
+        "--interface",
+        action="append",
+        default=[],
+        help="Interface override in key=value format (repeatable)",
+    )
+    args = parser.parse_args()
+
+    skill_dir = Path(args.skill_dir).resolve()
+    if not skill_dir.exists():
+        print(f"[ERROR] Skill directory not found: {skill_dir}")
+        sys.exit(1)
+    if not skill_dir.is_dir():
+        print(f"[ERROR] Path is not a directory: {skill_dir}")
+        sys.exit(1)
+
+    skill_name = args.name or read_frontmatter_name(skill_dir)  # --name wins; SKILL.md is only read when it is absent
+    if not skill_name:  # read_frontmatter_name has already printed the reason
+        sys.exit(1)
+
+    result = write_openai_yaml(skill_dir, skill_name, args.interface)
+    if result:
+        sys.exit(0)
+    sys.exit(1)
+
+
+if __name__ == "__main__":
+    main()
diff --git a/skills/skill-creator/scripts/init_skill.py b/skills/skill-creator/scripts/init_skill.py
new file mode 100644
index 0000000..69673ea
--- /dev/null
+++ b/skills/skill-creator/scripts/init_skill.py
@@ -0,0 +1,400 @@
+#!/usr/bin/env python3
+"""
+Skill Initializer - Creates a new skill from template
+
+Usage:
+    init_skill.py <skill-name> --path <path> [--resources scripts,references,assets] [--examples] [--interface key=value]
+
+Examples:
+    init_skill.py my-new-skill --path skills/public
+    init_skill.py my-new-skill --path skills/public --resources scripts,references
+    init_skill.py my-api-helper --path skills/private --resources scripts --examples
+    init_skill.py custom-skill --path /custom/location
+    init_skill.py my-skill --path skills/public --interface short_description="Short UI label"
+"""
+
+import argparse
+import re
+import sys
+from pathlib import Path
+
+from generate_openai_yaml import write_openai_yaml
+
+MAX_SKILL_NAME_LENGTH = 64  # longest normalized skill name that main() accepts
+ALLOWED_RESOURCES = {"scripts", "references", "assets"}  # names parse_resources() accepts for --resources
+
+SKILL_TEMPLATE = """---
+name: {skill_name}
+description: [TODO: Complete and informative explanation of what the skill does and when to use it. Include WHEN to use this skill - specific scenarios, file types, or tasks that trigger it.]
+---
+
+# {skill_title}
+
+## Overview
+
+[TODO: 1-2 sentences explaining what this skill enables]
+
+## Structuring This Skill
+
+[TODO: Choose the structure that best fits this skill's purpose. Common patterns:
+
+**1. Workflow-Based** (best for sequential processes)
+- Works well when there are clear step-by-step procedures
+- Example: DOCX skill with "Workflow Decision Tree" -> "Reading" -> "Creating" -> "Editing"
+- Structure: ## Overview -> ## Workflow Decision Tree -> ## Step 1 -> ## Step 2...
+
+**2. Task-Based** (best for tool collections)
+- Works well when the skill offers different operations/capabilities
+- Example: PDF skill with "Quick Start" -> "Merge PDFs" -> "Split PDFs" -> "Extract Text"
+- Structure: ## Overview -> ## Quick Start -> ## Task Category 1 -> ## Task Category 2...
+
+**3. Reference/Guidelines** (best for standards or specifications)
+- Works well for brand guidelines, coding standards, or requirements
+- Example: Brand styling with "Brand Guidelines" -> "Colors" -> "Typography" -> "Features"
+- Structure: ## Overview -> ## Guidelines -> ## Specifications -> ## Usage...
+
+**4. Capabilities-Based** (best for integrated systems)
+- Works well when the skill provides multiple interrelated features
+- Example: Product Management with "Core Capabilities" -> numbered capability list
+- Structure: ## Overview -> ## Core Capabilities -> ### 1. Feature -> ### 2. Feature...
+
+Patterns can be mixed and matched as needed. Most skills combine patterns (e.g., start with task-based, add workflow for complex operations).
+
+Delete this entire "Structuring This Skill" section when done - it's just guidance.]
+
+## [TODO: Replace with the first main section based on chosen structure]
+
+[TODO: Add content here. See examples in existing skills:
+- Code samples for technical skills
+- Decision trees for complex workflows
+- Concrete examples with realistic user requests
+- References to scripts/templates/references as needed]
+
+## Resources (optional)
+
+Create only the resource directories this skill actually needs. Delete this section if no resources are required.
+
+### scripts/
+Executable code (Python/Bash/etc.) that can be run directly to perform specific operations.
+
+**Examples from other skills:**
+- PDF skill: `fill_fillable_fields.py`, `extract_form_field_info.py` - utilities for PDF manipulation
+- DOCX skill: `document.py`, `utilities.py` - Python modules for document processing
+
+**Appropriate for:** Python scripts, shell scripts, or any executable code that performs automation, data processing, or specific operations.
+
+**Note:** Scripts may be executed without loading into context, but can still be read by Codex for patching or environment adjustments.
+
+### references/
+Documentation and reference material intended to be loaded into context to inform Codex's process and thinking.
+
+**Examples from other skills:**
+- Product management: `communication.md`, `context_building.md` - detailed workflow guides
+- BigQuery: API reference documentation and query examples
+- Finance: Schema documentation, company policies
+
+**Appropriate for:** In-depth documentation, API references, database schemas, comprehensive guides, or any detailed information that Codex should reference while working.
+
+### assets/
+Files not intended to be loaded into context, but rather used within the output Codex produces.
+
+**Examples from other skills:**
+- Brand styling: PowerPoint template files (.pptx), logo files
+- Frontend builder: HTML/React boilerplate project directories
+- Typography: Font files (.ttf, .woff2)
+
+**Appropriate for:** Templates, boilerplate code, document templates, images, icons, fonts, or any files meant to be copied or used in the final output.
+
+---
+
+**Not every skill requires all three types of resources.**
+"""
+
+EXAMPLE_SCRIPT = '''#!/usr/bin/env python3
+"""
+Example helper script for {skill_name}
+
+This is a placeholder script that can be executed directly.
+Replace with actual implementation or delete if not needed.
+
+Example real scripts from other skills:
+- pdf/scripts/fill_fillable_fields.py - Fills PDF form fields
+- pdf/scripts/convert_pdf_to_images.py - Converts PDF pages to images
+"""
+
+def main():
+    print("This is an example script for {skill_name}")
+    # TODO: Add actual script logic here
+    # This could be data processing, file conversion, API calls, etc.
+
+if __name__ == "__main__":
+    main()
+'''
+
+EXAMPLE_REFERENCE = """# Reference Documentation for {skill_title}
+
+This is a placeholder for detailed reference documentation.
+Replace with actual reference content or delete if not needed.
+
+Example real reference docs from other skills:
+- product-management/references/communication.md - Comprehensive guide for status updates
+- product-management/references/context_building.md - Deep-dive on gathering context
+- bigquery/references/ - API references and query examples
+
+## When Reference Docs Are Useful
+
+Reference docs are ideal for:
+- Comprehensive API documentation
+- Detailed workflow guides
+- Complex multi-step processes
+- Information too lengthy for main SKILL.md
+- Content that's only needed for specific use cases
+
+## Structure Suggestions
+
+### API Reference Example
+- Overview
+- Authentication
+- Endpoints with examples
+- Error codes
+- Rate limits
+
+### Workflow Guide Example
+- Prerequisites
+- Step-by-step instructions
+- Common patterns
+- Troubleshooting
+- Best practices
+"""
+
+EXAMPLE_ASSET = """# Example Asset File
+
+This placeholder represents where asset files would be stored.
+Replace with actual asset files (templates, images, fonts, etc.) or delete if not needed.
+
+Asset files are NOT intended to be loaded into context, but rather used within
+the output Codex produces.
+
+Example asset files from other skills:
+- Brand guidelines: logo.png, slides_template.pptx
+- Frontend builder: hello-world/ directory with HTML/React boilerplate
+- Typography: custom-font.ttf, font-family.woff2
+- Data: sample_data.csv, test_dataset.json
+
+## Common Asset Types
+
+- Templates: .pptx, .docx, boilerplate directories
+- Images: .png, .jpg, .svg, .gif
+- Fonts: .ttf, .otf, .woff, .woff2
+- Boilerplate code: Project directories, starter files
+- Icons: .ico, .svg
+- Data files: .csv, .json, .xml, .yaml
+
+Note: This is a text placeholder. Actual assets can be any file type.
+"""
+
+
+def normalize_skill_name(skill_name):
+    """Return *skill_name* lowercased, with every run of other characters collapsed to one hyphen."""
+    lowered = skill_name.strip().lower()
+    # Anything outside a-z/0-9 (spaces, underscores, punctuation) becomes a separator.
+    hyphenated = re.sub(r"[^a-z0-9]+", "-", lowered).strip("-")
+    # Defensive second pass; the substitution above should already leave single hyphens.
+    return re.sub(r"-{2,}", "-", hyphenated)
+
+
+def title_case_skill_name(skill_name):
+    """Return the display title: hyphen-separated words capitalized and joined by spaces."""
+    return " ".join(map(str.capitalize, skill_name.split("-")))
+
+
+def parse_resources(raw_resources):
+    """Split a comma-separated --resources value into an ordered, de-duplicated list.
+
+    Blank entries are dropped and first-seen order is kept; an empty value gives [].
+    Any name outside ALLOWED_RESOURCES prints an error and exits with status 1.
+    """
+    if not raw_resources:
+        return []
+    stripped = (piece.strip() for piece in raw_resources.split(","))
+    resources = [piece for piece in stripped if piece]
+    invalid = sorted(set(resources) - ALLOWED_RESOURCES)
+    if invalid:
+        allowed = ", ".join(sorted(ALLOWED_RESOURCES))
+        print(f"[ERROR] Unknown resource type(s): {', '.join(invalid)}")
+        print(f"   Allowed: {allowed}")
+        sys.exit(1)
+    return list(dict.fromkeys(resources))  # dict keys keep insertion order
+
+
+def create_resource_dirs(skill_dir, skill_name, skill_title, resources, include_examples):
+    """Create each requested resource directory, optionally seeding an example file.
+
+    Prints one "[OK]" line per known resource; the example script is made executable.
+    """
+    for kind in resources:
+        folder = skill_dir / kind
+        folder.mkdir(exist_ok=True)
+        if kind == "scripts" and include_examples:
+            sample = folder / "example.py"
+            sample.write_text(EXAMPLE_SCRIPT.format(skill_name=skill_name))
+            sample.chmod(0o755)
+            print("[OK] Created scripts/example.py")
+        elif kind == "scripts":
+            print("[OK] Created scripts/")
+        elif kind == "references" and include_examples:
+            sample = folder / "api_reference.md"
+            sample.write_text(EXAMPLE_REFERENCE.format(skill_title=skill_title))
+            print("[OK] Created references/api_reference.md")
+        elif kind == "references":
+            print("[OK] Created references/")
+        elif kind == "assets" and include_examples:
+            (folder / "example_asset.txt").write_text(EXAMPLE_ASSET)
+            print("[OK] Created assets/example_asset.txt")
+        elif kind == "assets":
+            print("[OK] Created assets/")
+
+
+def init_skill(skill_name, path, resources, include_examples, interface_overrides):
+    """
+    Scaffold a new skill directory: SKILL.md, agents/openai.yaml and optional resources.
+
+    Stops at the first failing step and returns None; anything created before
+    that step is left on disk.
+
+    Args:
+        skill_name: Name of the skill, also used as the directory name
+        path: Parent directory in which the skill directory is created
+        resources: Resource directory names to create (may be empty)
+        include_examples: Whether to create example files in resource directories
+        interface_overrides: Interface overrides passed through to write_openai_yaml
+
+    Returns:
+        Path to created skill directory, or None if error
+    """
+    skill_dir = Path(path).resolve() / skill_name
+
+    # Never write into a directory that is already there.
+    if skill_dir.exists():
+        print(f"[ERROR] Skill directory already exists: {skill_dir}")
+        return None
+
+    try:
+        skill_dir.mkdir(parents=True, exist_ok=False)
+        print(f"[OK] Created skill directory: {skill_dir}")
+    except Exception as e:
+        print(f"[ERROR] Error creating directory: {e}")
+        return None
+
+    # Render SKILL.md from the template.
+    title = title_case_skill_name(skill_name)
+    rendered = SKILL_TEMPLATE.format(skill_name=skill_name, skill_title=title)
+    try:
+        (skill_dir / "SKILL.md").write_text(rendered)
+        print("[OK] Created SKILL.md")
+    except Exception as e:
+        print(f"[ERROR] Error creating SKILL.md: {e}")
+        return None
+
+    # A falsy result from write_openai_yaml also counts as failure; nothing extra is printed for it.
+    try:
+        if not write_openai_yaml(skill_dir, skill_name, interface_overrides):
+            return None
+    except Exception as e:
+        print(f"[ERROR] Error creating agents/openai.yaml: {e}")
+        return None
+
+    # Resource directories are optional.
+    if resources:
+        try:
+            create_resource_dirs(skill_dir, skill_name, title, resources, include_examples)
+        except Exception as e:
+            print(f"[ERROR] Error creating resource directories: {e}")
+            return None
+
+    # Word step 2 of the hints according to what was generated.
+    if not resources:
+        step_two = "2. Create resource directories only if needed (scripts/, references/, assets/)"
+    elif include_examples:
+        step_two = "2. Customize or delete the example files in scripts/, references/, and assets/"
+    else:
+        step_two = "2. Add resources to scripts/, references/, and assets/ as needed"
+
+    print(f"\n[OK] Skill '{skill_name}' initialized successfully at {skill_dir}")
+    print("\nNext steps:")
+    print("1. Edit SKILL.md to complete the TODO items and update the description")
+    print(step_two)
+    print("3. Update agents/openai.yaml if the UI metadata should differ")
+    print("4. Run the validator when ready to check the skill structure")
+    print(
+        "5. Forward-test complex skills with realistic user requests to ensure they work as intended"
+    )
+
+    return skill_dir
+
+
+def main():
+    """Command-line entry point: validate arguments, scaffold the skill, exit 0 or 1."""
+    cli = argparse.ArgumentParser(
+        description="Create a new skill directory with a SKILL.md template.",
+    )
+    cli.add_argument("skill_name", help="Skill name (normalized to hyphen-case)")
+    cli.add_argument("--path", required=True, help="Output directory for the skill")
+    cli.add_argument(
+        "--resources",
+        default="",
+        help="Comma-separated list: scripts,references,assets",
+    )
+    cli.add_argument(
+        "--examples",
+        action="store_true",
+        help="Create example files inside the selected resource directories",
+    )
+    cli.add_argument(
+        "--interface",
+        action="append",
+        default=[],
+        help="Interface override in key=value format (repeatable)",
+    )
+    args = cli.parse_args()
+
+    # Work with the normalized name from here on; reject names that normalize to nothing.
+    raw_skill_name = args.skill_name
+    skill_name = normalize_skill_name(raw_skill_name)
+    if not skill_name:
+        print("[ERROR] Skill name must include at least one letter or digit.")
+        sys.exit(1)
+    if len(skill_name) > MAX_SKILL_NAME_LENGTH:
+        print(
+            f"[ERROR] Skill name '{skill_name}' is too long ({len(skill_name)} characters). "
+            f"Maximum is {MAX_SKILL_NAME_LENGTH} characters."
+        )
+        sys.exit(1)
+    if skill_name != raw_skill_name:
+        print(f"Note: Normalized skill name from '{raw_skill_name}' to '{skill_name}'.")
+
+    # Example files live inside resource directories, so --examples needs --resources.
+    resources = parse_resources(args.resources)
+    if args.examples and not resources:
+        print("[ERROR] --examples requires --resources to be set.")
+        sys.exit(1)
+
+    path = args.path
+
+    print(f"Initializing skill: {skill_name}")
+    print(f"   Location: {path}")
+    if not resources:
+        print("   Resources: none (create as needed)")
+    else:
+        print(f"   Resources: {', '.join(resources)}")
+        if args.examples:
+            print("   Examples: enabled")
+    print()
+
+    created = init_skill(skill_name, path, resources, args.examples, args.interface)
+    # init_skill returns the new directory on success and None on failure.
+    sys.exit(0 if created else 1)
+
+
+if __name__ == "__main__":  # run the CLI only when executed as a script, not on import
+    main()
diff --git a/skills/skill-creator/scripts/quick_validate.py b/skills/skill-creator/scripts/quick_validate.py
new file mode 100644
index 0000000..0547b40
--- /dev/null
+++ b/skills/skill-creator/scripts/quick_validate.py
@@ -0,0 +1,101 @@
+#!/usr/bin/env python3
+"""
+Quick validation script for skills - minimal version
+"""
+
+import re
+import sys
+from pathlib import Path
+
+import yaml
+
+MAX_SKILL_NAME_LENGTH = 64
+
+
+def validate_skill(skill_path):
+    """Validate the SKILL.md frontmatter of a skill directory.
+
+    Returns ``(True, "Skill is valid!")`` or ``(False, reason)``. The file must
+    be UTF-8 and open with a ``---`` delimited YAML mapping that uses only the
+    allowed keys and has a non-empty hyphen-case ``name`` plus a non-empty
+    ``description`` of at most 1024 characters without angle brackets.
+    """
+    skill_md = Path(skill_path) / "SKILL.md"
+    if not skill_md.exists():
+        return False, "SKILL.md not found"
+
+    # Decode explicitly as UTF-8 so the result does not depend on the locale.
+    try:
+        content = skill_md.read_text(encoding="utf-8")
+    except UnicodeDecodeError as e:
+        return False, f"SKILL.md is not valid UTF-8: {e}"
+    if not content.startswith("---"):
+        return False, "No YAML frontmatter found"
+
+    match = re.match(r"^---\n(.*?)\n---", content, re.DOTALL)
+    if not match:
+        return False, "Invalid frontmatter format"
+
+    try:
+        frontmatter = yaml.safe_load(match.group(1))
+    except yaml.YAMLError as e:
+        return False, f"Invalid YAML in frontmatter: {e}"
+    if not isinstance(frontmatter, dict):
+        return False, "Frontmatter must be a YAML dictionary"
+
+    allowed_properties = {"name", "description", "license", "allowed-tools", "metadata"}
+    unexpected_keys = set(frontmatter) - allowed_properties
+    if unexpected_keys:
+        allowed = ", ".join(sorted(allowed_properties))
+        # YAML keys can be ints, bools or None; stringify them so sorting and
+        # joining cannot raise TypeError.
+        unexpected = ", ".join(sorted(str(key) for key in unexpected_keys))
+        return (
+            False,
+            f"Unexpected key(s) in SKILL.md frontmatter: {unexpected}. Allowed properties are: {allowed}",
+        )
+
+    if "name" not in frontmatter:
+        return False, "Missing 'name' in frontmatter"
+    if "description" not in frontmatter:
+        return False, "Missing 'description' in frontmatter"
+
+    name = frontmatter["name"]
+    if not isinstance(name, str):
+        return False, f"Name must be a string, got {type(name).__name__}"
+    name = name.strip()
+    if not name:
+        return False, "Name cannot be empty"
+    if not re.match(r"^[a-z0-9-]+$", name):
+        return False, f"Name '{name}' should be hyphen-case (lowercase letters, digits, and hyphens only)"
+    if name.startswith("-") or name.endswith("-") or "--" in name:
+        return False, f"Name '{name}' cannot start/end with hyphen or contain consecutive hyphens"
+    if len(name) > MAX_SKILL_NAME_LENGTH:
+        return (
+            False,
+            f"Name is too long ({len(name)} characters). "
+            f"Maximum is {MAX_SKILL_NAME_LENGTH} characters.",
+        )
+
+    description = frontmatter["description"]
+    if not isinstance(description, str):
+        return False, f"Description must be a string, got {type(description).__name__}"
+    description = description.strip()
+    if not description:
+        return False, "Description cannot be empty"
+    if "<" in description or ">" in description:
+        return False, "Description cannot contain angle brackets (< or >)"
+    if len(description) > 1024:
+        return False, f"Description is too long ({len(description)} characters). Maximum is 1024 characters."
+
+    return True, "Skill is valid!"
+
+
+if __name__ == "__main__":
+    # Exactly one positional argument is expected: the skill directory.
+    if len(sys.argv) != 2:
+        print("Usage: python quick_validate.py <skill_directory>")
+        sys.exit(1)
+    is_valid, report = validate_skill(sys.argv[1])
+    print(report)
+    sys.exit(1 if not is_valid else 0)
diff --git a/skills/skill-installer/LICENSE.txt b/skills/skill-installer/LICENSE.txt
new file mode 100644
index 0000000..d645695
--- /dev/null
+++ b/skills/skill-installer/LICENSE.txt
@@ -0,0 +1,202 @@
+
+                                 Apache License
+                           Version 2.0, January 2004
+                        http://www.apache.org/licenses/
+
+   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
+
+   1. Definitions.
+
+      "License" shall mean the terms and conditions for use, reproduction,
+      and distribution as defined by Sections 1 through 9 of this document.
+
+      "Licensor" shall mean the copyright owner or entity authorized by
+      the copyright owner that is granting the License.
+
+      "Legal Entity" shall mean the union of the acting entity and all
+      other entities that control, are controlled by, or are under common
+      control with that entity. For the purposes of this definition,
+      "control" means (i) the power, direct or indirect, to cause the
+      direction or management of such entity, whether by contract or
+      otherwise, or (ii) ownership of fifty percent (50%) or more of the
+      outstanding shares, or (iii) beneficial ownership of such entity.
+
+      "You" (or "Your") shall mean an individual or Legal Entity
+      exercising permissions granted by this License.
+
+      "Source" form shall mean the preferred form for making modifications,
+      including but not limited to software source code, documentation
+      source, and configuration files.
+
+      "Object" form shall mean any form resulting from mechanical
+      transformation or translation of a Source form, including but
+      not limited to compiled object code, generated documentation,
+      and conversions to other media types.
+
+      "Work" shall mean the work of authorship, whether in Source or
+      Object form, made available under the License, as indicated by a
+      copyright notice that is included in or attached to the work
+      (an example is provided in the Appendix below).
+
+      "Derivative Works" shall mean any work, whether in Source or Object
+      form, that is based on (or derived from) the Work and for which the
+      editorial revisions, annotations, elaborations, or other modifications
+      represent, as a whole, an original work of authorship. For the purposes
+      of this License, Derivative Works shall not include works that remain
+      separable from, or merely link (or bind by name) to the interfaces of,
+      the Work and Derivative Works thereof.
+
+      "Contribution" shall mean any work of authorship, including
+      the original version of the Work and any modifications or additions
+      to that Work or Derivative Works thereof, that is intentionally
+      submitted to Licensor for inclusion in the Work by the copyright owner
+      or by an individual or Legal Entity authorized to submit on behalf of
+      the copyright owner. For the purposes of this definition, "submitted"
+      means any form of electronic, verbal, or written communication sent
+      to the Licensor or its representatives, including but not limited to
+      communication on electronic mailing lists, source code control systems,
+      and issue tracking systems that are managed by, or on behalf of, the
+      Licensor for the purpose of discussing and improving the Work, but
+      excluding communication that is conspicuously marked or otherwise
+      designated in writing by the copyright owner as "Not a Contribution."
+
+      "Contributor" shall mean Licensor and any individual or Legal Entity
+      on behalf of whom a Contribution has been received by Licensor and
+      subsequently incorporated within the Work.
+
+   2. Grant of Copyright License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      copyright license to reproduce, prepare Derivative Works of,
+      publicly display, publicly perform, sublicense, and distribute the
+      Work and such Derivative Works in Source or Object form.
+
+   3. Grant of Patent License. Subject to the terms and conditions of
+      this License, each Contributor hereby grants to You a perpetual,
+      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
+      (except as stated in this section) patent license to make, have made,
+      use, offer to sell, sell, import, and otherwise transfer the Work,
+      where such license applies only to those patent claims licensable
+      by such Contributor that are necessarily infringed by their
+      Contribution(s) alone or by combination of their Contribution(s)
+      with the Work to which such Contribution(s) was submitted. If You
+      institute patent litigation against any entity (including a
+      cross-claim or counterclaim in a lawsuit) alleging that the Work
+      or a Contribution incorporated within the Work constitutes direct
+      or contributory patent infringement, then any patent licenses
+      granted to You under this License for that Work shall terminate
+      as of the date such litigation is filed.
+
+   4. Redistribution. You may reproduce and distribute copies of the
+      Work or Derivative Works thereof in any medium, with or without
+      modifications, and in Source or Object form, provided that You
+      meet the following conditions:
+
+      (a) You must give any other recipients of the Work or
+          Derivative Works a copy of this License; and
+
+      (b) You must cause any modified files to carry prominent notices
+          stating that You changed the files; and
+
+      (c) You must retain, in the Source form of any Derivative Works
+          that You distribute, all copyright, patent, trademark, and
+          attribution notices from the Source form of the Work,
+          excluding those notices that do not pertain to any part of
+          the Derivative Works; and
+
+      (d) If the Work includes a "NOTICE" text file as part of its
+          distribution, then any Derivative Works that You distribute must
+          include a readable copy of the attribution notices contained
+          within such NOTICE file, excluding those notices that do not
+          pertain to any part of the Derivative Works, in at least one
+          of the following places: within a NOTICE text file distributed
+          as part of the Derivative Works; within the Source form or
+          documentation, if provided along with the Derivative Works; or,
+          within a display generated by the Derivative Works, if and
+          wherever such third-party notices normally appear. The contents
+          of the NOTICE file are for informational purposes only and
+          do not modify the License. You may add Your own attribution
+          notices within Derivative Works that You distribute, alongside
+          or as an addendum to the NOTICE text from the Work, provided
+          that such additional attribution notices cannot be construed
+          as modifying the License.
+
+      You may add Your own copyright statement to Your modifications and
+      may provide additional or different license terms and conditions
+      for use, reproduction, or distribution of Your modifications, or
+      for any such Derivative Works as a whole, provided Your use,
+      reproduction, and distribution of the Work otherwise complies with
+      the conditions stated in this License.
+
+   5. Submission of Contributions. Unless You explicitly state otherwise,
+      any Contribution intentionally submitted for inclusion in the Work
+      by You to the Licensor shall be under the terms and conditions of
+      this License, without any additional terms or conditions.
+      Notwithstanding the above, nothing herein shall supersede or modify
+      the terms of any separate license agreement you may have executed
+      with Licensor regarding such Contributions.
+
+   6. Trademarks. This License does not grant permission to use the trade
+      names, trademarks, service marks, or product names of the Licensor,
+      except as required for reasonable and customary use in describing the
+      origin of the Work and reproducing the content of the NOTICE file.
+
+   7. Disclaimer of Warranty. Unless required by applicable law or
+      agreed to in writing, Licensor provides the Work (and each
+      Contributor provides its Contributions) on an "AS IS" BASIS,
+      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
+      implied, including, without limitation, any warranties or conditions
+      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
+      PARTICULAR PURPOSE. You are solely responsible for determining the
+      appropriateness of using or redistributing the Work and assume any
+      risks associated with Your exercise of permissions under this License.
+
+   8. Limitation of Liability. In no event and under no legal theory,
+      whether in tort (including negligence), contract, or otherwise,
+      unless required by applicable law (such as deliberate and grossly
+      negligent acts) or agreed to in writing, shall any Contributor be
+      liable to You for damages, including any direct, indirect, special,
+      incidental, or consequential damages of any character arising as a
+      result of this License or out of the use or inability to use the
+      Work (including but not limited to damages for loss of goodwill,
+      work stoppage, computer failure or malfunction, or any and all
+      other commercial damages or losses), even if such Contributor
+      has been advised of the possibility of such damages.
+
+   9. Accepting Warranty or Additional Liability. While redistributing
+      the Work or Derivative Works thereof, You may choose to offer,
+      and charge a fee for, acceptance of support, warranty, indemnity,
+      or other liability obligations and/or rights consistent with this
+      License. However, in accepting such obligations, You may act only
+      on Your own behalf and on Your sole responsibility, not on behalf
+      of any other Contributor, and only if You agree to indemnify,
+      defend, and hold each Contributor harmless for any liability
+      incurred by, or claims asserted against, such Contributor by reason
+      of your accepting any such warranty or additional liability.
+
+   END OF TERMS AND CONDITIONS
+
+   APPENDIX: How to apply the Apache License to your work.
+
+      To apply the Apache License to your work, attach the following
+      boilerplate notice, with the fields enclosed by brackets "[]"
+      replaced with your own identifying information. (Don't include
+      the brackets!)  The text should be enclosed in the appropriate
+      comment syntax for the file format. We also recommend that a
+      file or class name and description of purpose be included on the
+      same "printed page" as the copyright notice for easier
+      identification within third-party archives.
+
+   Copyright [yyyy] [name of copyright owner]
+
+   Licensed under the Apache License, Version 2.0 (the "License");
+   you may not use this file except in compliance with the License.
+   You may obtain a copy of the License at
+
+       http://www.apache.org/licenses/LICENSE-2.0
+
+   Unless required by applicable law or agreed to in writing, software
+   distributed under the License is distributed on an "AS IS" BASIS,
+   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+   See the License for the specific language governing permissions and
+   limitations under the License.
diff --git a/skills/skill-installer/SKILL.md b/skills/skill-installer/SKILL.md
new file mode 100644
index 0000000..313626a
--- /dev/null
+++ b/skills/skill-installer/SKILL.md
@@ -0,0 +1,58 @@
+---
+name: skill-installer
+description: Install Codex skills into $CODEX_HOME/skills from a curated list or a GitHub repo path. Use when a user asks to list installable skills, install a curated skill, or install a skill from another repo (including private repos).
+metadata:
+  short-description: Install curated skills from openai/skills or other repos
+---
+
+# Skill Installer
+
+Helps install skills. By default these are from https://github.com/openai/skills/tree/main/skills/.curated, but users can also provide other locations. Experimental skills live in https://github.com/openai/skills/tree/main/skills/.experimental and can be installed the same way.
+
+Use the helper scripts based on the task:
+- List skills when the user asks what is available, or if the user uses this skill without specifying what to do. Default listing is `.curated`, but you can pass `--path skills/.experimental` when they ask about experimental skills.
+- Install from the curated list when the user provides a skill name.
+- Install from another repo when the user provides a GitHub repo/path (including private repos).
+
+Install skills with the helper scripts.
+
+## Communication
+
+When listing skills, output approximately as follows, depending on the context of the user's request. If they ask about experimental skills, list from `.experimental` instead of `.curated` and label the source accordingly:
+"""
+Skills from {repo}:
+1. skill-1
+2. skill-2 (already installed)
+3. ...
+Which ones would you like installed?
+"""
+
+After installing a skill, tell the user: "Restart Codex to pick up new skills."
+
+## Scripts
+
+All of these scripts use the network, so request escalation before running them in the sandbox.
+
+- `scripts/list-skills.py` (prints skills list with installed annotations)
+- `scripts/list-skills.py --format json`
+- Example (experimental list): `scripts/list-skills.py --path skills/.experimental`
+- `scripts/install-skill-from-github.py --repo <owner>/<repo> --path <path/to/skill> [<path/to/skill> ...]`
+- `scripts/install-skill-from-github.py --url https://github.com/<owner>/<repo>/tree/<ref>/<path>`
+- Example (experimental skill): `scripts/install-skill-from-github.py --repo openai/skills --path skills/.experimental/<skill-name>`
+
+## Behavior and Options
+
+- Defaults to direct download for public GitHub repos.
+- With `--method auto`, if the download fails with an auth/permission-style error (HTTP 401, 403, or 404), falls back to git sparse checkout.
+- Aborts if the destination skill directory already exists.
+- Installs into `$CODEX_HOME/skills/<skill-name>` (`CODEX_HOME` defaults to `~/.codex`, i.e. `~/.codex/skills/<skill-name>`).
+- Multiple `--path` values install multiple skills in one run, each named from its path basename; `--name` is honored only when a single path is given.
+- Options: `--ref <ref>` (default `main`), `--dest <path>`, `--method auto|download|git`.
+
+## Notes
+
+- Curated listing is fetched from `https://github.com/openai/skills/tree/main/skills/.curated` via the GitHub API. If it is unavailable, explain the error and exit.
+- Private GitHub repos can be accessed via existing git credentials or optional `GITHUB_TOKEN`/`GH_TOKEN` for download.
+- Git fallback tries HTTPS first, then SSH.
+- The skills at https://github.com/openai/skills/tree/main/skills/.system are preinstalled, so no need to help users install those. If they ask, just explain this. If they insist, you can download and overwrite.
+- Installed annotations come from `$CODEX_HOME/skills`.
diff --git a/skills/skill-installer/agents/openai.yaml b/skills/skill-installer/agents/openai.yaml
new file mode 100644
index 0000000..88d40cd
--- /dev/null
+++ b/skills/skill-installer/agents/openai.yaml
@@ -0,0 +1,5 @@
+interface:
+  display_name: "Skill Installer"
+  short_description: "Install curated skills from openai/skills or other repos"
+  icon_small: "./assets/skill-installer-small.svg"
+  icon_large: "./assets/skill-installer.png"
diff --git a/skills/skill-installer/assets/skill-installer-small.svg b/skills/skill-installer/assets/skill-installer-small.svg
new file mode 100644
index 0000000..ccfc034
--- /dev/null
+++ b/skills/skill-installer/assets/skill-installer-small.svg
@@ -0,0 +1,3 @@
+<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" viewBox="0 0 16 16">
+  <path fill="#0D0D0D" d="M2.145 3.959a2.033 2.033 0 0 1 2.022-1.824h5.966c.551 0 .997 0 1.357.029.367.03.692.093.993.246l.174.098c.397.243.72.593.932 1.01l.053.114c.116.269.168.557.194.878.03.36.03.805.03 1.357v4.3a2.365 2.365 0 0 1-2.366 2.365h-1.312a2.198 2.198 0 0 1-4.377 0H4.167A2.032 2.032 0 0 1 2.135 10.5V9.333l.004-.088A.865.865 0 0 1 3 8.468l.116-.006A1.135 1.135 0 0 0 3 6.199a.865.865 0 0 1-.865-.864V4.167l.01-.208Zm1.054 1.186a2.198 2.198 0 0 1 0 4.376v.98c0 .534.433.967.968.967H6l.089.004a.866.866 0 0 1 .776.861 1.135 1.135 0 0 0 2.27 0c0-.478.387-.865.865-.865h1.5c.719 0 1.301-.583 1.301-1.301v-4.3c0-.57 0-.964-.025-1.27a1.933 1.933 0 0 0-.09-.493L12.642 4a1.47 1.47 0 0 0-.541-.585l-.102-.056c-.126-.065-.295-.11-.596-.135a17.31 17.31 0 0 0-1.27-.025H4.167a.968.968 0 0 0-.968.968v.978Z"/>
+</svg>
diff --git a/skills/skill-installer/assets/skill-installer.png b/skills/skill-installer/assets/skill-installer.png
new file mode 100644
index 0000000000000000000000000000000000000000..2977cd5bb49b3b8bd50d8bf476d7cffbb3f88a46
GIT binary patch
literal 1086
zcmV-E1i|}>P)<h;3K|Lk000e1NJLTq003kF003kN1^@s6aN?Cz00009a7bBm000XU
z000XU0RWnu7ytkO0drDELIAGL9O(c600d`2O+f$vv5yP<VFdsH1Jg-FK~#7F?cL8#
z6Hye$@!!m}r7gu`q4F=mKXIWfR1#c}xWFZkz|)xc0KSA9R=RSljSE@0z_@UM$Uh@!
zfKm(;XgjTQY^otF=(KaonK|c^kf2r}e7SSy-aAA<DW#NBN-3q3Qc9_Cu;5eU<&!zU
zo&z(dZ^pq;A+@+z@bed9@Xels)p!Qgu7aNz+fb}%5N0$8Ga7^$4Z@5DVMc>6qd}PI
zU}1Q*8dV$h?`gQj1R5vJPv45w5fz~cLLuCh0o2wr7yk^=5sDx*5-Ll>Xp|j99s4;%
zQVhaANX@%UNr^#N2cgm7dK0)Ltb@2~8A!uANPWK#(lEbd$(cJ^cn7KaK4A_$)<LYa
z3u#yfv4_qe4eKDz$SI`ZJwirL#9g-7uhioY4<HHqAT*D}rVb%RC=RG%caD&lDT=s!
zh2}hj=95IWg8EJhwT(=m8;<tCHN>)6Sba%Y@i-cF@4&0#eXMdBwS%I!9;%>MLUm$j
zrCd1PXrVVcuxk8{|NH&3w<GY&PWK}|HvTulxsPLe7mj2S4!z}aa1Rer+uQ9)n9v>J
zwpj5xtS;6mPHqVC8|_7OywPK))2M818jm9KAqOWj&~}U#8byi8o8IU#yT2wbh!syD
zHZqD%P!uPhhe_gsIGN0aIm3_G^_<aBA}@$HcXa)43}#`9tRRll)#zxUyE9Wn1+l$#
zMj*U-$P|5)lo?S$0$W44=C*MBFAN{OZ|`S!S04aJ0Ze{VAA!W>=OW3~=jat$Bqr}o
zwed>-54oBfA#OmM02NtJp6DFHjJY6*fR0~N$B@KakW2uFN)*+pK@xL8a=*~E{5GU9
z7lgjE^FPor8XehvNMm+VAKmi4upORROsoYr4~2-?AT&zue)b<_;+x3PLCl{R(swyU
z`8f#`M=pQu<Vt5Z1pOr-U248x_4cevot=4HwcZ@zw!YAG3EQ1$uHb3GM~g=qJ*lJS
zO+YuJV*bVXUmp(wd$)lvPn++DL~qa3DGXhXdVxkv|1vPV-i)$2jWCG*N}a+ye(mjv
zy+att**c*h`3-O<YcFf&m3O$r`&L?35W0LZA0_g3dv7g+GkHO>JK#)Skp2=llNY2K
z(32;I$O}>$17`w*@ZRH+7i4u7oXHA8`&rC48s!9`5TEA3U1)!T$`_i*mloLHVUcJD
zp#WcJn{OeAL8236`~Lrp!}4JBZfavXG$C4|6Xe4JqCg)dWk!QAqd}O_Ak1hGW;6&h
z8iW}Q!b~R%!vfF$u!G|#Wf!27Qc5YMlu}A5rBp=y0R^AlXy0glYybcN07*qoM6N<$
Ef|C;DQ~&?~

literal 0
HcmV?d00001

diff --git a/skills/skill-installer/scripts/github_utils.py b/skills/skill-installer/scripts/github_utils.py
new file mode 100644
index 0000000..711f597
--- /dev/null
+++ b/skills/skill-installer/scripts/github_utils.py
@@ -0,0 +1,21 @@
+#!/usr/bin/env python3
+"""Shared GitHub helpers for skill install scripts."""
+
+from __future__ import annotations
+
+import os
+import urllib.request
+
+
+def github_request(url: str, user_agent: str) -> bytes:
+    headers = {"User-Agent": user_agent}
+    token = os.environ.get("GITHUB_TOKEN") or os.environ.get("GH_TOKEN")
+    if token:
+        headers["Authorization"] = f"token {token}"
+    req = urllib.request.Request(url, headers=headers)
+    with urllib.request.urlopen(req) as resp:
+        return resp.read()
+
+
+def github_api_contents_url(repo: str, path: str, ref: str) -> str:
+    return f"https://api.github.com/repos/{repo}/contents/{path}?ref={ref}"
diff --git a/skills/skill-installer/scripts/install-skill-from-github.py b/skills/skill-installer/scripts/install-skill-from-github.py
new file mode 100644
index 0000000..1c8ce89
--- /dev/null
+++ b/skills/skill-installer/scripts/install-skill-from-github.py
@@ -0,0 +1,308 @@
+#!/usr/bin/env python3
+"""Install a skill from a GitHub repo path into $CODEX_HOME/skills."""
+
+from __future__ import annotations
+
+import argparse
+from dataclasses import dataclass
+import os
+import shutil
+import subprocess
+import sys
+import tempfile
+import urllib.error
+import urllib.parse
+import zipfile
+
+from github_utils import github_request
+DEFAULT_REF = "main"
+
+
+@dataclass
+class Args:
+    url: str | None = None
+    repo: str | None = None
+    path: list[str] | None = None
+    ref: str = DEFAULT_REF
+    dest: str | None = None
+    name: str | None = None
+    method: str = "auto"
+
+
+@dataclass
+class Source:
+    owner: str
+    repo: str
+    ref: str
+    paths: list[str]
+    repo_url: str | None = None
+
+
+class InstallError(Exception):
+    pass
+
+
+def _codex_home() -> str:
+    return os.environ.get("CODEX_HOME", os.path.expanduser("~/.codex"))
+
+
+def _tmp_root() -> str:
+    base = os.path.join(tempfile.gettempdir(), "codex")
+    os.makedirs(base, exist_ok=True)
+    return base
+
+
+def _request(url: str) -> bytes:
+    return github_request(url, "codex-skill-install")
+
+
+def _parse_github_url(url: str, default_ref: str) -> tuple[str, str, str, str | None]:
+    parsed = urllib.parse.urlparse(url)
+    if parsed.netloc != "github.com":
+        raise InstallError("Only GitHub URLs are supported for download mode.")
+    parts = [p for p in parsed.path.split("/") if p]
+    if len(parts) < 2:
+        raise InstallError("Invalid GitHub URL.")
+    owner, repo = parts[0], parts[1]
+    ref = default_ref
+    subpath = ""
+    if len(parts) > 2:
+        if parts[2] in ("tree", "blob"):
+            if len(parts) < 4:
+                raise InstallError("GitHub URL missing ref or path.")
+            ref = parts[3]
+            subpath = "/".join(parts[4:])
+        else:
+            subpath = "/".join(parts[2:])
+    return owner, repo, ref, subpath or None
+
+
+def _download_repo_zip(owner: str, repo: str, ref: str, dest_dir: str) -> str:
+    zip_url = f"https://codeload.github.com/{owner}/{repo}/zip/{ref}"
+    zip_path = os.path.join(dest_dir, "repo.zip")
+    try:
+        payload = _request(zip_url)
+    except urllib.error.HTTPError as exc:
+        raise InstallError(f"Download failed: HTTP {exc.code}") from exc
+    with open(zip_path, "wb") as file_handle:
+        file_handle.write(payload)
+    with zipfile.ZipFile(zip_path, "r") as zip_file:
+        _safe_extract_zip(zip_file, dest_dir)
+        top_levels = {name.split("/")[0] for name in zip_file.namelist() if name}
+    if not top_levels:
+        raise InstallError("Downloaded archive was empty.")
+    if len(top_levels) != 1:
+        raise InstallError("Unexpected archive layout.")
+    return os.path.join(dest_dir, next(iter(top_levels)))
+
+
+def _run_git(args: list[str]) -> None:
+    result = subprocess.run(args, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
+    if result.returncode != 0:
+        raise InstallError(result.stderr.strip() or "Git command failed.")
+
+
+def _safe_extract_zip(zip_file: zipfile.ZipFile, dest_dir: str) -> None:
+    dest_root = os.path.realpath(dest_dir)
+    for info in zip_file.infolist():
+        extracted_path = os.path.realpath(os.path.join(dest_dir, info.filename))
+        if extracted_path == dest_root or extracted_path.startswith(dest_root + os.sep):
+            continue
+        raise InstallError("Archive contains files outside the destination.")
+    zip_file.extractall(dest_dir)
+
+
+def _validate_relative_path(path: str) -> None:
+    if os.path.isabs(path) or os.path.normpath(path).startswith(".."):
+        raise InstallError("Skill path must be a relative path inside the repo.")
+
+
+def _validate_skill_name(name: str) -> None:
+    altsep = os.path.altsep
+    if not name or os.path.sep in name or (altsep and altsep in name):
+        raise InstallError("Skill name must be a single path segment.")
+    if name in (".", ".."):
+        raise InstallError("Invalid skill name.")
+
+
+def _git_sparse_checkout(repo_url: str, ref: str, paths: list[str], dest_dir: str) -> str:
+    repo_dir = os.path.join(dest_dir, "repo")
+    clone_cmd = [
+        "git",
+        "clone",
+        "--filter=blob:none",
+        "--depth",
+        "1",
+        "--sparse",
+        "--single-branch",
+        "--branch",
+        ref,
+        repo_url,
+        repo_dir,
+    ]
+    try:
+        _run_git(clone_cmd)
+    except InstallError:
+        _run_git(
+            [
+                "git",
+                "clone",
+                "--filter=blob:none",
+                "--depth",
+                "1",
+                "--sparse",
+                "--single-branch",
+                repo_url,
+                repo_dir,
+            ]
+        )
+    _run_git(["git", "-C", repo_dir, "sparse-checkout", "set", *paths])
+    _run_git(["git", "-C", repo_dir, "checkout", ref])
+    return repo_dir
+
+
+def _validate_skill(path: str) -> None:
+    if not os.path.isdir(path):
+        raise InstallError(f"Skill path not found: {path}")
+    skill_md = os.path.join(path, "SKILL.md")
+    if not os.path.isfile(skill_md):
+        raise InstallError("SKILL.md not found in selected skill directory.")
+
+
+def _copy_skill(src: str, dest_dir: str) -> None:
+    os.makedirs(os.path.dirname(dest_dir), exist_ok=True)
+    if os.path.exists(dest_dir):
+        raise InstallError(f"Destination already exists: {dest_dir}")
+    shutil.copytree(src, dest_dir)
+
+
+def _build_repo_url(owner: str, repo: str) -> str:
+    return f"https://github.com/{owner}/{repo}.git"
+
+
+def _build_repo_ssh(owner: str, repo: str) -> str:
+    return f"git@github.com:{owner}/{repo}.git"
+
+
+def _prepare_repo(source: Source, method: str, tmp_dir: str) -> str:
+    if method in ("download", "auto"):
+        try:
+            return _download_repo_zip(source.owner, source.repo, source.ref, tmp_dir)
+        except InstallError as exc:
+            if method == "download":
+                raise
+            err_msg = str(exc)
+            if "HTTP 401" in err_msg or "HTTP 403" in err_msg or "HTTP 404" in err_msg:
+                pass
+            else:
+                raise
+    if method in ("git", "auto"):
+        repo_url = source.repo_url or _build_repo_url(source.owner, source.repo)
+        try:
+            return _git_sparse_checkout(repo_url, source.ref, source.paths, tmp_dir)
+        except InstallError:
+            repo_url = _build_repo_ssh(source.owner, source.repo)
+            return _git_sparse_checkout(repo_url, source.ref, source.paths, tmp_dir)
+    raise InstallError("Unsupported method.")
+
+
+def _resolve_source(args: Args) -> Source:
+    if args.url:
+        owner, repo, ref, url_path = _parse_github_url(args.url, args.ref)
+        if args.path is not None:
+            paths = list(args.path)
+        elif url_path:
+            paths = [url_path]
+        else:
+            paths = []
+        if not paths:
+            raise InstallError("Missing --path for GitHub URL.")
+        return Source(owner=owner, repo=repo, ref=ref, paths=paths)
+
+    if not args.repo:
+        raise InstallError("Provide --repo or --url.")
+    if "://" in args.repo:
+        return _resolve_source(
+            Args(url=args.repo, repo=None, path=args.path, ref=args.ref)
+        )
+
+    repo_parts = [p for p in args.repo.split("/") if p]
+    if len(repo_parts) != 2:
+        raise InstallError("--repo must be in owner/repo format.")
+    if not args.path:
+        raise InstallError("Missing --path for --repo.")
+    paths = list(args.path)
+    return Source(
+        owner=repo_parts[0],
+        repo=repo_parts[1],
+        ref=args.ref,
+        paths=paths,
+    )
+
+
+def _default_dest() -> str:
+    return os.path.join(_codex_home(), "skills")
+
+
+def _parse_args(argv: list[str]) -> Args:
+    parser = argparse.ArgumentParser(description="Install a skill from GitHub.")
+    parser.add_argument("--repo", help="owner/repo")
+    parser.add_argument("--url", help="https://github.com/owner/repo[/tree/ref/path]")
+    parser.add_argument(
+        "--path",
+        nargs="+",
+        help="Path(s) to skill(s) inside repo",
+    )
+    parser.add_argument("--ref", default=DEFAULT_REF)
+    parser.add_argument("--dest", help="Destination skills directory")
+    parser.add_argument(
+        "--name", help="Destination skill name (defaults to basename of path)"
+    )
+    parser.add_argument(
+        "--method",
+        choices=["auto", "download", "git"],
+        default="auto",
+    )
+    return parser.parse_args(argv, namespace=Args())
+
+
+def main(argv: list[str]) -> int:
+    args = _parse_args(argv)
+    try:
+        source = _resolve_source(args)
+        source.ref = source.ref or args.ref
+        if not source.paths:
+            raise InstallError("No skill paths provided.")
+        for path in source.paths:
+            _validate_relative_path(path)
+        dest_root = args.dest or _default_dest()
+        tmp_dir = tempfile.mkdtemp(prefix="skill-install-", dir=_tmp_root())
+        try:
+            repo_root = _prepare_repo(source, args.method, tmp_dir)
+            installed = []
+            for path in source.paths:
+                skill_name = args.name if len(source.paths) == 1 else None
+                skill_name = skill_name or os.path.basename(path.rstrip("/"))
+                _validate_skill_name(skill_name)
+                if not skill_name:
+                    raise InstallError("Unable to derive skill name.")
+                dest_dir = os.path.join(dest_root, skill_name)
+                if os.path.exists(dest_dir):
+                    raise InstallError(f"Destination already exists: {dest_dir}")
+                skill_src = os.path.join(repo_root, path)
+                _validate_skill(skill_src)
+                _copy_skill(skill_src, dest_dir)
+                installed.append((skill_name, dest_dir))
+        finally:
+            if os.path.isdir(tmp_dir):
+                shutil.rmtree(tmp_dir, ignore_errors=True)
+        for skill_name, dest_dir in installed:
+            print(f"Installed {skill_name} to {dest_dir}")
+        return 0
+    except InstallError as exc:
+        print(f"Error: {exc}", file=sys.stderr)
+        return 1
+
+
+if __name__ == "__main__":
+    raise SystemExit(main(sys.argv[1:]))
diff --git a/skills/skill-installer/scripts/list-skills.py b/skills/skill-installer/scripts/list-skills.py
new file mode 100644
index 0000000..0977c29
--- /dev/null
+++ b/skills/skill-installer/scripts/list-skills.py
@@ -0,0 +1,107 @@
+#!/usr/bin/env python3
+"""List skills from a GitHub repo path."""
+
+from __future__ import annotations
+
+import argparse
+import json
+import os
+import sys
+import urllib.error
+
+from github_utils import github_api_contents_url, github_request
+
+DEFAULT_REPO = "openai/skills"
+DEFAULT_PATH = "skills/.curated"
+DEFAULT_REF = "main"
+
+
+class ListError(Exception):
+    pass
+
+
+class Args(argparse.Namespace):
+    repo: str
+    path: str
+    ref: str
+    format: str
+
+
+def _request(url: str) -> bytes:
+    return github_request(url, "codex-skill-list")
+
+
+def _codex_home() -> str:
+    return os.environ.get("CODEX_HOME", os.path.expanduser("~/.codex"))
+
+
+def _installed_skills() -> set[str]:
+    root = os.path.join(_codex_home(), "skills")
+    if not os.path.isdir(root):
+        return set()
+    entries = set()
+    for name in os.listdir(root):
+        path = os.path.join(root, name)
+        if os.path.isdir(path):
+            entries.add(name)
+    return entries
+
+
+def _list_skills(repo: str, path: str, ref: str) -> list[str]:
+    api_url = github_api_contents_url(repo, path, ref)
+    try:
+        payload = _request(api_url)
+    except urllib.error.HTTPError as exc:
+        if exc.code == 404:
+            raise ListError(
+                "Skills path not found: "
+                f"https://github.com/{repo}/tree/{ref}/{path}"
+            ) from exc
+        raise ListError(f"Failed to fetch skills: HTTP {exc.code}") from exc
+    data = json.loads(payload.decode("utf-8"))
+    if not isinstance(data, list):
+        raise ListError("Unexpected skills listing response.")
+    skills = [item["name"] for item in data if item.get("type") == "dir"]
+    return sorted(skills)
+
+
+def _parse_args(argv: list[str]) -> Args:
+    parser = argparse.ArgumentParser(description="List skills.")
+    parser.add_argument("--repo", default=DEFAULT_REPO)
+    parser.add_argument(
+        "--path",
+        default=DEFAULT_PATH,
+        help="Repo path to list (default: skills/.curated)",
+    )
+    parser.add_argument("--ref", default=DEFAULT_REF)
+    parser.add_argument(
+        "--format",
+        choices=["text", "json"],
+        default="text",
+        help="Output format",
+    )
+    return parser.parse_args(argv, namespace=Args())
+
+
+def main(argv: list[str]) -> int:
+    args = _parse_args(argv)
+    try:
+        skills = _list_skills(args.repo, args.path, args.ref)
+        installed = _installed_skills()
+        if args.format == "json":
+            payload = [
+                {"name": name, "installed": name in installed} for name in skills
+            ]
+            print(json.dumps(payload))
+        else:
+            for idx, name in enumerate(skills, start=1):
+                suffix = " (already installed)" if name in installed else ""
+                print(f"{idx}. {name}{suffix}")
+        return 0
+    except ListError as exc:
+        print(f"Error: {exc}", file=sys.stderr)
+        return 1
+
+
+if __name__ == "__main__":
+    raise SystemExit(main(sys.argv[1:]))

From d43be9041955ea37c3437c3cfb5779ce9351e92f Mon Sep 17 00:00:00 2001
From: ActivePeter <1020401660@qq.com>
Date: Mon, 22 Jun 2026 21:30:57 +0800
Subject: [PATCH 03/13] test

---
 fluxon_rs/fluxon_kv/src/kv_test.rs            | 31 ++++++++--
 .../test_top_attention_log_mgmt_contract.py   | 57 +++++++++++++++++++
 .../top_attention_test_index/_common.py       | 16 ++++++
 .../top_attention_test_index/_log_mgmt.py     | 15 +++--
 4 files changed, 111 insertions(+), 8 deletions(-)

diff --git a/fluxon_rs/fluxon_kv/src/kv_test.rs b/fluxon_rs/fluxon_kv/src/kv_test.rs
index a287769..8c3a711 100644
--- a/fluxon_rs/fluxon_kv/src/kv_test.rs
+++ b/fluxon_rs/fluxon_kv/src/kv_test.rs
@@ -11,7 +11,7 @@
 
 use crate::cluster_manager::ClusterManagerRdmaControlInit;
 use crate::config::{
-    ClientConfig, ContributeToClusterPoolSize, FluxonKvSpec, MasterConfig, MonitoringConfig,
+    ClientConfig, ContributeToClusterPoolSize, FluxonKvSpec, LargeFilePaths, MasterConfig, MonitoringConfig,
     ProtocolConfig, ProtocolType, TestSpecConfig, TestSpecTransportMode, TransferEngineType,
 };
 use crate::run_master_with_test_overrides;
@@ -850,6 +850,24 @@ fn default_external_contribute_to_cluster_pool_size() -> ContributeToClusterPool
     }
 }
 
+fn default_client_large_file_paths(
+    instance_key: &str,
+    contribute_to_cluster_pool_size: &ContributeToClusterPoolSize,
+) -> LargeFilePaths {
+    if contribute_to_cluster_pool_size.dram == 0
+        && contribute_to_cluster_pool_size.vram.is_empty()
+    {
+        return LargeFilePaths {
+            log_root_path: String::new(),
+            cache_root_path: String::new(),
+        };
+    }
+    LargeFilePaths {
+        log_root_path: format!("/tmp/kvcache_large/log/{}", instance_key),
+        cache_root_path: format!("/tmp/kvcache_large/cache/{}", instance_key),
+    }
+}
+
 fn default_owner_test_client_options(round_profile: KvTestRoundProfile) -> KvTestClientOptions {
     KvTestClientOptions {
         protocol_config: Some(round_profile.protocol_config()),
@@ -1020,6 +1038,9 @@ fn build_client_launch(
         .rdma_control_init
         .expect("kv_test requires rdma_control_init to be set explicitly");
     let transfer_backend_activation_mode = options.transfer_backend_activation_mode;
+    let contribute_to_cluster_pool_size = options
+        .contribute_to_cluster_pool_size
+        .unwrap_or(default_owner_contribute_to_cluster_pool_size());
     let shared_memory_path = options
         .shared_memory_path
         .unwrap_or_else(|| format!("/tmp/kvcache_shared_memory/{}", instance_key));
@@ -1030,9 +1051,7 @@ fn build_client_launch(
         cluster_name: round.cluster_name.clone(),
         etcd_addresses_raw,
         instance_key: instance_key.clone(),
-        contribute_to_cluster_pool_size: options
-            .contribute_to_cluster_pool_size
-            .unwrap_or(default_owner_contribute_to_cluster_pool_size()),
+        contribute_to_cluster_pool_size: contribute_to_cluster_pool_size.clone(),
         protocol: options.protocol_config.unwrap_or_else(tcp_protocol_config),
         pprof_duration_seconds: None,
         redis_compat_listen_addr: None,
@@ -1054,6 +1073,10 @@ fn build_client_launch(
         // binds multiple roles to the same owner path.
         shared_memory_path,
         shared_file_path,
+        large_file_paths: default_client_large_file_paths(
+            &instance_key,
+            &contribute_to_cluster_pool_size,
+        ),
         // Mirror round intent into the generated config so logs and runtime behavior
         // agree on whether this launch is transfer_only vs transfer_with_rpc.
         test_spec_config: kv_test_round_test_spec_config(round.round_profile),
diff --git a/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py b/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py
index c06c033..95d5764 100644
--- a/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py
+++ b/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py
@@ -107,6 +107,63 @@ def fake_run_python_file(description: str, path: str, extra_args=()):
                 ],
             )
 
+    def test_main_strips_passthrough_case_config_before_delegating(self) -> None:
+        with tempfile.TemporaryDirectory() as td:
+            run_dir = Path(td)
+            cfg_dir = run_dir / "configs"
+            cfg_dir.mkdir(parents=True)
+            case_cfg = cfg_dir / "ci_scene_config.yaml"
+            case_cfg.write_text(
+                yaml.safe_dump(
+                    {
+                        "case": {
+                            "scene_id": "ci_top_attention_log_mgmt",
+                            "scale_id": "n1_kvowner_dram_20gib",
+                            "profile_id": "fluxon_tcp_thread",
+                            "case_id": "ci_top_attention_log_mgmt__n1_kvowner_dram_20gib__fluxon_tcp_thread",
+                        },
+                        "scene_config": {"enabled": True},
+                        "scene_runtime": {
+                            "etcd": {"ip": "127.0.0.1", "port": 19180},
+                            "greptime": {"ip": "127.0.0.1", "port": 19190},
+                        },
+                    },
+                    sort_keys=False,
+                ),
+                encoding="utf-8",
+            )
+
+            python_calls: list[tuple[str, tuple[str, ...]]] = []
+
+            def fake_run_python_file(description: str, path: str, extra_args=()):
+                del description
+                python_calls.append((path, tuple(extra_args)))
+                return 0
+
+            with mock.patch.object(_ENTRY, "run_python_file", side_effect=fake_run_python_file):
+                with mock.patch.object(_ENTRY, "run_cargo", return_value=0) as run_cargo:
+                    with mock.patch.object(
+                        sys,
+                        "argv",
+                        [
+                            str(MODULE_PATH),
+                            "--case-config",
+                            str(case_cfg),
+                            "--",
+                            "--case-config",
+                            str(case_cfg),
+                            "--nocapture",
+                        ],
+                    ):
+                        rc = _ENTRY.main()
+
+            self.assertEqual(rc, 0)
+            self.assertEqual(
+                python_calls[0],
+                ("deployment/tests/test_log_shard.py", ("--", "--nocapture")),
+            )
+            self.assertNotIn("--case-config", run_cargo.call_args.args[0])
+
 
 if __name__ == "__main__":
     raise SystemExit(unittest.main())
diff --git a/fluxon_test_stack/top_attention_test_index/_common.py b/fluxon_test_stack/top_attention_test_index/_common.py
index 3991aa7..c852b43 100755
--- a/fluxon_test_stack/top_attention_test_index/_common.py
+++ b/fluxon_test_stack/top_attention_test_index/_common.py
@@ -32,6 +32,22 @@ def parse_python_passthrough(description: str) -> tuple[str, list[str]]:
     return args.python, passthrough
 
 
+def strip_passthrough_case_config(passthrough: Sequence[str]) -> list[str]:
+    out: list[str] = []
+    idx = 0
+    while idx < len(passthrough):
+        token = passthrough[idx]
+        if token == "--case-config":
+            idx += 2
+            continue
+        if token.startswith("--case-config="):
+            idx += 1
+            continue
+        out.append(token)
+        idx += 1
+    return out
+
+
 def run_pytest(description: str, paths: Iterable[str]) -> int:
     python, passthrough = parse_python_passthrough(description)
     return call([python, "-m", "pytest", *paths, *passthrough])
diff --git a/fluxon_test_stack/top_attention_test_index/_log_mgmt.py b/fluxon_test_stack/top_attention_test_index/_log_mgmt.py
index e3547ab..3d5ed97 100644
--- a/fluxon_test_stack/top_attention_test_index/_log_mgmt.py
+++ b/fluxon_test_stack/top_attention_test_index/_log_mgmt.py
@@ -3,7 +3,13 @@
 
 import argparse
 
-from _common import REPO_ROOT, load_case_config, run_cargo, run_python_file
+from _common import (
+    REPO_ROOT,
+    load_case_config,
+    run_cargo,
+    run_python_file,
+    strip_passthrough_case_config,
+)
 
 
 TEST_REQUIREMENTS = ["cargo", "etcd", "ops", "submodules"]
@@ -21,11 +27,12 @@ def main() -> int:
     args, passthrough = parser.parse_known_args()
     if args.case_config:
         _ = load_case_config(args.case_config, expected_scene_id=SCENE_ID)
+    child_passthrough = tuple(strip_passthrough_case_config(passthrough))
 
     rc = run_python_file(
         "Flat index entry for ops/shared-supervisor log shard helper coverage.",
         "deployment/tests/test_log_shard.py",
-        extra_args=tuple(passthrough),
+        extra_args=child_passthrough,
     )
     if rc != 0:
         return rc
@@ -36,7 +43,7 @@ def main() -> int:
         rc = run_python_file(
             "Flat index entry for ops/shared-supervisor log routing coverage.",
             "deployment/tests/test_selection_supervisor_codegen.py",
-            extra_args=("--test-id", test_id, *passthrough),
+            extra_args=("--test-id", test_id, *child_passthrough),
         )
         if rc != 0:
             return rc
@@ -46,7 +53,7 @@ def main() -> int:
         str(REPO_ROOT / "fluxon_rs" / "fluxon_util" / "Cargo.toml"),
         "--test",
         "log_mgmt",
-        *passthrough,
+        *child_passthrough,
     ])
 
 

From 65cab1e6406021150144caf9e6fb2b3e93a007da Mon Sep 17 00:00:00 2001
From: ActivePeter <1020401660@qq.com>
Date: Tue, 23 Jun 2026 09:28:26 +0800
Subject: [PATCH 04/13] test

---
 .../test_top_attention_log_mgmt_contract.py   | 102 +++++++++++-------
 .../top_attention_test_index/_common.py       |  34 ++++--
 .../top_attention_test_index/_log_mgmt.py     |   8 +-
 3 files changed, 92 insertions(+), 52 deletions(-)

diff --git a/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py b/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py
index 95d5764..9f715cb 100644
--- a/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py
+++ b/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py
@@ -14,6 +14,7 @@
 
 REPO_ROOT = Path(__file__).resolve().parents[2]
 MODULE_PATH = REPO_ROOT / "fluxon_test_stack" / "top_attention_test_index" / "_log_mgmt.py"
+COMMON_MODULE_PATH = REPO_ROOT / "fluxon_test_stack" / "top_attention_test_index" / "_common.py"
 
 
 def _load_module():
@@ -34,6 +35,24 @@ def _load_module():
 _ENTRY = _load_module()
 
 
+def _load_common_module():
+    module_dir = COMMON_MODULE_PATH.parent
+    sys.path.insert(0, str(module_dir))
+    try:
+        spec = importlib.util.spec_from_file_location("fluxon_test_stack_top_attention_common_contract", COMMON_MODULE_PATH)
+        assert spec is not None and spec.loader is not None
+        mod = importlib.util.module_from_spec(spec)
+        sys.modules[spec.name] = mod
+        spec.loader.exec_module(mod)
+        return mod
+    finally:
+        if sys.path and sys.path[0] == str(module_dir):
+            sys.path.pop(0)
+
+
+_COMMON = _load_common_module()
+
+
 class TestTopAttentionLogMgmtContract(unittest.TestCase):
     def test_main_accepts_case_config_and_runs_canonical_tests(self) -> None:
         with tempfile.TemporaryDirectory() as td:
@@ -75,7 +94,7 @@ def fake_run_python_file(description: str, path: str, extra_args=()):
                     with mock.patch.object(
                         sys,
                         "argv",
-                        [str(MODULE_PATH), "--case-config", str(case_cfg), "--", "--nocapture"],
+                        [str(MODULE_PATH), "--case-config", str(case_cfg)],
                     ):
                         rc = _ENTRY.main()
 
@@ -83,14 +102,14 @@ def fake_run_python_file(description: str, path: str, extra_args=()):
             self.assertEqual(
                 python_calls,
                 [
-                    ("deployment/tests/test_log_shard.py", ("--", "--nocapture")),
+                    ("deployment/tests/test_log_shard.py", ()),
                     (
                         "deployment/tests/test_selection_supervisor_codegen.py",
-                        ("--test-id", "runtime_log_path_uses_daily_shard_files", "--", "--nocapture"),
+                        ("--test-id", "runtime_log_path_uses_daily_shard_files"),
                     ),
                     (
                         "deployment/tests/test_selection_supervisor_codegen.py",
-                        ("--test-id", "runtime_log_shards_roll_and_preserve_content_boundaries", "--", "--nocapture"),
+                        ("--test-id", "runtime_log_shards_roll_and_preserve_content_boundaries"),
                     ),
                 ],
             )
@@ -102,12 +121,10 @@ def fake_run_python_file(description: str, path: str, extra_args=()):
                     str(REPO_ROOT / "fluxon_rs" / "fluxon_util" / "Cargo.toml"),
                     "--test",
                     "log_mgmt",
-                    "--",
-                    "--nocapture",
                 ],
             )
 
-    def test_main_strips_passthrough_case_config_before_delegating(self) -> None:
+    def test_main_rejects_passthrough_args(self) -> None:
         with tempfile.TemporaryDirectory() as td:
             run_dir = Path(td)
             cfg_dir = run_dir / "configs"
@@ -133,36 +150,47 @@ def test_main_strips_passthrough_case_config_before_delegating(self) -> None:
                 encoding="utf-8",
             )
 
-            python_calls: list[tuple[str, tuple[str, ...]]] = []
-
-            def fake_run_python_file(description: str, path: str, extra_args=()):
-                del description
-                python_calls.append((path, tuple(extra_args)))
-                return 0
-
-            with mock.patch.object(_ENTRY, "run_python_file", side_effect=fake_run_python_file):
-                with mock.patch.object(_ENTRY, "run_cargo", return_value=0) as run_cargo:
-                    with mock.patch.object(
-                        sys,
-                        "argv",
-                        [
-                            str(MODULE_PATH),
-                            "--case-config",
-                            str(case_cfg),
-                            "--",
-                            "--case-config",
-                            str(case_cfg),
-                            "--nocapture",
-                        ],
-                    ):
-                        rc = _ENTRY.main()
-
-            self.assertEqual(rc, 0)
-            self.assertEqual(
-                python_calls[0],
-                ("deployment/tests/test_log_shard.py", ("--", "--nocapture")),
-            )
-            self.assertNotIn("--case-config", run_cargo.call_args.args[0])
+            with mock.patch.object(
+                sys,
+                "argv",
+                [
+                    str(MODULE_PATH),
+                    "--case-config",
+                    str(case_cfg),
+                    "--",
+                    "--nocapture",
+                ],
+            ):
+                with self.assertRaisesRegex(ValueError, "_log_mgmt does not accept passthrough args"):
+                    _ENTRY.main()
+
+    def test_run_python_file_does_not_forward_parent_passthrough(self) -> None:
+        with mock.patch.object(_COMMON, "call", return_value=0) as call_mock:
+            with mock.patch.object(
+                sys,
+                "argv",
+                [
+                    str(COMMON_MODULE_PATH),
+                    "--case-config",
+                    "/tmp/should_not_leak.yaml",
+                    "--",
+                    "--nocapture",
+                ],
+            ):
+                rc = _COMMON.run_python_file(
+                    "delegate test",
+                    "deployment/tests/test_log_shard.py",
+                )
+
+        self.assertEqual(rc, 0)
+        self.assertEqual(
+            call_mock.call_args.args[0],
+            [
+                sys.executable,
+                "-u",
+                str(REPO_ROOT / "deployment/tests/test_log_shard.py"),
+            ],
+        )
 
 
 if __name__ == "__main__":
diff --git a/fluxon_test_stack/top_attention_test_index/_common.py b/fluxon_test_stack/top_attention_test_index/_common.py
index c852b43..3bd9a4c 100755
--- a/fluxon_test_stack/top_attention_test_index/_common.py
+++ b/fluxon_test_stack/top_attention_test_index/_common.py
@@ -53,15 +53,22 @@ def run_pytest(description: str, paths: Iterable[str]) -> int:
     return call([python, "-m", "pytest", *paths, *passthrough])
 
 
-def run_python_file(description: str, path: str, extra_args: Iterable[str] = ()) -> int:
-    python, passthrough = parse_python_passthrough(description)
-    return call([python, "-u", str(REPO_ROOT / path), *extra_args, *passthrough])
-
-
-def run_python_files(description: str, paths: Iterable[str]) -> int:
-    python, passthrough = parse_python_passthrough(description)
+def run_python_file(
+    description: str,
+    path: str,
+    extra_args: Iterable[str] = (),
+) -> int:
+    python, _ = parse_python_passthrough(description)
+    return call([python, "-u", str(REPO_ROOT / path), *extra_args])
+
+
+def run_python_files(
+    description: str,
+    paths: Iterable[str],
+) -> int:
+    python, _ = parse_python_passthrough(description)
     for path in paths:
-        rc = call([python, "-u", str(REPO_ROOT / path), *passthrough])
+        rc = call([python, "-u", str(REPO_ROOT / path)])
         if rc != 0:
             return rc
     return 0
@@ -166,7 +173,14 @@ def _prepare_cargo_env(env: dict[str, str] | None) -> dict[str, str] | None:
     return prepared_env
 
 
-def run_cargo(args: Iterable[str], *, env: dict[str, str] | None = None) -> int:
+def run_cargo(
+    args: Iterable[str],
+    *,
+    env: dict[str, str] | None = None,
+    passthrough: Sequence[str] | None = None,
+) -> int:
     # Rust test binaries launched via cargo run/load depend on the wheel-bundled native
     # runtime under the active venv. Keep one authoritative search root for all wrappers.
-    return call(["cargo", *args], env=_prepare_cargo_env(env))
+    _, parsed_passthrough = parse_python_passthrough("cargo delegate")
+    effective_passthrough = parsed_passthrough if passthrough is None else list(passthrough)
+    return call(["cargo", *args, *effective_passthrough], env=_prepare_cargo_env(env))
diff --git a/fluxon_test_stack/top_attention_test_index/_log_mgmt.py b/fluxon_test_stack/top_attention_test_index/_log_mgmt.py
index 3d5ed97..9ef7cd5 100644
--- a/fluxon_test_stack/top_attention_test_index/_log_mgmt.py
+++ b/fluxon_test_stack/top_attention_test_index/_log_mgmt.py
@@ -8,7 +8,6 @@
     load_case_config,
     run_cargo,
     run_python_file,
-    strip_passthrough_case_config,
 )
 
 
@@ -27,12 +26,12 @@ def main() -> int:
     args, passthrough = parser.parse_known_args()
     if args.case_config:
         _ = load_case_config(args.case_config, expected_scene_id=SCENE_ID)
-    child_passthrough = tuple(strip_passthrough_case_config(passthrough))
+    if passthrough:
+        raise ValueError(f"_log_mgmt does not accept passthrough args: {tuple(passthrough)!r}")
 
     rc = run_python_file(
         "Flat index entry for ops/shared-supervisor log shard helper coverage.",
         "deployment/tests/test_log_shard.py",
-        extra_args=child_passthrough,
     )
     if rc != 0:
         return rc
@@ -43,7 +42,7 @@ def main() -> int:
         rc = run_python_file(
             "Flat index entry for ops/shared-supervisor log routing coverage.",
             "deployment/tests/test_selection_supervisor_codegen.py",
-            extra_args=("--test-id", test_id, *child_passthrough),
+            extra_args=("--test-id", test_id),
         )
         if rc != 0:
             return rc
@@ -53,7 +52,6 @@ def main() -> int:
         str(REPO_ROOT / "fluxon_rs" / "fluxon_util" / "Cargo.toml"),
         "--test",
         "log_mgmt",
-        *child_passthrough,
     ])
 
 

From 13bdf28e7a2f0579cbf35d172ad567eccf86da35 Mon Sep 17 00:00:00 2001
From: ActivePeter <1020401660@qq.com>
Date: Tue, 23 Jun 2026 11:21:35 +0800
Subject: [PATCH 05/13] test

---
 .../test_top_attention_log_mgmt_contract.py   | 36 +++++++++++++++++++
 .../top_attention_test_index/_common.py       | 19 +---------
 2 files changed, 37 insertions(+), 18 deletions(-)

diff --git a/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py b/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py
index 9f715cb..c9d6ba0 100644
--- a/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py
+++ b/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py
@@ -192,6 +192,42 @@ def test_run_python_file_does_not_forward_parent_passthrough(self) -> None:
             ],
         )
 
+    def test_run_cargo_does_not_forward_parent_passthrough(self) -> None:
+        with mock.patch.object(_COMMON, "call", return_value=0) as call_mock:
+            with mock.patch.object(
+                sys,
+                "argv",
+                [
+                    str(COMMON_MODULE_PATH),
+                    "--case-config",
+                    "/tmp/should_not_leak.yaml",
+                    "--",
+                    "--nocapture",
+                ],
+            ):
+                rc = _COMMON.run_cargo(
+                    [
+                        "test",
+                        "--manifest-path",
+                        str(REPO_ROOT / "fluxon_rs" / "fluxon_util" / "Cargo.toml"),
+                        "--test",
+                        "log_mgmt",
+                    ],
+                )
+
+        self.assertEqual(rc, 0)
+        self.assertEqual(
+            call_mock.call_args.args[0],
+            [
+                "cargo",
+                "test",
+                "--manifest-path",
+                str(REPO_ROOT / "fluxon_rs" / "fluxon_util" / "Cargo.toml"),
+                "--test",
+                "log_mgmt",
+            ],
+        )
+
 
 if __name__ == "__main__":
     raise SystemExit(unittest.main())
diff --git a/fluxon_test_stack/top_attention_test_index/_common.py b/fluxon_test_stack/top_attention_test_index/_common.py
index 3bd9a4c..4fcfaa7 100755
--- a/fluxon_test_stack/top_attention_test_index/_common.py
+++ b/fluxon_test_stack/top_attention_test_index/_common.py
@@ -32,22 +32,6 @@ def parse_python_passthrough(description: str) -> tuple[str, list[str]]:
     return args.python, passthrough
 
 
-def strip_passthrough_case_config(passthrough: Sequence[str]) -> list[str]:
-    out: list[str] = []
-    idx = 0
-    while idx < len(passthrough):
-        token = passthrough[idx]
-        if token == "--case-config":
-            idx += 2
-            continue
-        if token.startswith("--case-config="):
-            idx += 1
-            continue
-        out.append(token)
-        idx += 1
-    return out
-
-
 def run_pytest(description: str, paths: Iterable[str]) -> int:
     python, passthrough = parse_python_passthrough(description)
     return call([python, "-m", "pytest", *paths, *passthrough])
@@ -181,6 +165,5 @@ def run_cargo(
 ) -> int:
     # Rust test binaries launched via cargo run/load depend on the wheel-bundled native
     # runtime under the active venv. Keep one authoritative search root for all wrappers.
-    _, parsed_passthrough = parse_python_passthrough("cargo delegate")
-    effective_passthrough = parsed_passthrough if passthrough is None else list(passthrough)
+    effective_passthrough = [] if passthrough is None else list(passthrough)
     return call(["cargo", *args, *effective_passthrough], env=_prepare_cargo_env(env))

From 48cb22bc0010d8feec0b5aedeff0052b11122de4 Mon Sep 17 00:00:00 2001
From: ActivePeter <1020401660@qq.com>
Date: Tue, 23 Jun 2026 14:52:58 +0800
Subject: [PATCH 06/13] test

---
 .../test_selection_supervisor_codegen.py      | 11 +++++--
 .../test_top_attention_log_mgmt_contract.py   | 30 +++++++++++++++++++
 .../top_attention_test_index/_common.py       | 12 ++++++--
 3 files changed, 47 insertions(+), 6 deletions(-)

diff --git a/deployment/tests/test_selection_supervisor_codegen.py b/deployment/tests/test_selection_supervisor_codegen.py
index a00caa9..adc82a9 100644
--- a/deployment/tests/test_selection_supervisor_codegen.py
+++ b/deployment/tests/test_selection_supervisor_codegen.py
@@ -712,20 +712,25 @@ def test_runtime_log_shards_roll_and_preserve_content_boundaries() -> None:
         try:
             _wait_until_present(module, label)
             first_shard = root / "test-log-roll.2026-01-01.log"
-            second_shard = root / "test-log-roll.2026-01-02.log"
+            second_shard = None
             deadline = time.time() + 20.0
             while time.time() < deadline:
-                if first_shard.exists() and second_shard.exists():
+                shard_paths = sorted(root.glob("test-log-roll.*.log"))
+                if len(shard_paths) >= 2:
+                    second_shard = shard_paths[-1]
+                if first_shard.exists() and second_shard is not None and second_shard.exists():
                     first_text = first_shard.read_text(encoding="utf-8", errors="replace")
                     second_text = second_shard.read_text(encoding="utf-8", errors="replace")
                     if "[ops-log-mgmt][phase=before]" in first_text and "[ops-log-mgmt][phase=after]" in second_text:
                         break
                 time.sleep(0.2)
             assert first_shard.exists(), first_shard
+            assert second_shard is not None, sorted(path.name for path in root.glob("test-log-roll.*.log"))
             assert second_shard.exists(), second_shard
             assert not stale_shard.exists(), stale_shard
             shard_names = sorted(path.name for path in root.glob("test-log-roll.*.log"))
-            assert shard_names == ["test-log-roll.2026-01-01.log", "test-log-roll.2026-01-02.log"], shard_names
+            assert shard_names[0] == "test-log-roll.2026-01-01.log", shard_names
+            assert len(shard_names) == 2, shard_names
             first_text = first_shard.read_text(encoding="utf-8", errors="replace")
             second_text = second_shard.read_text(encoding="utf-8", errors="replace")
             assert "[ops-log-mgmt][phase=before]" in first_text, first_text
diff --git a/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py b/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py
index c9d6ba0..2b92fd0 100644
--- a/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py
+++ b/fluxon_test_stack/tests/test_top_attention_log_mgmt_contract.py
@@ -192,6 +192,36 @@ def test_run_python_file_does_not_forward_parent_passthrough(self) -> None:
             ],
         )
 
+    def test_run_pytest_does_not_forward_parent_passthrough(self) -> None:
+        with mock.patch.object(_COMMON, "call", return_value=0) as call_mock:
+            with mock.patch.object(
+                sys,
+                "argv",
+                [
+                    str(COMMON_MODULE_PATH),
+                    "--case-config",
+                    "/tmp/should_not_leak.yaml",
+                    "--",
+                    "-k",
+                    "smoke",
+                ],
+            ):
+                rc = _COMMON.run_pytest(
+                    "delegate pytest",
+                    ["fluxon_test_stack/tests/test_top_attention_bin_kvtest_contract.py"],
+                )
+
+        self.assertEqual(rc, 0)
+        self.assertEqual(
+            call_mock.call_args.args[0],
+            [
+                sys.executable,
+                "-m",
+                "pytest",
+                "fluxon_test_stack/tests/test_top_attention_bin_kvtest_contract.py",
+            ],
+        )
+
     def test_run_cargo_does_not_forward_parent_passthrough(self) -> None:
         with mock.patch.object(_COMMON, "call", return_value=0) as call_mock:
             with mock.patch.object(
diff --git a/fluxon_test_stack/top_attention_test_index/_common.py b/fluxon_test_stack/top_attention_test_index/_common.py
index 4fcfaa7..c890584 100755
--- a/fluxon_test_stack/top_attention_test_index/_common.py
+++ b/fluxon_test_stack/top_attention_test_index/_common.py
@@ -32,9 +32,15 @@ def parse_python_passthrough(description: str) -> tuple[str, list[str]]:
     return args.python, passthrough
 
 
-def run_pytest(description: str, paths: Iterable[str]) -> int:
-    python, passthrough = parse_python_passthrough(description)
-    return call([python, "-m", "pytest", *paths, *passthrough])
+def run_pytest(
+    description: str,
+    paths: Iterable[str],
+    *,
+    passthrough: Sequence[str] | None = None,
+) -> int:
+    python, _ = parse_python_passthrough(description)
+    effective_passthrough = [] if passthrough is None else list(passthrough)
+    return call([python, "-m", "pytest", *paths, *effective_passthrough])
 
 
 def run_python_file(

From 5b36a1f9a4a0884674301872245fa0d64f79d9de Mon Sep 17 00:00:00 2001
From: ActivePeter <1020401660@qq.com>
Date: Tue, 23 Jun 2026 16:44:03 +0800
Subject: [PATCH 07/13] fix quick start; simplify tcp

---
 .../atomic_group_service_block.sh.tmpl        |   4 +-
 .../etcd_health_wait_block.sh.tmpl            |   4 -
 .../standalone_start_body.sh.tmpl             |   4 +-
 .../tcp_ready_helpers.sh.tmpl                 | 120 ------------------
 .../tcp_ready_wait_block.sh.tmpl              |   6 -
 deployment/tests/test_gen_bare_deploy_bash.py | 111 ++++++++++++++--
 deployment/utils/proc_lifecycle_codegen.py    |  70 ++++++++--
 examples/fluxon_quick_start/start.py          |  10 ++
 ...15\347\275\256\346\200\273\350\247\210.md" |  60 ++++++++-
 .../tests/test_quick_start_release_only.py    |  38 ++++++
 10 files changed, 264 insertions(+), 163 deletions(-)
 delete mode 100644 deployment/templates/gen_bare_deploy_bash/etcd_health_wait_block.sh.tmpl
 delete mode 100644 deployment/templates/gen_bare_deploy_bash/tcp_ready_helpers.sh.tmpl
 delete mode 100644 deployment/templates/gen_bare_deploy_bash/tcp_ready_wait_block.sh.tmpl

diff --git a/deployment/templates/gen_bare_deploy_bash/atomic_group_service_block.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/atomic_group_service_block.sh.tmpl
index 6ad9a1a..25da0dd 100644
--- a/deployment/templates/gen_bare_deploy_bash/atomic_group_service_block.sh.tmpl
+++ b/deployment/templates/gen_bare_deploy_bash/atomic_group_service_block.sh.tmpl
@@ -16,8 +16,8 @@ else
   LOGFILE="{{LOGFILE_PATH}}"
   echo "[rollout] start {{SERVICE_NAME}} node=$NODE_ID hostworkdir=$HOSTWORKDIR"
   # English note:
-  # - Atomic-group order still depends on a readiness gate, but that gate now observes only the
-  #   detached supervisor process subtree on this host.
+  # - Atomic-group order still depends on a startup gate, but that gate now checks only whether
+  #   one supervised child PID stays alive without restart on this host.
   # - Ownership stays inside the shared selection supervisor big loop; the group runner only waits
   #   through the fixed startup observation window before advancing to the next service.
 {{INDENTED_SELECTION_SUPERVISOR_LAUNCH_WAIT_BLOCK}}
diff --git a/deployment/templates/gen_bare_deploy_bash/etcd_health_wait_block.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/etcd_health_wait_block.sh.tmpl
deleted file mode 100644
index b424bc3..0000000
--- a/deployment/templates/gen_bare_deploy_bash/etcd_health_wait_block.sh.tmpl
+++ /dev/null
@@ -1,4 +0,0 @@
-if ! wait_service_etcd_endpoint_healthy "$SERVICE" "$HOSTWORKDIR/fluxon_release/ext_images/etcd/etcdctl" "http://$HOST_IP:$SERVICE_PORT" {{ETCD_HEALTH_STABLE_SECONDS}} {{ETCD_HEALTH_DEADLINE_TS}} "{{CONTEXT}}"; then
-  echo "{{CONTEXT}} etcd-health failed svc=$SERVICE endpoint=http://$HOST_IP:$SERVICE_PORT"
-  exit 1
-fi
diff --git a/deployment/templates/gen_bare_deploy_bash/standalone_start_body.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/standalone_start_body.sh.tmpl
index bc2fc40..b58d3de 100644
--- a/deployment/templates/gen_bare_deploy_bash/standalone_start_body.sh.tmpl
+++ b/deployment/templates/gen_bare_deploy_bash/standalone_start_body.sh.tmpl
@@ -21,7 +21,7 @@ fi
 # English note:
 # - Bare start must not depend on extra supervisor observation subcommands because the shared
 #   runtime surface is intentionally reduced to run/stop.
-# - We therefore launch the detached supervisor and wait until its pid subtree keeps a live child
-#   process alive across the fixed startup observation window.
+# - We therefore launch the detached supervisor and wait until one supervised child PID stays
+#   alive without restart across the fixed startup observation window.
 {{SELECTION_SUPERVISOR_LAUNCH_WAIT_BLOCK}}echo "Started $SERVICE (label: $SUPERVISOR_LABEL)"
 echo "Logs: $LOGFILE"
diff --git a/deployment/templates/gen_bare_deploy_bash/tcp_ready_helpers.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/tcp_ready_helpers.sh.tmpl
deleted file mode 100644
index 0c0cc3b..0000000
--- a/deployment/templates/gen_bare_deploy_bash/tcp_ready_helpers.sh.tmpl
+++ /dev/null
@@ -1,120 +0,0 @@
-wait_service_tcp_ready() {
-  svc="$1"
-  host="$2"
-  port="$3"
-  stable_seconds="$4"
-  deadline_ts="$5"
-  context="$6"
-  if [[ ! "$port" =~ ^[0-9]+$ ]]; then
-    echo "$context tcp-ready: invalid port svc=$svc port=$port"
-    return 1
-  fi
-  if [[ ! "$stable_seconds" =~ ^[0-9]+$ ]] || [ "$stable_seconds" -le 0 ]; then
-    echo "$context tcp-ready: invalid stable_seconds svc=$svc stable_seconds=$stable_seconds"
-    return 1
-  fi
-  poll_interval_seconds={{TCP_READY_POLL_INTERVAL_SECONDS}}
-  stable_checks=$(python3 - "$stable_seconds" "$poll_interval_seconds" <<'__FLUXON_TCP_READY_CHECKS__'
-import math
-import sys
-stable_seconds = float(sys.argv[1])
-poll_interval_seconds = float(sys.argv[2])
-print(max(1, int(math.ceil(stable_seconds / poll_interval_seconds))))
-__FLUXON_TCP_READY_CHECKS__
-)
-  if [[ ! "$stable_checks" =~ ^[0-9]+$ ]] || [ "$stable_checks" -le 0 ]; then
-    echo "$context tcp-ready: failed to compute stable_checks svc=$svc"
-    return 1
-  fi
-  ok_checks=0
-  while true; do
-    now=$(date +%s)
-    if [ "$now" -ge "$deadline_ts" ]; then
-      echo "$context tcp-ready: deadline exceeded svc=$svc host=$host port=$port"
-      return 1
-    fi
-    if python3 - "$host" "$port" <<'__FLUXON_TCP_READY_PROBE__'
-import socket
-import sys
-host = sys.argv[1]
-port = int(sys.argv[2])
-with socket.create_connection((host, port), timeout=1.0):
-    pass
-__FLUXON_TCP_READY_PROBE__
-    then
-      ok_checks=$((ok_checks+1))
-      if [ "$ok_checks" -ge "$stable_checks" ]; then
-        echo "$context tcp-ready: ok svc=$svc host=$host port=$port stable_checks=$stable_checks"
-        return 0
-      fi
-    else
-      if [ "$ok_checks" -ne 0 ]; then
-        echo "$context tcp-ready: reset svc=$svc ok_checks=$ok_checks host=$host port=$port"
-      fi
-      ok_checks=0
-    fi
-    sleep "$poll_interval_seconds"
-  done
-}
-
-wait_service_etcd_endpoint_healthy() {
-  svc="$1"
-  etcdctl_bin="$2"
-  endpoint="$3"
-  stable_seconds="$4"
-  deadline_ts="$5"
-  context="$6"
-  if [ ! -x "$etcdctl_bin" ]; then
-    echo "$context etcd-health: missing etcdctl svc=$svc path=$etcdctl_bin"
-    return 1
-  fi
-  if [ -z "$endpoint" ]; then
-    echo "$context etcd-health: missing endpoint svc=$svc"
-    return 1
-  fi
-  if [[ ! "$stable_seconds" =~ ^[0-9]+$ ]] || [ "$stable_seconds" -le 0 ]; then
-    echo "$context etcd-health: invalid stable_seconds svc=$svc stable_seconds=$stable_seconds"
-    return 1
-  fi
-  poll_interval_seconds={{ETCD_HEALTH_POLL_INTERVAL_SECONDS}}
-  stable_checks=$(python3 - "$stable_seconds" "$poll_interval_seconds" <<'__FLUXON_ETCD_HEALTH_CHECKS__'
-import math
-import sys
-stable_seconds = float(sys.argv[1])
-poll_interval_seconds = float(sys.argv[2])
-print(max(1, int(math.ceil(stable_seconds / poll_interval_seconds))))
-__FLUXON_ETCD_HEALTH_CHECKS__
-)
-  if [[ ! "$stable_checks" =~ ^[0-9]+$ ]] || [ "$stable_checks" -le 0 ]; then
-    echo "$context etcd-health: failed to compute stable_checks svc=$svc"
-    return 1
-  fi
-  ok_checks=0
-  last_output=""
-  while true; do
-    now=$(date +%s)
-    if [ "$now" -ge "$deadline_ts" ]; then
-      if [ -n "$last_output" ]; then
-        last_output="${last_output//$'\n'/ }"
-        echo "$context etcd-health: deadline exceeded svc=$svc endpoint=$endpoint last_output=$last_output"
-      else
-        echo "$context etcd-health: deadline exceeded svc=$svc endpoint=$endpoint"
-      fi
-      return 1
-    fi
-    if probe_output=$(ETCDCTL_API=3 "$etcdctl_bin" --endpoints "$endpoint" --dial-timeout "{{ETCD_HEALTH_PROBE_TIMEOUT_MS}}ms" --command-timeout "{{ETCD_HEALTH_PROBE_TIMEOUT_MS}}ms" endpoint health 2>&1); then
-      ok_checks=$((ok_checks+1))
-      if [ "$ok_checks" -ge "$stable_checks" ]; then
-        echo "$context etcd-health: ok svc=$svc endpoint=$endpoint stable_checks=$stable_checks"
-        return 0
-      fi
-    else
-      last_output="$probe_output"
-      if [ "$ok_checks" -ne 0 ]; then
-        echo "$context etcd-health: reset svc=$svc ok_checks=$ok_checks endpoint=$endpoint"
-      fi
-      ok_checks=0
-    fi
-    sleep "$poll_interval_seconds"
-  done
-}
diff --git a/deployment/templates/gen_bare_deploy_bash/tcp_ready_wait_block.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/tcp_ready_wait_block.sh.tmpl
deleted file mode 100644
index bbf021b..0000000
--- a/deployment/templates/gen_bare_deploy_bash/tcp_ready_wait_block.sh.tmpl
+++ /dev/null
@@ -1,6 +0,0 @@
-if [[ "${SERVICE_PORT:-}" =~ ^[0-9]+$ ]]; then
-  if ! wait_service_tcp_ready "$SERVICE" "$HOST_IP" "$SERVICE_PORT" {{TCP_READY_STABLE_SECONDS}} {{TCP_READY_DEADLINE_TS}} "{{CONTEXT}}"; then
-    echo "{{CONTEXT}} tcp-ready failed svc=$SERVICE host=$HOST_IP port=$SERVICE_PORT"
-    exit 1
-  fi
-fi
diff --git a/deployment/tests/test_gen_bare_deploy_bash.py b/deployment/tests/test_gen_bare_deploy_bash.py
index f1645a3..9f392ed 100644
--- a/deployment/tests/test_gen_bare_deploy_bash.py
+++ b/deployment/tests/test_gen_bare_deploy_bash.py
@@ -61,6 +61,7 @@ def _build_checks(selected_test_id: Optional[str]) -> List[Tuple[str, Callable[[
         ("bare_child_command_preserves_runtime_hostworkdir_expansion", test_bare_child_command_preserves_runtime_hostworkdir_expansion),
         ("supervisor_label_uses_stable_selection_suffix", test_supervisor_label_uses_stable_selection_suffix),
         ("bootstrap_start_reuses_already_present_selection", test_bootstrap_start_reuses_already_present_selection),
+        ("bare_start_fails_when_child_exits_within_startup_window", test_bare_start_fails_when_child_exits_within_startup_window),
         ("atomic_group_start_does_not_auto_stop_on_failure", test_atomic_group_start_does_not_auto_stop_on_failure),
         ("atomic_group_preserves_nested_heredoc_terminator", test_atomic_group_preserves_nested_heredoc_terminator),
         ("atomic_group_stop_script_is_shell_valid", test_atomic_group_stop_script_is_shell_valid),
@@ -577,7 +578,7 @@ def _handle_signal(_signum, _frame):
             assert first.returncode == 0, (
                 f"first start failed rc={first.returncode} stdout={first.stdout!r} stderr={first.stderr!r}"
             )
-            _wait_until_selection_present(supervisor_module, label=label)
+            _wait_until_selection_present(supervisor_module, label=label, scope_key=str(hostworkdir))
 
             second_env = base_env.copy()
             second_env["FLUXON_BARE_ALLOW_ALREADY_PRESENT"] = "true"
@@ -594,7 +595,7 @@ def _handle_signal(_signum, _frame):
                 f"reuse start failed rc={second.returncode} stdout={second.stdout!r} stderr={second.stderr!r}"
             )
             assert "[bare] already present svc=svc_plain" in second.stdout, second.stdout
-            live_supervisors = supervisor_module._iter_live_supervisors(label)
+            live_supervisors = supervisor_module._iter_live_supervisors(label, scope_key=str(hostworkdir))
             assert len(live_supervisors) == 1, live_supervisors
         finally:
             subprocess.run(
@@ -606,10 +607,90 @@ def _handle_signal(_signum, _frame):
                 env=base_env,
                 timeout=20,
             )
-            _wait_until_selection_absent(supervisor_module, label=label)
+            _wait_until_selection_absent(supervisor_module, label=label, scope_key=str(hostworkdir))
         print("PASS: test_bootstrap_start_reuses_already_present_selection")
 
 
+def test_bare_start_fails_when_child_exits_within_startup_window() -> None:
+    with tempfile.TemporaryDirectory(prefix="test_gen_bare_deploy_bash_child_exit_") as td:
+        tmpdir = Path(td)
+        hostworkdir = tmpdir / "hostworkdir"
+        outdir = hostworkdir / "gen_bare_deploy_bash"
+        config_path = tmpdir / "deployconf.yaml"
+        hostworkdir.mkdir(parents=True, exist_ok=True)
+        (hostworkdir / "exit_after_delay.py").write_text(
+            textwrap.dedent(
+                """
+                #!/usr/bin/env python3
+                import time
+
+                time.sleep(1.5)
+                raise SystemExit(17)
+                """
+            ).strip()
+            + "\n",
+            encoding="utf-8",
+        )
+        config_path.write_text(
+            textwrap.dedent(
+                f"""
+                name_prefix: fluxon-testbed
+                cluster_nodes:
+                  - hostname: node-a
+                    ip: 127.0.0.1
+                    hostworkdir: {hostworkdir}
+                service:
+                  svc_plain:
+                    entrypoint: |
+                      exec python3 "${{HOSTWORKDIR}}/exit_after_delay.py"
+                    node_bind:
+                      node: ["node-a"]
+                """
+            ).strip()
+            + "\n",
+            encoding="utf-8",
+        )
+
+        result = _run_generator(config_path=config_path, outdir=outdir)
+        assert result.returncode == 0, f"generator failed: stdout={result.stdout} stderr={result.stderr}"
+
+        start_script = outdir / "start_svc_plain.sh"
+        stop_script = outdir / "stop_svc_plain.sh"
+        supervisor_module = _load_generated_supervisor_module(outdir / "selection_supervisor.py")
+        label = "DaemonSet/fluxon-testbed-svc_plain"
+        repo_root = DEPLOYMENT_DIR.parent
+        env = os.environ.copy()
+        env["NODE_ID"] = "node-a"
+
+        try:
+            start = subprocess.run(
+                [str(start_script)],
+                check=False,
+                capture_output=True,
+                text=True,
+                cwd=str(repo_root),
+                env=env,
+                timeout=20,
+            )
+            assert start.returncode != 0, (
+                f"expected startup gate failure rc={start.returncode} stdout={start.stdout!r} stderr={start.stderr!r}"
+            )
+            assert "[bare] probable-ready failed svc=svc_plain" in start.stdout, start.stdout
+            assert "child pid exited" in start.stdout or "child pid changed" in start.stdout, start.stdout
+        finally:
+            subprocess.run(
+                [str(stop_script)],
+                check=False,
+                capture_output=True,
+                text=True,
+                cwd=str(repo_root),
+                env=env,
+                timeout=20,
+            )
+            _wait_until_selection_absent(supervisor_module, label=label, scope_key=str(hostworkdir))
+        print("PASS: test_bare_start_fails_when_child_exits_within_startup_window")
+
+
 def test_atomic_group_preserves_nested_heredoc_terminator() -> None:
     with tempfile.TemporaryDirectory(prefix="test_gen_bare_deploy_bash_atomic_heredoc_") as td:
         tmpdir = Path(td)
@@ -749,22 +830,34 @@ def _load_python_module(*, module_name: str, path: Path):
     return module
 
 
-def _wait_until_selection_present(module, *, label: str, timeout_seconds: int = 15) -> None:
+def _wait_until_selection_present(
+    module,
+    *,
+    label: str,
+    scope_key: Optional[str] = None,
+    timeout_seconds: int = 15,
+) -> None:
     deadline = time.time() + timeout_seconds
     while time.time() < deadline:
-        if module._selection_present(label):
+        if module._selection_present(label, scope_key=scope_key):
             return
         time.sleep(0.2)
-    raise RuntimeError(f"timeout waiting selection present: label={label}")
+    raise RuntimeError(f"timeout waiting selection present: label={label} scope_key={scope_key}")
 
 
-def _wait_until_selection_absent(module, *, label: str, timeout_seconds: int = 15) -> None:
+def _wait_until_selection_absent(
+    module,
+    *,
+    label: str,
+    scope_key: Optional[str] = None,
+    timeout_seconds: int = 15,
+) -> None:
     deadline = time.time() + timeout_seconds
     while time.time() < deadline:
-        if not module._iter_live_supervisors(label):
+        if not module._iter_live_supervisors(label, scope_key=scope_key):
             return
         time.sleep(0.2)
-    raise RuntimeError(f"timeout waiting selection absent: label={label}")
+    raise RuntimeError(f"timeout waiting selection absent: label={label} scope_key={scope_key}")
 
 
 if __name__ == "__main__":
diff --git a/deployment/utils/proc_lifecycle_codegen.py b/deployment/utils/proc_lifecycle_codegen.py
index 116b0c4..b0acd71 100644
--- a/deployment/utils/proc_lifecycle_codegen.py
+++ b/deployment/utils/proc_lifecycle_codegen.py
@@ -135,26 +135,42 @@ def render_bash_proc_lifecycle_funcs_pid_tree(*, timeouts: StopTimeouts) -> str:
   '
 }}
 
-_pid_tree_has_child_process() {{
+_pid_tree_direct_child_pids() {{
   root_pid="$1"
-  pids="$(_pid_tree_list "$root_pid" 2>/dev/null || true)"
-  if [ -z "$pids" ]; then
+  if [[ ! "$root_pid" =~ ^[0-9]+$ ]]; then
     return 1
   fi
-  # More than one PID means the supervisor has a live child process.
-  set -- $pids
-  if [ "$#" -ge 2 ]; then
-    return 0
+  if ! _pid_exists "$root_pid"; then
+    return 1
   fi
-  return 1
+
+  ps -eo pid=,ppid=,stat= 2>/dev/null | awk -v root="$root_pid" '
+    {{
+      pid=$1;
+      ppid=$2;
+      state=$3;
+      if (ppid != root) {{
+        next;
+      }}
+      if (state ~ /^Z/) {{
+        next;
+      }}
+      out=out " " pid;
+    }}
+    END {{
+      sub(/^ /, "", out);
+      print out;
+    }}
+  '
 }}
 
 wait_service_probably_ready_pid_tree() {{
   # Startup gate contract:
-  # - Success means the supervisor PID stays alive across the fixed startup window.
+  # - Success means one supervised direct child PID becomes visible and stays unchanged across the
+  #   fixed startup window.
   # - During this startup window we do not probe service ports or readiness endpoints.
-  # - We intentionally do not require the child to expose ports, endpoints, or even finish
-  #   spawning before the window ends.
+  # - A child exit or restart inside the window is treated as startup failure even if the
+  #   supervisor process itself stays alive and restarts again later.
   svc="$1"
   root_pid="$2"
   startup_window_seconds="$3"
@@ -170,19 +186,47 @@ def render_bash_proc_lifecycle_funcs_pid_tree(*, timeouts: StopTimeouts) -> str:
     return 1
   fi
 
+  observed_child_pid=""
   while true; do
     if ! _pid_exists "$root_pid"; then
       echo "$context probable-ready: supervisor pid exited svc=$svc pid=$root_pid"
       return 1
     fi
 
+    current_child_pids="$(_pid_tree_direct_child_pids "$root_pid" 2>/dev/null || true)"
+    current_child_pid=""
+    if [ -n "$current_child_pids" ]; then
+      set -- $current_child_pids
+      if [ "$#" -ne 1 ]; then
+        echo "$context probable-ready: multiple direct child pids svc=$svc supervisor_pid=$root_pid child_pids=$current_child_pids"
+        return 1
+      fi
+      current_child_pid="$1"
+    fi
+
+    if [ -z "$current_child_pid" ]; then
+      if [ -n "$observed_child_pid" ]; then
+        echo "$context probable-ready: child pid exited svc=$svc supervisor_pid=$root_pid child_pid=$observed_child_pid"
+        return 1
+      fi
+    elif [ -z "$observed_child_pid" ]; then
+      observed_child_pid="$current_child_pid"
+    elif [ "$current_child_pid" != "$observed_child_pid" ]; then
+      echo "$context probable-ready: child pid changed svc=$svc supervisor_pid=$root_pid child_pid=$observed_child_pid replacement_child_pid=$current_child_pid"
+      return 1
+    fi
+
     now=$(date +%s)
     if [ "$now" -ge "$deadline_ts" ]; then
-      echo "$context probable-ready: ok svc=$svc startup_window_seconds=$startup_window_seconds pid=$root_pid"
+      if [ -z "$observed_child_pid" ]; then
+        echo "$context probable-ready: no child pid observed svc=$svc supervisor_pid=$root_pid startup_window_seconds=$startup_window_seconds"
+        return 1
+      fi
+      echo "$context probable-ready: ok svc=$svc startup_window_seconds=$startup_window_seconds supervisor_pid=$root_pid child_pid=$observed_child_pid"
       return 0
     fi
 
-    sleep 1
+    sleep 0.2
   done
 }}
 
diff --git a/examples/fluxon_quick_start/start.py b/examples/fluxon_quick_start/start.py
index 17fd8c2..c051598 100644
--- a/examples/fluxon_quick_start/start.py
+++ b/examples/fluxon_quick_start/start.py
@@ -528,6 +528,13 @@ def _monitoring_block(greptime_http_port: int) -> Dict[str, Any]:
     }
 
 
+def _owner_large_file_paths(workdir: Path) -> Dict[str, str]:
+    return {
+        "log_root_path": str(workdir / "large" / "log" / "owner"),
+        "cache_root_path": str(workdir / "large" / "cache" / "owner"),
+    }
+
+
 def _gen_kv_config(etcd_ep: str, cluster: str, master_port: int, kv_http_port: int,
                     panel_port: int, greptime_http_port: int, workdir: Path) -> Dict[str, Any]:
     shm = str(workdir / "sharemem")
@@ -554,6 +561,7 @@ def _gen_kv_config(etcd_ep: str, cluster: str, master_port: int, kv_http_port: i
                 "shared_memory_path": shm,
                 "shared_file_path": shared_file_path,
                 "sub_cluster": "default",
+                "large_file_paths": _owner_large_file_paths(workdir),
             },
         },
         "kvexternal_rexport_httpserver_http": {
@@ -599,6 +607,7 @@ def _gen_mq_config(etcd_ep: str, cluster: str, master_port: int, greptime_http_p
                 "shared_memory_path": shm,
                 "shared_file_path": shared_file_path,
                 "sub_cluster": "default",
+                "large_file_paths": _owner_large_file_paths(workdir),
             },
         },
         "kvexternal": {
@@ -657,6 +666,7 @@ def _gen_fs_config(etcd_ep: str, cluster: str, master_port: int, panel_port: int
                 "shared_memory_path": shm,
                 "shared_file_path": shared_file_path,
                 "sub_cluster": "default",
+                "large_file_paths": _owner_large_file_paths(workdir),
             },
         },
         "fs_master": {
diff --git "a/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md" "b/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
index 852b73f..84fb0dc 100644
--- "a/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
+++ "b/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
@@ -107,29 +107,75 @@ TestStack 的配置已经单独有设计文档，这里只收口成一句话：
 
 ### 5.1 KV
 
-KV 的入口在 `fluxon_kv/src/config.rs`，对外分成 master 和 client 两个稳定 YAML：
+KV 的入口在 `fluxon_kv/src/config.rs`。稳定结论是：`master` 单独使用 `MasterConfigYaml`；`owner` 和 `external` 共用 `ClientConfigYaml`，再由 `verify()` 按内存贡献收敛成 owner / external / side-transfer worker 三个运行时分支。
 
 | 类型 | 作用 |
 | --- | --- |
 | `MasterConfigYaml` | master 节点输入 |
 | `ClientConfigYaml` | owner / external 输入 |
+| `FluxonKvSpecYaml` | client 侧 `fluxonkv_spec` 子块 |
 | `TestSpecConfig` | 测试和实验分支开关 |
 | `MonitoringConfigYaml` | master 监控块 |
 | `NetworkConfig` | 网络白名单和 IP 映射，共享自 `fluxon_commu_contract` |
 
-核心分流规则：
+`master` 的 YAML 结构：
 
-- `contribute_to_cluster_pool_size` 缺失或全零时，进入 external。
-- `contribute_to_cluster_pool_size.dram > 0` 时，进入 owner。
-- `test_spec_config.side_transfer_role = worker` 时，走 side-transfer worker 分支，强制 `TransferEngineType::P2p`。
+| 字段 | 规则 | 作用 |
+| --- | --- | --- |
+| `instance_key` | 必填 | master 实例标识 |
+| `cluster_name` | 必填 | 集群名 |
+| `etcd_endpoints` | 必填，输入用 raw `host:port` | master 控制面 etcd 地址；校验后归一化成 `http://host:port` |
+| `log_dir` | 必填 | master 日志 / profile 根目录 |
+| `port` | 可选，给出时 `> 0` | master 监听端口 |
+| `protocol` | 可选 | 协议选择；缺省走编译期默认协议 |
+| `monitoring` | 逻辑必填 | Prometheus / remote write / OTLP log 配置块 |
+| `network` | 可选 | 网络白名单和主 IP 扩展映射 |
+| `pprof_duration_seconds` | 可选，给出时 `> 0` | profile 导出时长 |
+| `master_ui` | 可选，但依赖 `monitoring` | 嵌入式 monitor HTTP 服务；当前只暴露 `http_listen_addr` |
+| `test_spec_config` | 可选 | test / fast-path / side-transfer 实验开关 |
+
+`owner` 和 `external` 共用同一套 `ClientConfigYaml` 骨架：
+
+| 顶层字段 | 规则 | 说明 |
+| --- | --- | --- |
+| `instance_key` | 必填 | client 实例标识 |
+| `protocol` | 可选 | 协议选择 |
+| `contribute_to_cluster_pool_size` | 用来分流 owner / external | 缺失或全零是 external；`dram > 0` 是 owner |
+| `pprof_duration_seconds` | 可选，给出时 `> 0` | profile 导出时长 |
+| `fluxonkv_spec` | 必填 | KV 业务配置子块 |
+| `test_spec_config` | 可选 | 测试和 side-transfer 分支开关 |
+
+`fluxonkv_spec` 里，owner / external 共享的基础字段只有这几项：
+
+| 字段 | 作用 |
+| --- | --- |
+| `cluster_name` | 目标集群名 |
+| `shared_memory_path` | 本机共享内存 authority；运行时会拼成 `cluster_name` 作用域路径 |
+| `shared_file_path` | 本机共享文件 authority；运行时会拼成 `cluster_name` 作用域路径 |
+| `p2p_listen_port` | 可选的 P2P 监听端口 |
+
+只有 `owner` 能声明的字段：
+
+| 字段 | 作用 |
+| --- | --- |
+| `etcd_addresses` | owner 连接 etcd 的 raw `host:port` 列表；运行时同时保留 raw 和归一化 `http://host:port` 两份视图 |
+| `sub_cluster` | owner 所属子集群标签 |
+| `large_file_paths.log_root_path` | owner 日志大文件根目录 |
+| `large_file_paths.cache_root_path` | owner cache 大文件根目录 |
+| `redis_compat` | Redis 兼容监听配置 |
+
+`external` 的结构更小：它不声明 `etcd_addresses`、`sub_cluster`、`large_file_paths`、`redis_compat`，这些 owner 侧字段都从 owner 发布的 `shared.json` 继承。本地 YAML 只保留 attach owner 所需的共享 bundle 锚点和本进程参数。
 
 主要约束：
 
 - `monitoring` 在 master 上必填。
 - `master_ui` 依赖 `monitoring`，并作为嵌入式 monitor HTTP 服务启动。
+- `contribute_to_cluster_pool_size` 里的容量都按 16 MiB 对齐；`dram = 0` 但 `vram` 非 0 会被拒绝，避免半 owner 半 external 的模糊状态。
+- owner 模式要求 `contribute_to_cluster_pool_size.dram > 0`，并且必须显式提供 `etcd_addresses`、`sub_cluster`、`large_file_paths`。
+- zero-contribution `external` 模式禁止再写 owner 专属字段；运行时会从 owner `shared.json` 补齐这部分信息。
 - `shared_memory_path` / `shared_file_path` 会拼成 `cluster_name` 作用域路径。
-- `etcd_addresses` 在 client 侧保留 raw `host:port` 和归一化 `http://host:port` 两份视图。
-- zero-contribution `external` / side worker 的 `etcd_addresses`、`sub_cluster`、`large_file_paths` 由 owner 发布的 `shared.json` 继承；本地配置面只保留 attach owner 所需的共享 bundle 锚点和本进程参数。
+- `test_spec_config.side_transfer_role = worker` 不是第三套 YAML，而是 zero-contribution client 的子分支；它强制 `TransferEngineType::P2p`，并关闭 transfer RPC fast path。
+- `test_spec_config.side_transfer_worker_count` 只允许出现在 owner 配置里，用来控制 owner 拉起的 worker 数量。
 
 更细的调用时序、持有生命周期和并发规则分别在 `kv_1_概览与分层.md`、`kv_2_调用时序.md`、`kv_3_参数与并发.md`、`kv_4_allocation_segment_holder生命周期.md` 里展开。
 
diff --git a/setup_and_pack/tests/test_quick_start_release_only.py b/setup_and_pack/tests/test_quick_start_release_only.py
index 6d41bf3..413eee4 100644
--- a/setup_and_pack/tests/test_quick_start_release_only.py
+++ b/setup_and_pack/tests/test_quick_start_release_only.py
@@ -123,6 +123,44 @@ def _handle_mq_shell_line(line, shutdown_requested, status_lines):
         self.assertIn("MQ shell status:", stdout.getvalue())
         shutdown_requested.set.assert_not_called()
 
+    def test_quick_start_owner_configs_include_large_file_paths(self) -> None:
+        with tempfile.TemporaryDirectory() as tmpdir:
+            workdir = Path(tmpdir)
+
+            kv_cfg = _START._gen_kv_config(
+                "127.0.0.1:12379",
+                "qs_kv_cluster",
+                31000,
+                8083,
+                0,
+                14000,
+                workdir,
+            )
+            mq_cfg = _START._gen_mq_config(
+                "127.0.0.1:12379",
+                "qs_mq_cluster",
+                34200,
+                14000,
+                workdir,
+                panel_port=18080,
+            )
+            fs_cfg = _START._gen_fs_config(
+                "127.0.0.1:12379",
+                "qs_fs_cluster",
+                34100,
+                34180,
+                14000,
+                workdir,
+            )
+
+            expected = {
+                "log_root_path": str(workdir / "large" / "log" / "owner"),
+                "cache_root_path": str(workdir / "large" / "cache" / "owner"),
+            }
+            self.assertEqual(kv_cfg["kvclient"]["fluxonkv_spec"]["large_file_paths"], expected)
+            self.assertEqual(mq_cfg["kvclient"]["fluxonkv_spec"]["large_file_paths"], expected)
+            self.assertEqual(fs_cfg["kvclient"]["fluxonkv_spec"]["large_file_paths"], expected)
+
     def test_pack_fluxon_pylib_cleans_stale_build_artifacts_before_bdist(self) -> None:
         with tempfile.TemporaryDirectory() as tmpdir:
             repo_root = Path(tmpdir)

From 1eb1ebde14352cd8ea0fa3db8020b65cf927a3a3 Mon Sep 17 00:00:00 2001
From: ActivePeter <1020401660@qq.com>
Date: Tue, 23 Jun 2026 17:47:32 +0800
Subject: [PATCH 08/13] fix: emit owner large_file_paths in TEST_STACK and CI owner configs

---
 ...13\350\257\225\346\265\201\347\250\213.md" | 24 +++++
 fluxon_py/config.py                           |  4 +
 fluxon_rs/fluxon_kv/src/config.rs             |  4 +
 fluxon_test_stack/start_test_bed.py           |  1 -
 fluxon_test_stack/test_runner.py              | 21 +++-
 .../test_test_runner_testbed_contract.py      | 96 +++++++++++++++++++
 6 files changed, 148 insertions(+), 2 deletions(-)

diff --git "a/fluxon_doc_cn/design/teststack_1_\345\275\223\345\211\215\346\236\266\346\236\204\344\270\216CI\346\265\213\350\257\225\346\265\201\347\250\213.md" "b/fluxon_doc_cn/design/teststack_1_\345\275\223\345\211\215\346\236\266\346\236\204\344\270\216CI\346\265\213\350\257\225\346\265\201\347\250\213.md"
index ce767f7..80a8184 100644
--- "a/fluxon_doc_cn/design/teststack_1_\345\275\223\345\211\215\346\236\266\346\236\204\344\270\216CI\346\265\213\350\257\225\346\265\201\347\250\213.md"
+++ "b/fluxon_doc_cn/design/teststack_1_\345\275\223\345\211\215\346\236\266\346\236\204\344\270\216CI\346\265\213\350\257\225\346\265\201\347\250\213.md"
@@ -378,6 +378,30 @@ deploy.instances 不写死在 suite 中。Runner 会结合 scale、profile 和
 - `resolved_case` 会额外固化 `command_id`、`test_id` 等 CI 元数据；
 - 生成顺序是稳定的，后续 phase 规划依赖这个顺序。
 
+### 7.8 owner 模式配置契约
+
+**稳定结论：**
+
+- owner 模式配置一律必须显式提供 `fluxonkv_spec.large_file_paths.log_root_path` 和 `cache_root_path`。
+- `fluxonkv_spec.p2p_listen_port` 不是 owner 模式的必填项；是否显式写入，取决于具体分支的运行契约。
+- 不要把 `TEST_STACK` case-local owner 的显式端口分配规则，复制到 shared testbed / CI owner 配置上。
+
+这里需要明确区分两类 owner 配置生成面：
+
+| surface | `large_file_paths` | `p2p_listen_port` | 原因 |
+| --- | --- | --- | --- |
+| shared testbed / CI owner | 必填 | 默认省略，保持隐式 | 这类 owner 运行在共享环境里，宿主端口占用和 host 布局更易变化，保持由运行时自行绑定可用端口更稳妥 |
+| `TEST_STACK` case-local owner | 必填 | 显式写入 | 同一 case 内的 node runtime 需要消费 runner 预编译的有限端口计划，owner peer 地址必须稳定 |
+
+这条边界对应两种不同责任：
+
+- `large_file_paths` 是 owner 模式本身的配置契约，缺失时应直接视为配置错误；
+- `p2p_listen_port` 是否显式，则是某个运行 surface 的拓扑与端口规划策略，不应从一个 surface 横向推广到另一个 surface。
+
+本次相关经验可以收敛成一句规则：
+
+- owner 模式要显式约束的是 large-file roots，不是“默认必须写死 p2p 端口”。
+
 ## 8. case 执行流程
 
 ### 8.1 总体时序
diff --git a/fluxon_py/config.py b/fluxon_py/config.py
index 51e0d7d..b50caad 100644
--- a/fluxon_py/config.py
+++ b/fluxon_py/config.py
@@ -587,6 +587,10 @@ def to_fluxon_kv_client_config_yaml_str(self) -> str:
 
             return yaml.safe_dump(cfg, sort_keys=False)
 
+        # Owner mode must always declare large-file roots for logs and caches.
+        # p2p_listen_port remains optional here: deterministic case-local
+        # topologies may pin it, while shared testbed flows can leave it unset
+        # and let runtime choose an available port.
         if "large_file_paths" not in spec:
             raise ValueError("fluxonkv_spec.large_file_paths is required for owner mode")
         large_file_paths = spec.get("large_file_paths")
diff --git a/fluxon_rs/fluxon_kv/src/config.rs b/fluxon_rs/fluxon_kv/src/config.rs
index 2df094c..8ea906f 100644
--- a/fluxon_rs/fluxon_kv/src/config.rs
+++ b/fluxon_rs/fluxon_kv/src/config.rs
@@ -1086,6 +1086,10 @@ impl ClientConfigYaml {
             }
             .into_kverror());
         }
+        // Owner mode always needs explicit large-file roots for logs and caches.
+        // The listen port stays optional at this contract layer: deterministic
+        // callers may pin it, while shared testbed owners can leave it unset
+        // and let the runtime bind a free port.
         let large_file_paths = if is_external {
             LargeFilePaths {
                 log_root_path: String::new(),
diff --git a/fluxon_test_stack/start_test_bed.py b/fluxon_test_stack/start_test_bed.py
index d2416e0..d2d2504 100644
--- a/fluxon_test_stack/start_test_bed.py
+++ b/fluxon_test_stack/start_test_bed.py
@@ -835,7 +835,6 @@ def _rewrite_same_host_local_multi_node_fixed_ports(
     master_cfg = _require_mapping(services.get("master"), "deployconf.service.master")
     ops_agent_cfg = _require_mapping(services.get("ops_agent"), "deployconf.service.ops_agent")
     ops_controller_cfg = _require_mapping(services.get("ops_controller"), "deployconf.service.ops_controller")
-
     global_envs["TIKV_PD_PEER_PORT"] = str(plan["tikv_pd_peer_port"])
     global_envs["TIKV_STATUS_FULL_ADDRESS"] = (
         "${${TIKV__NODE_ID}__IP}:" + str(plan["tikv_status_port"])
diff --git a/fluxon_test_stack/test_runner.py b/fluxon_test_stack/test_runner.py
index a81eaf5..2d965df 100644
--- a/fluxon_test_stack/test_runner.py
+++ b/fluxon_test_stack/test_runner.py
@@ -9296,6 +9296,16 @@ def _test_stack_kv_owner_runtime_instance_key(*, runtime_instance_prefix: str, o
     return f"{runtime_instance_prefix}__kv_owner__{target_slug}"
 
 
+def _fluxon_kv_owner_large_file_paths(*, owner_work_root: Path) -> Dict[str, str]:
+    # Owner mode always needs explicit large-file roots for logs and caches,
+    # even on surfaces that intentionally leave p2p_listen_port implicit.
+    root = owner_work_root.resolve()
+    return {
+        "log_root_path": str((root / "large" / "log").resolve()),
+        "cache_root_path": str((root / "large" / "cache").resolve()),
+    }
+
+
 def _build_test_stack_external_kv_owner_instances(
     *,
     scene_mode: str,
@@ -9350,6 +9360,8 @@ def _build_test_stack_external_kv_owner_instances(
             owner_target=target,
             ctx="external kv owner",
         )
+        # TEST_STACK case-local owners use the compiled slot-based port plan so
+        # node runtimes in the same case can resolve stable owner peers.
         owner_p2p_listen_port = (
             int(kv_p2p_port_base)
             + int(kv_p2p_port_stride) * int(run_index - 1)
@@ -9371,6 +9383,8 @@ def _build_test_stack_external_kv_owner_instances(
                 owner_target=target,
                 ctx="runtime.stack_identity owner bundle roots",
             )
+        owner_services_dir = run_dir / "services" / "kv_owner" / target_slug
+        owner_large_file_paths = _fluxon_kv_owner_large_file_paths(owner_work_root=owner_services_dir)
         owner_cfg = {
             "instance_key": _test_stack_kv_owner_runtime_instance_key(
                 runtime_instance_prefix=runtime_instance_prefix,
@@ -9383,6 +9397,7 @@ def _build_test_stack_external_kv_owner_instances(
                 "cluster_name": cluster_name,
                 "shared_memory_path": owner_shared_memory_path,
                 "shared_file_path": owner_shared_file_path,
+                "large_file_paths": owner_large_file_paths,
                 "sub_cluster": FLUXON_KV_OWNER_SUB_CLUSTER,
                 "p2p_listen_port": int(owner_p2p_listen_port),
             },
@@ -9405,7 +9420,6 @@ def _build_test_stack_external_kv_owner_instances(
             raise ValueError(f"test_stack owner config already exists (no overwrite): {owner_cfg_path}")
         _write_yaml_file(owner_cfg_path, owner_cfg)
 
-        owner_services_dir = run_dir / "services" / "kv_owner" / target_slug
         owner_services_dir.mkdir(parents=True, exist_ok=True)
         owner_inst = copy.deepcopy(coord_tpl)
         owner_inst["id"] = instance_id
@@ -14506,6 +14520,7 @@ def _write_ci_scene_config_yaml(
 def _write_ci_master_owner_configs(
     resolved_case: Dict[str, Any], *, run_dir: Path, cluster_name: str, share_mem_path: str, share_file_path: str, owner_dram_bytes: int
 ) -> tuple[Path, Path]:
+    owner_work_root = run_dir / "services" / "owner_0"
     master_cfg = {
         "etcd_endpoints": ["__ETCD__"],
         "cluster_name": cluster_name,
@@ -14534,6 +14549,10 @@ def _write_ci_master_owner_configs(
             "cluster_name": cluster_name,
             "shared_memory_path": share_mem_path,
             "shared_file_path": share_file_path,
+            # Shared testbed / CI owners keep p2p_listen_port implicit so the
+            # runtime can bind a free host port, but owner mode still requires
+            # explicit large-file roots.
+            "large_file_paths": _fluxon_kv_owner_large_file_paths(owner_work_root=owner_work_root),
             "sub_cluster": FLUXON_KV_OWNER_SUB_CLUSTER,
         },
     }
diff --git a/fluxon_test_stack/tests/test_test_runner_testbed_contract.py b/fluxon_test_stack/tests/test_test_runner_testbed_contract.py
index bbfcd00..3f43433 100644
--- a/fluxon_test_stack/tests/test_test_runner_testbed_contract.py
+++ b/fluxon_test_stack/tests/test_test_runner_testbed_contract.py
@@ -38,6 +38,39 @@ def _load_module():
 
 
 class TestTestRunnerTestbedContract(unittest.TestCase):
+    def test_write_ci_master_owner_configs_emits_owner_large_file_paths(self) -> None:
+        with tempfile.TemporaryDirectory() as td:
+            run_dir = Path(td)
+            resolved_case = {
+                "deploy": {
+                    "instances": [
+                        {"id": "master", "deployer": {"target": "local-node-a"}},
+                        {"id": "owner_0", "deployer": {"target": "local-node-a"}},
+                    ],
+                    "target_ip_map": {"local-node-a": "127.0.0.1"},
+                }
+            }
+
+            with mock.patch.object(_RUNNER, "_ci_base_runtime_service_target_ip", side_effect=["127.0.0.1", "127.0.0.1"]):
+                with mock.patch.object(_RUNNER, "_ci_base_runtime_service_port", side_effect=[19180, 19190]):
+                    _, owner_path = _RUNNER._write_ci_master_owner_configs(
+                        resolved_case,
+                        run_dir=run_dir,
+                        cluster_name="ci_cluster",
+                        share_mem_path="/tmp/ci_shm",
+                        share_file_path="/tmp/ci_share",
+                        owner_dram_bytes=1073741824,
+                    )
+
+            owner_cfg = yaml.safe_load(owner_path.read_text(encoding="utf-8"))
+            self.assertEqual(
+                owner_cfg["fluxonkv_spec"]["large_file_paths"],
+                {
+                    "log_root_path": str((run_dir / "services" / "owner_0" / "large" / "log").resolve()),
+                    "cache_root_path": str((run_dir / "services" / "owner_0" / "large" / "cache").resolve()),
+                },
+            )
+
     def test_write_ci_scene_config_yaml_emits_structured_scene_config(self) -> None:
         with tempfile.TemporaryDirectory() as td:
             run_dir = Path(td)
@@ -80,6 +113,69 @@ def test_write_ci_scene_config_yaml_emits_structured_scene_config(self) -> None:
             self.assertEqual(payload["scene_runtime"]["etcd"], {"ip": "127.0.0.1", "port": 2379})
             self.assertEqual(payload["scene_runtime"]["greptime"], {"ip": "127.0.0.1", "port": 4000})
 
+    def test_generated_test_stack_owner_config_emits_large_file_paths(self) -> None:
+        with tempfile.TemporaryDirectory() as td:
+            run_dir = Path(td)
+            cfg_dir = run_dir / "configs"
+            cfg_dir.mkdir(parents=True)
+            owner_target = "local-node-a"
+            target_slug = "local-node-a"
+            runtime_instance_prefix = "case1"
+            coord_tpl = {"deployer": {"target": ""}}
+            cluster_nodes = {"local-node-a": {"python_abi": "cpython3.10"}}
+            resolved_case = {
+                "runtime": {
+                    "run_dir": str(run_dir),
+                    "stack_identity": {
+                        "cluster_name": "bench_cluster",
+                        "shared_memory_path": "/tmp/bench_shm",
+                        "shared_file_path": "/tmp/bench_share",
+                    },
+                }
+            }
+
+            with mock.patch.object(_RUNNER, "_test_stack_runtime_required_python_abi", return_value="cpython3.10"):
+                with mock.patch.object(_RUNNER, "_test_stack_etcd_addresses", return_value=["127.0.0.1:19180"]):
+                    with mock.patch.object(_RUNNER, "_test_stack_target_host_venv_python", return_value="/tmp/venv/bin/python3"):
+                        with mock.patch.object(_RUNNER, "_test_stack_runtime_module_command", return_value="owner-cmd"):
+                            owner_instances = _RUNNER._build_test_stack_external_kv_owner_instances(
+                                scene_mode="bench",
+                                resolved_case=resolved_case,
+                                scale={"owner": {"owner_count": 1, "owner_dram_bytes": 1073741824}},
+                                runtime=resolved_case["runtime"],
+                                run_dir=run_dir,
+                                cfg_dir=cfg_dir,
+                                coord_tpl=coord_tpl,
+                                test_stack_runtime={},
+                                cluster_nodes=cluster_nodes,
+                                owner_targets=[owner_target],
+                                needs_kv_master=True,
+                                kv_p2p_port_base=31000,
+                                kv_p2p_port_stride=100,
+                                kv_p2p_slot_offset=0,
+                                p2p_ports_per_slot=10,
+                                node_total=1,
+                                run_index=1,
+                                runtime_instance_prefix=runtime_instance_prefix,
+                                kv_base={},
+                                test_spec_config={},
+                                perf_config=None,
+                                runtime_env={},
+                                owner_group_processes=None,
+                                owner_cpu_core_by_target={},
+                            )
+
+            self.assertEqual(len(owner_instances), 1)
+            owner_cfg_path = cfg_dir / f"test_stack_kv_owner__{target_slug}.yaml"
+            owner_cfg = yaml.safe_load(owner_cfg_path.read_text(encoding="utf-8"))
+            self.assertEqual(
+                owner_cfg["fluxonkv_spec"]["large_file_paths"],
+                {
+                    "log_root_path": str((run_dir / "services" / "kv_owner" / target_slug / "large" / "log").resolve()),
+                    "cache_root_path": str((run_dir / "services" / "kv_owner" / target_slug / "large" / "cache").resolve()),
+                },
+            )
+
     def test_ci_source_overlay_includes_fluxon_test_stack(self) -> None:
         self.assertIn("fluxon_test_stack", _RUNNER._CI_SOURCE_OVERLAY_ROOTS)
         self.assertNotIn("quartz_prewarm", _RUNNER._CI_SOURCE_OVERLAY_ROOTS)

From 229a5d08c43474ac2c695fce2529150b60826dfa Mon Sep 17 00:00:00 2001
From: ActivePeter <1020401660@qq.com>
Date: Tue, 23 Jun 2026 21:43:42 +0800
Subject: [PATCH 09/13] test

---
 deployment/gen_bare_deploy_bash.py            |   4 +-
 .../atomic_group_start.sh.tmpl                |   2 +-
 ...ction_supervisor_launch_wait_block.sh.tmpl |   3 +-
 .../standalone_start_body.sh.tmpl             |   1 -
 deployment/tests/test_gen_bare_deploy_bash.py |  39 +-
 .../utils/selection_supervisor_codegen.py     |  17 +-
 ...15\347\275\256\346\200\273\350\247\210.md" | 452 +++++++++++++-----
 fluxon_test_stack/ci_2_virt_node.py           |   1 +
 .../tests/test_ci_2_virt_node_contract.py     |  48 ++
 setup_and_pack/nix/lib_layout.py              |  22 +-
 setup_and_pack/tests/test_lib_layout.py       |  35 ++
 11 files changed, 499 insertions(+), 125 deletions(-)

diff --git a/deployment/gen_bare_deploy_bash.py b/deployment/gen_bare_deploy_bash.py
index 5503658..fdd5d0e 100644
--- a/deployment/gen_bare_deploy_bash.py
+++ b/deployment/gen_bare_deploy_bash.py
@@ -619,7 +619,7 @@ def _render_standalone_start_body(*, name_prefix: str, service_name: str) -> str
             "SELECTION_SUPERVISOR_LAUNCH_WAIT_BLOCK": _render_selection_supervisor_launch_wait_block(
                 run_cmd=run_cmd,
                 stable_seconds_expr=str(STANDALONE_PROBABLE_READY_SECONDS),
-                deadline_ts_expr='"$STARTUP_DEADLINE_TS"',
+                deadline_ts_expr=f'$(( $(date +%s) + {STANDALONE_STARTUP_DEADLINE_SECONDS} ))',
                 context="[bare]",
             ),
         },
@@ -693,7 +693,7 @@ def _render_atomic_group_service_block(
                 script=_render_selection_supervisor_launch_wait_block(
                     run_cmd=run_cmd,
                     stable_seconds_expr=str(ATOMIC_GROUP_PROBABLE_READY_SECONDS),
-                    deadline_ts_expr='"$GROUP_STARTUP_DEADLINE_TS"',
+                    deadline_ts_expr=f'$(( $(date +%s) + {ATOMIC_GROUP_STARTUP_DEADLINE_SECONDS} ))',
                     context="[rollout]",
                 ).rstrip()
                 + "\n",
diff --git a/deployment/templates/gen_bare_deploy_bash/atomic_group_start.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/atomic_group_start.sh.tmpl
index d0c82ad..7dca2b5 100644
--- a/deployment/templates/gen_bare_deploy_bash/atomic_group_start.sh.tmpl
+++ b/deployment/templates/gen_bare_deploy_bash/atomic_group_start.sh.tmpl
@@ -3,5 +3,5 @@ set -euo pipefail
 
 GROUP={{GROUP_ASSIGN}}
 NAME_PREFIX={{NAME_PREFIX_ASSIGN}}
-{{HOST_PRELUDE}}{{ATOMIC_GROUP_NODE_RESOLUTION_TAIL}}{{SELECTION_SUPERVISOR_PATH_BLOCK}}{{PROC_LIFECYCLE_HELPERS}}{{GLOBAL_ENV_EXPORTS}}GROUP_STARTUP_DEADLINE_TS=$(( $(date +%s) + {{GROUP_STARTUP_DEADLINE_ASSIGN}} ))
+{{HOST_PRELUDE}}{{ATOMIC_GROUP_NODE_RESOLUTION_TAIL}}{{SELECTION_SUPERVISOR_PATH_BLOCK}}{{PROC_LIFECYCLE_HELPERS}}{{GLOBAL_ENV_EXPORTS}}
 {{SERVICE_BLOCKS}}echo "[atomic-group] ready group=$GROUP node=$NODE_ID"
diff --git a/deployment/templates/gen_bare_deploy_bash/selection_supervisor_launch_wait_block.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/selection_supervisor_launch_wait_block.sh.tmpl
index f466cbc..52cce05 100644
--- a/deployment/templates/gen_bare_deploy_bash/selection_supervisor_launch_wait_block.sh.tmpl
+++ b/deployment/templates/gen_bare_deploy_bash/selection_supervisor_launch_wait_block.sh.tmpl
@@ -3,7 +3,8 @@ if [[ ! "$SUPERVISOR_PID" =~ ^[0-9]+$ ]]; then
   echo "{{CONTEXT}} launch failed svc=$SERVICE label=$SUPERVISOR_LABEL supervisor_pid=$SUPERVISOR_PID"
   exit 1
 fi
-if ! wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" {{STABLE_SECONDS_EXPR}} {{DEADLINE_TS_EXPR}} "{{CONTEXT}}"; then
+STARTUP_DEADLINE_TS={{DEADLINE_TS_EXPR}}
+if ! wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" {{STABLE_SECONDS_EXPR}} "$STARTUP_DEADLINE_TS" "{{CONTEXT}}"; then
   echo "{{CONTEXT}} probable-ready failed svc=$SERVICE label=$SUPERVISOR_LABEL supervisor_pid=$SUPERVISOR_PID"
   exit 1
 fi
diff --git a/deployment/templates/gen_bare_deploy_bash/standalone_start_body.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/standalone_start_body.sh.tmpl
index b58d3de..0758876 100644
--- a/deployment/templates/gen_bare_deploy_bash/standalone_start_body.sh.tmpl
+++ b/deployment/templates/gen_bare_deploy_bash/standalone_start_body.sh.tmpl
@@ -1,7 +1,6 @@
 SUPERVISOR_LABEL={{SUPERVISOR_LABEL_ASSIGN}}
 RUNTIME_STATE_JSON={{RUNTIME_STATE_JSON_ASSIGN}}
 OWNER_TS_MS=$(python3 -c 'import time; print(int(time.time() * 1000))')
-STARTUP_DEADLINE_TS=$(( $(date +%s) + {{STARTUP_DEADLINE_SECONDS}} ))
 LOG_DIR="$HOSTWORKDIR/log"
 LOGFILE="$LOG_DIR/${SERVICE}.log"
 mkdir -p "$LOG_DIR"
diff --git a/deployment/tests/test_gen_bare_deploy_bash.py b/deployment/tests/test_gen_bare_deploy_bash.py
index 9f392ed..19f80ac 100644
--- a/deployment/tests/test_gen_bare_deploy_bash.py
+++ b/deployment/tests/test_gen_bare_deploy_bash.py
@@ -136,10 +136,9 @@ def test_preserves_hostworkdir_runtime_token() -> None:
         assert "/hostworkdir/svc_" not in script, script
         assert "wait-present" not in script, script
         assert "launch_only_start_gate" not in script, script
-        assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID"' in script, script
+        _assert_standalone_deadline_after_launch(script)
         assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_TS" "[bare]"' in script, script
         assert "export SERVICE_PORT=12345" in script, script
-        assert 'STARTUP_DEADLINE_TS=$(( $(date +%s) + 10 ))' in script, script
         assert "wait_service_tcp_ready" not in script, script
         assert "wait_service_etcd_endpoint_healthy" not in script, script
         assert 'SUPERVISOR_PID=$( setsid ' not in script, script
@@ -196,8 +195,12 @@ def test_atomic_group_start_does_not_auto_stop_on_failure() -> None:
         assert 'SUPERVISOR_PID=$( setsid ' not in script, script
         assert 'echo "[rollout] probable-ready failed svc=$SERVICE label=$SUPERVISOR_LABEL supervisor_pid=$SUPERVISOR_PID"' in script, script
         assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID"' in script, script
-        assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$GROUP_STARTUP_DEADLINE_TS" "[rollout]"' in script, script
-        assert 'GROUP_STARTUP_DEADLINE_TS=$(( $(date +%s) + 10 ))' in script, script
+        assert 'GROUP_STARTUP_DEADLINE_TS=' not in script, script
+        assert script.count('STARTUP_DEADLINE_TS=$(( $(date +%s) + 10 ))') == 2, script
+        _assert_deadline_after_launch(
+            script=script,
+            wait_call='wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_TS" "[rollout]"',
+        )
         assert "export SERVICE_PORT=23456" in script, script
         assert "unset SERVICE_PORT" in script, script
         assert "wait_service_tcp_ready" not in script, script
@@ -326,7 +329,7 @@ def test_bare_start_uses_no_exit_startup_gate() -> None:
         plain_script = (outdir / "start_svc_plain.sh").read_text(encoding="utf-8")
 
         for script in (etcd_script, tikv_script, plain_script):
-            assert 'STARTUP_DEADLINE_TS=$(( $(date +%s) + 10 ))' in script, script
+            _assert_standalone_deadline_after_launch(script)
             assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_TS" "[bare]"' in script, script
             assert "wait_service_tcp_ready" not in script, script
             assert "wait_service_etcd_endpoint_healthy" not in script, script
@@ -362,7 +365,11 @@ def test_normalized_testbed_master_exports_service_port_for_atomic_group() -> No
         assert "export MASTER__PORT=51051" in master_block, master_block
         assert "export SERVICE_PORT=51051" in master_block, master_block
         assert "unset SERVICE_PORT" not in master_block, master_block
-        assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$GROUP_STARTUP_DEADLINE_TS" "[rollout]"' in master_block, master_block
+        assert 'GROUP_STARTUP_DEADLINE_TS=' not in master_block, master_block
+        _assert_deadline_after_launch(
+            script=master_block,
+            wait_call='wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_TS" "[rollout]"',
+        )
         assert "wait_service_tcp_ready" not in master_block, master_block
         print("PASS: test_normalized_testbed_master_exports_service_port_for_atomic_group")
 
@@ -860,5 +867,25 @@ def _wait_until_selection_absent(
     raise RuntimeError(f"timeout waiting selection absent: label={label} scope_key={scope_key}")
 
 
+def _assert_deadline_after_launch(*, script: str, wait_call: str) -> None:
+    launch_check = 'if [[ ! "$SUPERVISOR_PID" =~ ^[0-9]+$ ]]; then'
+    deadline_assign = 'STARTUP_DEADLINE_TS=$(( $(date +%s) + 10 ))'
+    assert launch_check in script, script
+    assert deadline_assign in script, script
+    assert wait_call in script, script
+
+    launch_check_idx = script.index(launch_check)
+    deadline_idx = script.index(deadline_assign)
+    wait_idx = script.index(wait_call)
+    assert launch_check_idx < deadline_idx < wait_idx, script
+
+
+def _assert_standalone_deadline_after_launch(script: str) -> None:
+    _assert_deadline_after_launch(
+        script=script,
+        wait_call='wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_TS" "[bare]"',
+    )
+
+
 if __name__ == "__main__":
     raise SystemExit(main())
diff --git a/deployment/utils/selection_supervisor_codegen.py b/deployment/utils/selection_supervisor_codegen.py
index ab76dfc..8e8d7fb 100644
--- a/deployment/utils/selection_supervisor_codegen.py
+++ b/deployment/utils/selection_supervisor_codegen.py
@@ -1011,6 +1011,17 @@ def _iter_process_cmdlines() -> List[tuple[int, List[str]]]:
     return out
 
 
+def _iter_process_snapshots() -> List[tuple[ProcessInfo, List[str]]]:
+    infos_by_pid = {info.pid: info for info in _iter_process_infos()}
+    out: List[tuple[ProcessInfo, List[str]]] = []
+    for pid, args in _iter_process_cmdlines():
+        process_info = infos_by_pid.get(pid)
+        if process_info is None or process_info.is_zombie:
+            continue
+        out.append((process_info, args))
+    return out
+
+
 def _arg_value(args: List[str], flag: str) -> Optional[str]:
     for idx, arg in enumerate(args[:-1]):
         if arg == flag:
@@ -1155,13 +1166,11 @@ def _iter_process_infos() -> List[ProcessInfo]:
 
 def _iter_live_supervisors(label: Optional[str] = None, *, scope_key: Optional[str] = None) -> List[LiveSupervisor]:
     out: List[LiveSupervisor] = []
-    for pid, args in _iter_process_cmdlines():
+    for process_info, args in _iter_process_snapshots():
         supervisor_command = _find_selection_supervisor_command(args)
         if supervisor_command is None:
             continue
-        process_info = _find_process_info(pid)
-        if process_info is None or process_info.is_zombie:
-            continue
+        pid = process_info.pid
         runtime_label = _arg_value(args, "--label")
         if runtime_label is None:
             raise RuntimeError(f"running selection supervisor is missing --label pid={pid}")
diff --git "a/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md" "b/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
index 84fb0dc..4f9f65e 100644
--- "a/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
+++ "b/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
@@ -55,31 +55,75 @@ flowchart TD
 
 这是仓库级开发环境配置，不是业务 runtime config。
 
-| 字段 | 规则 | 主要用途 |
-| --- | --- | --- |
-| `etcd` | 必填，`host:port` | 供 Rust / Python / 测试工具读取 etcd 地址 |
-| `prom` | 必填，`http(s)://.../v1` 或 `.../api/v1` | 供 Grafana / TSDB 查询 URL 使用 |
-| `prom_remote_write_url` | 必填，`http(s)://...` | 供 remote write 使用 |
+最小骨架：
+
+```yaml
+# Rust / Python / 测试工具共用的 etcd 地址
+# 输入要求 raw host:port
+etcd: 127.0.0.1:43579
+
+# Prometheus-compatible 查询入口
+prom: http://127.0.0.1:44030/v1/prometheus
+
+# remote write 入口
+prom_remote_write_url: http://127.0.0.1:44030/v1/prometheus/write
+```
+
+这里的重点不是字段多，而是格式严格分层：
+
+- `etcd` 用 raw `host:port`。
+- `prom` 用带 scheme 的 HTTP URL，并且路径通常是 `/v1/prometheus` 或 `/api/v1`。
+- `prom_remote_write_url` 也是完整 URL。
 
 `setup_and_pack/utils/repo_config_utils.py` 里保留了 `prometheus_remote_write_url` 的旧名兼容读取，但这是 build tooling 的过渡路径，不是推荐的新契约。
 
 ### 4.2 `build_config_ext_static.yml`
 
-当前只固定一个值：
+当前最小骨架只有一个稳定字段：
 
-| 字段 | 规则 |
-| --- | --- |
-| `manylinux_version` | 必填，当前只允许 `2_28` |
+```yaml
+manylinux_version: "2_28"
+```
+
+当前实现只接受 `2_28`。
 
 ### 4.3 `deployment/deployconf.yaml`
 
-这是部署和打包流水线的核心配置。当前稳定消费面主要有三块：
+这是部署和打包流水线的核心配置。先看最重要的骨架：
+
+```yaml
+namespace: fluxon-example
+name_prefix: fluxon-example
+image: fluxon_quick_start:0.2.1
+
+cluster_nodes:
+  - hostname: example-node-a
+    ip: 192.0.2.10
+    hostworkdir: /opt/example/fluxon/deployment/example_deploy
+    mounts:
+      - /opt/example/fluxon: /fluxon_mount
+      - /var/run/docker.sock: /var/run/docker.sock
+
+global_envs:
+  FLUXON_CLUSTER_NAME: "fluxon-example-cluster"
+  FLUXON_SHARED_MEM: "${HOSTWORKDIR}/shm1"
+  FLUXON_SHARED_FILE: "${HOSTWORKDIR}/shm1_files"
+  ETCD_FULL_ADDRESS: "${${ETCD__NODE_ID}__IP}:${ETCD__PORT}"
+  FLUXON_PROMETHEUS_BASE_URL: "http://${${GREPTIME__NODE_ID}__IP}:${GREPTIME__PORT}/v1/prometheus"
+  MONITOR_GREPTIMEDB_WRITE_URL: "http://${${GREPTIME__NODE_ID}__IP}:${GREPTIME__PORT}/v1/prometheus/write"
+
+release_ext_images:
+  etcd:
+    image: quay.io/coreos/etcd:v3.5.0
+  greptime:
+    image: greptime/greptimedb:v0.15.1
+```
 
-| 区块 | 关键字段 | 作用 |
-| --- | --- | --- |
-| `cluster_nodes` | 节点列表 | 作为 placeholder 解析的基础 |
-| `service` | 服务节点映射 | 供部署脚本和测试脚本查 service ip:port |
-| `global_envs` | `ETCD_FULL_ADDRESS`、`FLUXON_PROMETHEUS_BASE_URL`、`MONITOR_GREPTIMEDB_WRITE_URL`、`FLUXON_CLUSTER_NAME`、`FLUXON_SHARED_MEM`、`FLUXON_SHARED_FILE` | 供部署/测试代码读取集群级 authority |
+读这份配置时，先抓住三层：
+
+- `cluster_nodes` 提供节点清单，是 placeholder 解析的基础。
+- `global_envs` 提供集群级 authority，比如 etcd、Prometheus、cluster name、shared roots。
+- `release_ext_images` 和后续 service/workload 块把这些 authority 接进具体部署动作。
 
 `global_envs` 允许占位符解析，先由 `cluster_nodes` + `service` 构造映射，再把变量落成最终值。
 
@@ -87,84 +131,191 @@ flowchart TD
 
 这是一层测试入口配置，不是 runtime 部署配置。
 
-| 字段 | 规则 |
-| --- | --- |
-| `deployconf_path` | 必填，指向共享 deployconf |
-| `kv_svc_type` | 必填，当前测试助手只接受已知 backend 类型 |
+最小骨架：
+
+```yaml
+deployconf_path: ../../deployment/deployconf.yaml
+kv_svc_type: fluxon
+```
+
+这里没有复杂分支：
+
+- `deployconf_path` 指向共享 deployconf。
+- `kv_svc_type` 选择测试要接的 KV backend；当前 checked-in 样例用的是 `fluxon`。
 
 测试代码里还保留了 mooncake 相关读取函数，但 checked-in 的最小样例只使用上面两个字段。
 
 ### 4.5 `fluxon_test_stack/*`
 
-TestStack 的配置已经单独有设计文档，这里只收口成一句话：
+TestStack 有三份主配置，建议直接从 YAML 骨架理解：
+
+`ci_test_list.yaml` 定义 suite / scene 空间：
+
+```yaml
+schema_version: 9
+
+run:
+  mode: full_once
+  selectors:
+    case_ids: ALL
+    profile_ids: [fluxon_fastws, fluxon_tquic, fluxon_sockudo_ws, fluxon_tcp]
+    command_ids: ALL
+    test_ids: ALL
+
+scenes:
+  kv_read_heavy_zipf:
+    test_stack:
+      mode: KVSTORE
+      read_ratio: 0.9
+      write_ratio: 0.1
+      request_distribution: zipfian
+    select:
+      scales: [n1_kvowner_dram_20gib]
+      profiles: [fluxon_tcp]
+```
+
+`start_test_bed.yaml` 定义 testbed authority 和 UI：
+
+```yaml
+schema_version: 6
 
-- `ci_test_list.yaml` 定义 suite 空间。
-- `start_test_bed.yaml` 定义共享 testbed 和 UI。
-- `gitops.yaml` 定义 GitOps 轮询和记录。
-- 生成的 `deployconf_testbed.yml` 是派生产物，不是手工主配置。
+deployconf_path: ./deployconf_testbed.yml
+controller_url: http://192.0.2.10:19080/r/ops/fluxon_testbed
+controller_basic_auth:
+  username: example_admin
+  password: example_password
+
+test_runner_ui:
+  enabled: true
+  host: 0.0.0.0
+  port: 18080
+  workdir: ./test_runner_ui_runtime
+  gitops_config_path: ./gitops/gitops.yaml
+
+bootstrap_phases:
+  - mode: fixed_bare
+    node: infra44-ThinkStation-PX
+    services: [etcd, greptime, tikv_pd, tikv]
+```
+
+`gitops/gitops.yaml` 定义 GitOps 轮询和触发命令：
+
+```yaml
+interval: 60
+
+retention:
+  max_age_days: 7
+
+repos:
+  - addr: git@github.com:Tele-AI/fluxon.git
+    follow:
+      - branch: big_step2
+        run:
+          name_prefix: fluxon_ci
+          commands:
+            - python3 fluxon_test_stack/pack_test_stack_rsc.py --all-profiles -c fluxon_test_stack/ci_test_list.yaml
+            - python3 fluxon_test_stack/test_runner.py -c fluxon_test_stack/ci_test_list.yaml -w .
+```
+
+生成的 `deployconf_testbed.yml` 是派生产物，不是手工主配置。
 
 ## 5. 运行时配置
 
 ### 5.1 KV
 
-KV 的入口在 `fluxon_kv/src/config.rs`。稳定结论是：`master` 单独使用 `MasterConfigYaml`；`owner` 和 `external` 共用 `ClientConfigYaml`，再由 `verify()` 按内存贡献收敛成 owner / external / side-transfer worker 三个运行时分支。
+KV 的入口在 `fluxon_kv/src/config.rs`。先记结论：`master` 单独使用 `MasterConfigYaml`；`owner` 和 `external` 共用 `ClientConfigYaml`；`verify()` 再按内存贡献把 client 配置收敛成 owner / external / side-transfer worker 三个运行时分支。
 
-| 类型 | 作用 |
-| --- | --- |
-| `MasterConfigYaml` | master 节点输入 |
-| `ClientConfigYaml` | owner / external 输入 |
-| `FluxonKvSpecYaml` | client 侧 `fluxonkv_spec` 子块 |
-| `TestSpecConfig` | 测试和实验分支开关 |
-| `MonitoringConfigYaml` | master 监控块 |
-| `NetworkConfig` | 网络白名单和 IP 映射，共享自 `fluxon_commu_contract` |
-
-`master` 的 YAML 结构：
-
-| 字段 | 规则 | 作用 |
-| --- | --- | --- |
-| `instance_key` | 必填 | master 实例标识 |
-| `cluster_name` | 必填 | 集群名 |
-| `etcd_endpoints` | 必填，输入用 raw `host:port` | master 控制面 etcd 地址；校验后归一化成 `http://host:port` |
-| `log_dir` | 必填 | master 日志 / profile 根目录 |
-| `port` | 可选，给出时 `> 0` | master 监听端口 |
-| `protocol` | 可选 | 协议选择；缺省走编译期默认协议 |
-| `monitoring` | 逻辑必填 | Prometheus / remote write / OTLP log 配置块 |
-| `network` | 可选 | 网络白名单和主 IP 扩展映射 |
-| `pprof_duration_seconds` | 可选，给出时 `> 0` | profile 导出时长 |
-| `master_ui` | 可选，但依赖 `monitoring` | 嵌入式 monitor HTTP 服务；当前只暴露 `http_listen_addr` |
-| `test_spec_config` | 可选 | test / fast-path / side-transfer 实验开关 |
-
-`owner` 和 `external` 共用同一套 `ClientConfigYaml` 骨架：
-
-| 顶层字段 | 规则 | 说明 |
-| --- | --- | --- |
-| `instance_key` | 必填 | client 实例标识 |
-| `protocol` | 可选 | 协议选择 |
-| `contribute_to_cluster_pool_size` | 用来分流 owner / external | 缺失或全零是 external；`dram > 0` 是 owner |
-| `pprof_duration_seconds` | 可选，给出时 `> 0` | profile 导出时长 |
-| `fluxonkv_spec` | 必填 | KV 业务配置子块 |
-| `test_spec_config` | 可选 | 测试和 side-transfer 分支开关 |
-
-`fluxonkv_spec` 里，owner / external 共享的基础字段只有这几项：
-
-| 字段 | 作用 |
-| --- | --- |
-| `cluster_name` | 目标集群名 |
-| `shared_memory_path` | 本机共享内存 authority；运行时会拼成 `cluster_name` 作用域路径 |
-| `shared_file_path` | 本机共享文件 authority；运行时会拼成 `cluster_name` 作用域路径 |
-| `p2p_listen_port` | 可选的 P2P 监听端口 |
+`master` 的最小骨架：
 
-只有 `owner` 能声明的字段：
+```yaml
+instance_key: my-master-1
+cluster_name: demo-kv-cluster
 
-| 字段 | 作用 |
-| --- | --- |
-| `etcd_addresses` | owner 连接 etcd 的 raw `host:port` 列表；运行时同时保留 raw 和归一化 `http://host:port` 两份视图 |
-| `sub_cluster` | owner 所属子集群标签 |
-| `large_file_paths.log_root_path` | owner 日志大文件根目录 |
-| `large_file_paths.cache_root_path` | owner cache 大文件根目录 |
-| `redis_compat` | Redis 兼容监听配置 |
+# master 控制面 etcd 地址；输入要求 raw host:port
+etcd_endpoints:
+  - 127.0.0.1:2379
+
+# master 自己的日志 / profile 根目录
+log_dir: /var/lib/fluxon/master_logs
+
+# 可选；给出时必须 > 0
+port: 31000
+
+# 逻辑必填；当前 monitoring 配置在 master 上是必填的
+monitoring:
+  prometheus_base_url: http://127.0.0.1:4000/v1/prometheus
+  prom_remote_write_url:
+    - http://127.0.0.1:4000/v1/prometheus/write
+  otlp_log_api:
+    otlp_endpoint: http://127.0.0.1:4000/v1/otlp/v1/logs
+
+# 可选；配置后 KV Web UI 会作为 master 内嵌 HTTP 服务启动
+master_ui:
+  http_listen_addr: 0.0.0.0:31100
+```
+
+`owner` 和 `external` 共用同一个 `ClientConfigYaml` 外壳，先看 `owner`：
+
+```yaml
+instance_key: my-owner-1
 
-`external` 的结构更小：它不声明 `etcd_addresses`、`sub_cluster`、`large_file_paths`、`redis_compat`，这些 owner 侧字段都从 owner 发布的 `shared.json` 继承。本地 YAML 只保留 attach owner 所需的共享 bundle 锚点和本进程参数。
+# 只要 dram > 0，就进入 owner 分支
+contribute_to_cluster_pool_size:
+  # 容量按 16 MiB 对齐
+  dram: 1677721600
+  vram: {}
+
+fluxonkv_spec:
+  cluster_name: demo-kv-cluster
+
+  # 本机共享内存 authority；运行时会拼成 cluster_name 作用域路径
+  shared_memory_path: /dev/shm/fluxon
+
+  # 本机共享文件 authority；shared.json、profile、peer metadata 等在这条根下
+  # 运行时也会拼成 cluster_name 作用域路径
+  shared_file_path: /var/lib/fluxon/shared
+
+  # owner 必须自己连接 etcd；输入要求 raw host:port
+  etcd_addresses:
+    - 127.0.0.1:2379
+
+  # owner 必须声明自己属于哪个 sub-cluster
+  sub_cluster: default
+
+  # owner 必须声明大文件根目录；日志和 cache 都从这里派生
+  large_file_paths:
+    log_root_path: /var/lib/fluxon/log
+    cache_root_path: /var/lib/fluxon/cache
+
+  # 可选
+  p2p_listen_port: 31001
+
+  # 可选；Redis 兼容入口只允许 owner 配
+  # redis_compat:
+  #   listen_addr: 0.0.0.0:6379
+```
+
+`external` 用的还是 `ClientConfigYaml`，但结构会更小：
+
+```yaml
+instance_key: my-external-1
+
+fluxonkv_spec:
+  cluster_name: demo-kv-cluster
+
+  # external 只保留 attach owner 所需的本机共享锚点
+  shared_memory_path: /dev/shm/fluxon
+  shared_file_path: /var/lib/fluxon/shared
+
+  # 可选
+  p2p_listen_port: 31002
+```
+
+这里最重要的差异不是“多几个字段”，而是配置责任不同：
+
+- `owner` 负责提供共享内存池、连接 etcd、声明 `sub_cluster`、发布 `shared.json`、给出日志和 cache 的大文件根目录。
+- `external` 不再声明 `etcd_addresses`、`sub_cluster`、`large_file_paths`、`redis_compat`；这些 owner 侧字段都从 owner 发布的 `shared.json` 继承。
+- `etcd_addresses` 在 owner 侧会同时保留两份视图：对外契约还是 raw `host:port`，运行时内部会归一化成 `http://host:port`。
 
 主要约束：
 
@@ -183,31 +334,65 @@ KV 的入口在 `fluxon_kv/src/config.rs`。稳定结论是：`master` 单独使
 
 FS 的配置集中在 `fluxon_fs_core/src/config.rs`，上层 `fluxon_fs/src/config.rs` 只是重导出。
 
-| 配置块 | 入口 | 结果 |
-| --- | --- | --- |
-| cache | `fluxon_fs.cache` | `FluxonFsGlobalConfig` |
-| master | `fluxon_fs.master` | `FluxonFsMasterConfig` |
-| master_panel | `fluxon_fs.master_panel` | `FluxonFsMasterPanelConfig` |
-
-`fluxon_fs.cache` 的核心字段：
-
-- `stale_window_ms` 必须 `> 0`。
-- `write_session_target_inflight_bytes` 可缺省，默认 128 MiB。
-- `rules[*]` 需要绝对路径、合法 cache/write 模式、合法前缀和非零 cache 上限。
-- `exports[*]` 需要绝对路径；`nodes` 缺失时表示 `AgentRegistry`，给出时表示 `StaticNodes`。
+这块分成 `cache`、`master`、`master_panel` 三个稳定子块，直接看骨架更直观：
+
+```yaml
+fluxon_fs:
+  master:
+    instance_key: fluxon_fs_master
+    pull_interval_ms: 1000
+
+  master_panel:
+    listen_addr: 0.0.0.0:8091
+    public_base_url: http://127.0.0.1:8091
+    prometheus_base_url: http://127.0.0.1:4000/v1/prometheus
+    auto_refresh_interval_secs: 10
+    access_db_path: /var/lib/fluxon/fs_master_access.db
+    bootstrap_access_model:
+      users:
+        - username: admin
+          password: admin
+          can_manage_users: true
+      scope_access: []
+    transfer_state_store:
+      kind: tikv
+      tikv:
+        pd_endpoints:
+          - 127.0.0.1:2379
+        key_prefix: /fluxon_fs_transfer/
+    s3_gateway:
+      get_object_inflight_pieces: 8
+      kv_miss_policy: remote_read
+
+  cache:
+    stale_window_ms: 5000
+    write_session_target_inflight_bytes: 134217728
+    rules:
+      - dir_abs: /var/lib/fluxon/local_shared
+        cache_mode: read_through
+        write_mode: write_through
+        kv_key_prefix: /fluxon_fs_cache/local_shared/
+        bytes_field_key: bytes
+        max_cache_bytes: 1048576
+        on_refresh_error: apply_stale_window
+    exports:
+      demo:
+        remote_root_dir_abs: /var/lib/fluxon/export_root
+        nodes:
+          - fluxon_fs_writer
+        cache_max_bytes: 1048576
+```
 
-`fluxon_fs.master` 的核心字段：
+读这段时抓三个点：
 
-- `instance_key` 必填。
-- `pull_interval_ms` 可选，但如果给出必须 `> 0`。
-- 旧的 `fluxon_fs.rpc` 和 `rpc_timeout_ms` 已移除。
+- `fluxon_fs.master` 很小，当前稳定字段只有 `instance_key` 和可选的 `pull_interval_ms`；旧的 `fluxon_fs.rpc` 和 `rpc_timeout_ms` 已移除。
+- `fluxon_fs.master_panel` 负责 UI/S3 授权和 transfer 状态；`listen_addr`、`public_base_url`、`prometheus_base_url`、`access_db_path`、`bootstrap_access_model`、`s3_gateway` 都是启动基线。
+- `fluxon_fs.cache` 负责目录级 cache / export 规则；`rules[*].dir_abs` 和 `exports[*].remote_root_dir_abs` 都必须是绝对路径。
 
-`fluxon_fs.master_panel` 的核心字段：
+还要记住两个分支规则：
 
-- `listen_addr`、`public_base_url`、`prometheus_base_url`、`access_db_path` 都是必需基线。
-- `bootstrap_access_model` 是面板的启动授权模型。
-- `transfer_state_store` 当前稳定实现是 `tikv`。
-- `s3_gateway` 负责对象请求和 KV miss 策略。
+- `exports.<name>.nodes` 缺失时，路由模式是 `AgentRegistry`；给出时是 `StaticNodes`。
+- `write_session_target_inflight_bytes` 可缺省，默认 128 MiB；但给出时必须 `> 0`。
 
 FS 还把访问模型拆成两层：
 
@@ -218,10 +403,35 @@ FS 还把访问模型拆成两层：
 
 `fluxon_cli/src/config.rs` 定义统一监控页配置，KV 的 `master_ui` 和 TestStack 的 UI 都复用它。
 
-| 类型 | 关键字段 |
-| --- | --- |
-| `MonitorConfigYaml` | `etcd_endpoints`、`prometheus_base_url`、`cluster_name`、`member_kind`、`output` |
-| 可选项 | `mq_unique_key_prefixes`、`http_listen_addr`、`greptime_sql` |
+最小骨架：
+
+```yaml
+etcd_endpoints:
+  - http://127.0.0.1:2379
+
+prometheus_base_url: http://127.0.0.1:4000/v1/prometheus
+cluster_name: demo-kv-cluster
+
+# kv / mq / fs
+member_kind: kv
+
+# cli / web
+output: web
+
+# 可选；web 模式常用
+http_listen_addr: 0.0.0.0:18080
+
+# 可选；只有 MQ 页面需要扫描 unique key 时再给
+# mq_unique_key_prefixes:
+#   - /fluxon_mq_unique/
+
+# 可选；不写时，如果 prometheus_base_url 明确指向 Greptime /v1/prometheus，
+# 会自动派生默认 SQL 连接信息
+# greptime_sql:
+#   base_url: http://127.0.0.1:4000
+#   db: public
+#   log_table: fluxon_logs
+```
 
 主要约束：
 
@@ -234,12 +444,36 @@ FS 还把访问模型拆成两层：
 
 `fluxon_commu_contract` 提供多个被 KV / FS 共同复用的基础类型：
 
-| 类型 | 取值 | 作用 |
-| --- | --- | --- |
-| `ProtocolType` | `Tcp` / `Rdma` | 输入协议选择 |
-| `TransferEngineType` | `Closed` / `P2p` | 传输引擎分支 |
-| `TransferBackendActivationMode` | 三个显式分支 | 控制 backend 激活方式 |
-| `NetworkConfig` | `subnet_whitelist`、`primary_ip_to_extended_ips` | 网络白名单和 IP 扩展映射 |
+最常见的是 `NetworkConfig` 这块 YAML：
+
+```yaml
+network:
+  subnet_whitelist:
+    - 127.0.0.0/8
+    - 10.0.0.0/24
+  primary_ip_to_extended_ips:
+    10.0.0.10:
+      - 10.0.0.11
+      - 10.0.0.12
+```
+
+以及协议分支输入 `protocol` 的两种取值写法：
+
+```yaml
+protocol:
+  protocol_type: rdma
+```
+
+```yaml
+protocol:
+  protocol_type: tcp
+```
+
+这里对应的稳定枚举取值是：
+
+- `ProtocolType`: `tcp` / `rdma`
+- `TransferEngineType`: `Closed` / `P2p`
+- `TransferBackendActivationMode`: `RdmaControl` / `TcpTestBypassRdmaControl` / `TestForceEnableBypassRdmaControl`
 
 这些类型是共享契约，不属于某一个子系统的私有配置。
 
diff --git a/fluxon_test_stack/ci_2_virt_node.py b/fluxon_test_stack/ci_2_virt_node.py
index 7f91716..405c9a2 100644
--- a/fluxon_test_stack/ci_2_virt_node.py
+++ b/fluxon_test_stack/ci_2_virt_node.py
@@ -710,6 +710,7 @@ def _render_ci_nix_pack_config(
     env_cfg = _load_yaml_mapping(env_companion_path.resolve(), ctx="CI pack env companion")
     merged_cfg = copy.deepcopy(static_cfg)
     merged_cfg.update(copy.deepcopy(env_cfg))
+    merged_cfg["project_root"] = str(repo_root.resolve())
 
     profile_cfg = merged_cfg.get("profile")
     if not isinstance(profile_cfg, dict):
diff --git a/fluxon_test_stack/tests/test_ci_2_virt_node_contract.py b/fluxon_test_stack/tests/test_ci_2_virt_node_contract.py
index b8f1e2e..100bec7 100644
--- a/fluxon_test_stack/tests/test_ci_2_virt_node_contract.py
+++ b/fluxon_test_stack/tests/test_ci_2_virt_node_contract.py
@@ -347,6 +347,54 @@ def fake_run(argv: list[str], *, env=None) -> None:
             self.assertIn(str(env_path.resolve()), calls[0])
             self.assertIn(str((root / "pack_release_runtime").resolve()), calls[0])
 
+    def test_render_ci_nix_pack_config_sets_explicit_project_root(self) -> None:
+        with tempfile.TemporaryDirectory() as td:
+            root = Path(td)
+            static_config_path = root / "static.yaml"
+            env_companion_path = root / "env.yaml"
+            out_path = root / "generated" / "setup_and_pack" / "nix" / "pack_fluxonkv_pylib_ci.yaml"
+
+            _ENTRY._write_yaml(
+                static_config_path,
+                {
+                    "schema_version": 1,
+                    "runtime": {
+                        "base_system": "manylinux_2_28",
+                        "architectures": ["x86_64"],
+                        "python_abi": "cpython3.10",
+                    },
+                    "profile": {
+                        "source_kind": "bridge_prebuilt",
+                        "native_runtime_dir_names": ["cxxpacked"],
+                        "target_support_dir_names": ["meson-0.64.0"],
+                        "ext_bundle_dir_name": "cxxpacked",
+                    },
+                    "assembly": {
+                        "baseline_path": "/tmp/baseline",
+                    },
+                },
+            )
+            _ENTRY._write_yaml(
+                env_companion_path,
+                {
+                    "host_paths": {
+                        "root_path": "/tmp/project-data",
+                    },
+                },
+            )
+
+            rendered_path = _ENTRY._render_ci_nix_pack_config(
+                static_config_path=static_config_path,
+                env_companion_path=env_companion_path,
+                out_path=out_path,
+                repo_root=REPO_ROOT,
+            )
+
+            self.assertEqual(rendered_path, out_path.resolve())
+            rendered_cfg = _ENTRY._load_yaml_mapping(rendered_path, ctx="rendered nix pack config")
+            self.assertEqual(rendered_cfg["project_root"], str(REPO_ROOT.resolve()))
+            self.assertEqual(rendered_cfg["profile"]["build_root_path"], str(REPO_ROOT.resolve()))
+
     def test_prepare_pack_release_runtime_dirs_creates_expected_layout(self) -> None:
         with tempfile.TemporaryDirectory() as td:
             root = Path(td) / "pack_release_runtime"
diff --git a/setup_and_pack/nix/lib_layout.py b/setup_and_pack/nix/lib_layout.py
index 8322a55..b25d7d1 100644
--- a/setup_and_pack/nix/lib_layout.py
+++ b/setup_and_pack/nix/lib_layout.py
@@ -41,6 +41,7 @@
 PACK_CONFIG_STATIC_STEM_SUFFIX = "_static"
 PACK_CONFIG_ENV_STEM_SUFFIX = "_env"
 DEFAULT_PACK_CONFIG_ENV_DIR_NAME = "setup_and_pack"
+PROJECT_ROOT_CONFIG_KEY = "project_root"
 HOST_PATHS_ROOT_KEY = "root_path"
 DEFAULT_HOST_PATH_SUFFIXES = {
     ("store", "project_data_root"): "",
@@ -224,7 +225,7 @@ def load_experiment_spec_from_root(*, config_path: Path, config_root: dict) -> E
     profile_config = _require_mapping(raw_config, "profile")
     assembly_config = _require_mapping(raw_config, "assembly")
 
-    project_root = _detect_project_root(config_path=config_path)
+    project_root = _resolve_project_root(config_path=config_path, raw_config=raw_config)
     project_data_root = _require_absolute_path(store_config, "project_data_root")
     base_system = _require_enum_string(runtime_config, "base_system", SUPPORTED_BASE_SYSTEMS)
     architectures = tuple(
@@ -547,6 +548,25 @@ def _detect_project_root(*, config_path: Path) -> Path:
     )
 
 
+def _resolve_project_root(*, config_path: Path, raw_config: dict) -> Path:
+    configured_project_root = _optional_non_empty_string(raw_config, PROJECT_ROOT_CONFIG_KEY)
+    if configured_project_root is not None:
+        project_root = Path(configured_project_root)
+        if not project_root.is_absolute():
+            raise RuntimeError(
+                f"config.{PROJECT_ROOT_CONFIG_KEY} must be an absolute path: {configured_project_root}"
+            )
+        resolved_project_root = project_root.resolve()
+        if not _is_project_root_candidate(resolved_project_root):
+            raise RuntimeError(
+                "config.project_root must point at a project root containing one of "
+                f"{PROJECT_ROOT_MARKER_FILE_NAMES + PROJECT_ROOT_MARKER_DIR_NAMES} "
+                f"and child dirs {PROJECT_ROOT_REQUIRED_CHILD_DIR_NAMES}: {resolved_project_root}"
+            )
+        return resolved_project_root
+    return _detect_project_root(config_path=config_path)
+
+
 def _is_project_root_candidate(candidate_root: Path) -> bool:
     has_marker = any(
         (candidate_root / marker_name).exists()
diff --git a/setup_and_pack/tests/test_lib_layout.py b/setup_and_pack/tests/test_lib_layout.py
index 6d05d54..049be32 100644
--- a/setup_and_pack/tests/test_lib_layout.py
+++ b/setup_and_pack/tests/test_lib_layout.py
@@ -139,6 +139,41 @@ def test_load_experiment_spec_from_root_parses_closed_sdk_search_roots(self) ->
                 (str(closed_sdk_root.resolve()),),
             )
 
+    def test_load_experiment_spec_from_root_accepts_explicit_project_root(self) -> None:
+        with tempfile.TemporaryDirectory() as tmpdir:
+            root = Path(tmpdir)
+            project_root = root / "repo"
+            generated_config_path = root / "generated" / "setup_and_pack" / "nix" / "pack_fluxonkv_pylib_ci.yaml"
+            (project_root / ".git").mkdir(parents=True, exist_ok=True)
+            (project_root / "setup_and_pack").mkdir(parents=True, exist_ok=True)
+            generated_config_path.parent.mkdir(parents=True, exist_ok=True)
+
+            spec = _LIB_LAYOUT.load_experiment_spec_from_root(
+                config_path=generated_config_path,
+                config_root={
+                    "project_root": str(project_root.resolve()),
+                    "store": {
+                        "project_data_root": str((root / "project_data").resolve()),
+                    },
+                    "runtime": {
+                        "base_system": "manylinux_2_28",
+                        "architectures": ["x86_64"],
+                        "python_abi": "cpython3.10",
+                    },
+                    "profile": {
+                        "source_kind": "bridge_prebuilt",
+                        "native_runtime_dir_names": ["cxxpacked"],
+                        "target_support_dir_names": ["meson-0.64.0"],
+                        "ext_bundle_dir_name": "cxxpacked",
+                    },
+                    "assembly": {
+                        "baseline_path": str((root / "baseline").resolve()),
+                    },
+                },
+            )
+
+            self.assertEqual(spec.project_root, project_root.resolve())
+
     def test_load_experiment_config_root_expands_host_root_aliases(self) -> None:
         with tempfile.TemporaryDirectory() as tmpdir:
             root = Path(tmpdir)

From ac18cc77595e29ce1f453e7a1e0aa8272251a6ee Mon Sep 17 00:00:00 2001
From: ActivePeter <1020401660@qq.com>
Date: Wed, 24 Jun 2026 12:05:29 +0800
Subject: [PATCH 10/13] test

---
 deployment/gen_bare_deploy_bash.py            |  12 +-
 ...ction_supervisor_launch_wait_block.sh.tmpl |   4 +-
 deployment/tests/test_gen_bare_deploy_bash.py | 133 ++-
 .../test_start_test_bed_bootstrap_log.py      |  40 +
 deployment/utils/proc_lifecycle_codegen.py    |  39 +-
 examples/fluxon_quick_start/start.py          |   3 +-
 examples/start_kv_and_fs_svc.py               |   7 +
 examples/start_master_owner.py                |   7 +
 ...15\347\275\256\346\200\273\350\247\210.md" |   7 +-
 ...13\350\257\225\346\265\201\347\250\213.md" |   2 +-
 ...15\345\212\241\345\271\263\351\235\242.md" |   3 +
 ...7 - 3 - KV-RPC\346\216\245\345\217\243.md" |   3 +
 ...0\267 - 4 - MQ\346\216\245\345\217\243.md" |   3 +
 ...0\267 - 5 - FS\346\216\245\345\217\243.md" |   3 +
 .../User - 3 - KV and RPC Interface.md        |   3 +
 fluxon_py/config.py                           | 269 +++--
 .../tests/fluxon_fs_transfer_tikv_support.py  |   3 +
 ...est_backend_relay_deployconf.template.yaml |  12 +
 fluxon_py/tests/test_backend_relay_docker.py  |  73 +-
 fluxon_py/tests/test_config.py                | 170 ++-
 .../tests/test_mq/test_example_ctrl_c_exit.py |   3 +
 fluxon_rs/fluxon_fs/src/agent.rs              |  11 +-
 fluxon_rs/fluxon_fs/src/agent_service.rs      |   7 +
 .../src/agent_service/transfer_agent.rs       |  39 +-
 fluxon_rs/fluxon_fs/src/remote_disk_cache.rs  |   6 +-
 fluxon_rs/fluxon_kv/framework_init_steps.yaml | 146 +--
 .../fluxon_kv/src/client_seg_pool/mod.rs      |  30 +-
 fluxon_rs/fluxon_kv/src/config.rs             | 191 +++-
 .../external_client_test.rs                   |   8 +-
 .../fluxon_kv/src/external_client_api/mod.rs  |  10 +-
 fluxon_rs/fluxon_kv/src/kv_test.rs            |  40 +-
 fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs    |   3 +-
 fluxon_rs/fluxon_kv/src/lib.rs                | 161 +--
 .../fluxon_kv/src/memholder/memholder_test.rs |   8 +-
 fluxon_rs/fluxon_util/src/log.rs              |  12 +-
 fluxon_rs/fluxon_util/tests/log_mgmt.rs       |  14 +
 fluxon_test_stack/start_test_bed.py           |  19 +-
 skills/browser-helm/SKILL.md                  | 232 ----
 skills/browser-helm/agents/openai.yaml        |   6 -
 skills/browser-helm/references/commands.md    | 131 ---
 skills/canvas-dag_organizer-v1/SKILL.md       |  10 -
 .../agents/openai.yaml                        |   6 -
 skills/canvas-ops-v1/SKILL.md                 |  10 -
 skills/canvas-ops-v1/agents/openai.yaml       |   6 -
 skills/canvas-tidy_selection-v1/SKILL.md      |  10 -
 .../agents/openai.yaml                        |   6 -
 skills/find-skills/SKILL.md                   | 133 ---
 skills/imagegen/LICENSE.txt                   | 201 ----
 skills/imagegen/SKILL.md                      | 356 -------
 skills/imagegen/agents/openai.yaml            |   6 -
 skills/imagegen/assets/imagegen-small.svg     |   5 -
 skills/imagegen/assets/imagegen.png           | Bin 1711 -> 0 bytes
 skills/imagegen/references/cli.md             | 242 -----
 skills/imagegen/references/codex-network.md   |  33 -
 skills/imagegen/references/image-api.md       |  90 --
 skills/imagegen/references/prompting.md       | 118 ---
 skills/imagegen/references/sample-prompts.md  | 433 --------
 skills/imagegen/scripts/image_gen.py          | 995 ------------------
 skills/imagegen/scripts/remove_chroma_key.py  | 440 --------
 skills/openai-docs/LICENSE.txt                | 201 ----
 skills/openai-docs/SKILL.md                   | 167 ---
 skills/openai-docs/agents/openai.yaml         |  14 -
 skills/openai-docs/assets/openai-small.svg    |   3 -
 skills/openai-docs/assets/openai.png          | Bin 1429 -> 0 bytes
 skills/openai-docs/references/latest-model.md |  37 -
 .../openai-docs/references/prompting-guide.md | 244 -----
 .../openai-docs/references/upgrade-guide.md   | 181 ----
 .../scripts/fetch-codex-manual.mjs            | 598 -----------
 .../scripts/resolve-latest-model-info.js      | 147 ---
 skills/plugin-creator/SKILL.md                | 243 -----
 skills/plugin-creator/agents/openai.yaml      |   6 -
 .../assets/plugin-creator-small.svg           |   3 -
 .../plugin-creator/assets/plugin-creator.png  | Bin 1563 -> 0 bytes
 .../references/installing-and-updating.md     | 143 ---
 .../references/plugin-json-spec.md            | 194 ----
 .../scripts/create_basic_plugin.py            | 324 ------
 .../scripts/read_marketplace_name.py          |  48 -
 .../scripts/update_plugin_cachebuster.py      |  78 --
 .../plugin-creator/scripts/validate_plugin.py | 593 -----------
 .../SKILL.md                                  |  11 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  10 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  10 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  10 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  10 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  16 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  27 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  10 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  10 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  10 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  10 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  10 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  10 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  10 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  10 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  10 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  15 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  10 -
 .../agents/openai.yaml                        |   6 -
 .../SKILL.md                                  |  10 -
 .../agents/openai.yaml                        |   6 -
 skills/rs-skill-smoke-09e1daf7/SKILL.md       |   8 -
 skills/rs-skill-smoke-529efbc9/SKILL.md       |   8 -
 skills/rs-skill-smoke-cde1029f/SKILL.md       |   8 -
 skills/skill-creator/SKILL.md                 | 416 --------
 skills/skill-creator/agents/openai.yaml       |   5 -
 .../assets/skill-creator-small.svg            |   3 -
 skills/skill-creator/assets/skill-creator.png | Bin 1563 -> 0 bytes
 skills/skill-creator/license.txt              | 202 ----
 .../skill-creator/references/openai_yaml.md   |  49 -
 .../scripts/generate_openai_yaml.py           | 226 ----
 skills/skill-creator/scripts/init_skill.py    | 400 -------
 .../skill-creator/scripts/quick_validate.py   | 101 --
 skills/skill-installer/LICENSE.txt            | 202 ----
 skills/skill-installer/SKILL.md               |  58 -
 skills/skill-installer/agents/openai.yaml     |   5 -
 .../assets/skill-installer-small.svg          |   3 -
 .../assets/skill-installer.png                | Bin 1086 -> 0 bytes
 .../skill-installer/scripts/github_utils.py   |  21 -
 .../scripts/install-skill-from-github.py      | 308 ------
 skills/skill-installer/scripts/list-skills.py | 107 --
 137 files changed, 907 insertions(+), 9753 deletions(-)
 delete mode 100644 skills/browser-helm/SKILL.md
 delete mode 100644 skills/browser-helm/agents/openai.yaml
 delete mode 100644 skills/browser-helm/references/commands.md
 delete mode 100644 skills/canvas-dag_organizer-v1/SKILL.md
 delete mode 100644 skills/canvas-dag_organizer-v1/agents/openai.yaml
 delete mode 100644 skills/canvas-ops-v1/SKILL.md
 delete mode 100644 skills/canvas-ops-v1/agents/openai.yaml
 delete mode 100644 skills/canvas-tidy_selection-v1/SKILL.md
 delete mode 100644 skills/canvas-tidy_selection-v1/agents/openai.yaml
 delete mode 100644 skills/find-skills/SKILL.md
 delete mode 100644 skills/imagegen/LICENSE.txt
 delete mode 100644 skills/imagegen/SKILL.md
 delete mode 100644 skills/imagegen/agents/openai.yaml
 delete mode 100644 skills/imagegen/assets/imagegen-small.svg
 delete mode 100644 skills/imagegen/assets/imagegen.png
 delete mode 100644 skills/imagegen/references/cli.md
 delete mode 100644 skills/imagegen/references/codex-network.md
 delete mode 100644 skills/imagegen/references/image-api.md
 delete mode 100644 skills/imagegen/references/prompting.md
 delete mode 100644 skills/imagegen/references/sample-prompts.md
 delete mode 100644 skills/imagegen/scripts/image_gen.py
 delete mode 100644 skills/imagegen/scripts/remove_chroma_key.py
 delete mode 100644 skills/openai-docs/LICENSE.txt
 delete mode 100644 skills/openai-docs/SKILL.md
 delete mode 100644 skills/openai-docs/agents/openai.yaml
 delete mode 100644 skills/openai-docs/assets/openai-small.svg
 delete mode 100644 skills/openai-docs/assets/openai.png
 delete mode 100644 skills/openai-docs/references/latest-model.md
 delete mode 100644 skills/openai-docs/references/prompting-guide.md
 delete mode 100644 skills/openai-docs/references/upgrade-guide.md
 delete mode 100644 skills/openai-docs/scripts/fetch-codex-manual.mjs
 delete mode 100644 skills/openai-docs/scripts/resolve-latest-model-info.js
 delete mode 100644 skills/plugin-creator/SKILL.md
 delete mode 100644 skills/plugin-creator/agents/openai.yaml
 delete mode 100644 skills/plugin-creator/assets/plugin-creator-small.svg
 delete mode 100644 skills/plugin-creator/assets/plugin-creator.png
 delete mode 100644 skills/plugin-creator/references/installing-and-updating.md
 delete mode 100644 skills/plugin-creator/references/plugin-json-spec.md
 delete mode 100644 skills/plugin-creator/scripts/create_basic_plugin.py
 delete mode 100644 skills/plugin-creator/scripts/read_marketplace_name.py
 delete mode 100644 skills/plugin-creator/scripts/update_plugin_cachebuster.py
 delete mode 100644 skills/plugin-creator/scripts/validate_plugin.py
 delete mode 100644 skills/prompt-0ca565e9-3d44-45f1-832d-caa438aceddb/SKILL.md
 delete mode 100644 skills/prompt-0ca565e9-3d44-45f1-832d-caa438aceddb/agents/openai.yaml
 delete mode 100644 skills/prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971/SKILL.md
 delete mode 100644 skills/prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971/agents/openai.yaml
 delete mode 100644 skills/prompt-1323c8c8-88a0-40d2-89df-14fc9533a122/SKILL.md
 delete mode 100644 skills/prompt-1323c8c8-88a0-40d2-89df-14fc9533a122/agents/openai.yaml
 delete mode 100644 skills/prompt-144929a0-ae69-404b-9f58-a8696378e4e3/SKILL.md
 delete mode 100644 skills/prompt-144929a0-ae69-404b-9f58-a8696378e4e3/agents/openai.yaml
 delete mode 100644 skills/prompt-15d9a907-a363-4ec7-81ad-806f9418ad72/SKILL.md
 delete mode 100644 skills/prompt-15d9a907-a363-4ec7-81ad-806f9418ad72/agents/openai.yaml
 delete mode 100644 skills/prompt-193dd3cd-2722-413b-b88c-12c2af645f80/SKILL.md
 delete mode 100644 skills/prompt-193dd3cd-2722-413b-b88c-12c2af645f80/agents/openai.yaml
 delete mode 100644 skills/prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7/SKILL.md
 delete mode 100644 skills/prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7/agents/openai.yaml
 delete mode 100644 skills/prompt-2d53cebd-afd4-4d35-94e9-74436da3148a/SKILL.md
 delete mode 100644 skills/prompt-2d53cebd-afd4-4d35-94e9-74436da3148a/agents/openai.yaml
 delete mode 100644 skills/prompt-2eaed145-d789-4b27-93b9-8ea990830b3a/SKILL.md
 delete mode 100644 skills/prompt-2eaed145-d789-4b27-93b9-8ea990830b3a/agents/openai.yaml
 delete mode 100644 skills/prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb/SKILL.md
 delete mode 100644 skills/prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb/agents/openai.yaml
 delete mode 100644 skills/prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca/SKILL.md
 delete mode 100644 skills/prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca/agents/openai.yaml
 delete mode 100644 skills/prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8/SKILL.md
 delete mode 100644 skills/prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8/agents/openai.yaml
 delete mode 100644 skills/prompt-615e1231-fe33-47f8-bf35-29fdf3766d98/SKILL.md
 delete mode 100644 skills/prompt-615e1231-fe33-47f8-bf35-29fdf3766d98/agents/openai.yaml
 delete mode 100644 skills/prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2/SKILL.md
 delete mode 100644 skills/prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2/agents/openai.yaml
 delete mode 100644 skills/prompt-8c5cc431-635c-4c94-9deb-a502e77160eb/SKILL.md
 delete mode 100644 skills/prompt-8c5cc431-635c-4c94-9deb-a502e77160eb/agents/openai.yaml
 delete mode 100644 skills/prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c/SKILL.md
 delete mode 100644 skills/prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c/agents/openai.yaml
 delete mode 100644 skills/prompt-ac42abf9-6df8-4539-99c7-e402e905a03b/SKILL.md
 delete mode 100644 skills/prompt-ac42abf9-6df8-4539-99c7-e402e905a03b/agents/openai.yaml
 delete mode 100644 skills/prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315/SKILL.md
 delete mode 100644 skills/prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315/agents/openai.yaml
 delete mode 100644 skills/prompt-f118ab91-390b-48e2-a962-3abe4d54211e/SKILL.md
 delete mode 100644 skills/prompt-f118ab91-390b-48e2-a962-3abe4d54211e/agents/openai.yaml
 delete mode 100644 skills/rs-skill-smoke-09e1daf7/SKILL.md
 delete mode 100644 skills/rs-skill-smoke-529efbc9/SKILL.md
 delete mode 100644 skills/rs-skill-smoke-cde1029f/SKILL.md
 delete mode 100644 skills/skill-creator/SKILL.md
 delete mode 100644 skills/skill-creator/agents/openai.yaml
 delete mode 100644 skills/skill-creator/assets/skill-creator-small.svg
 delete mode 100644 skills/skill-creator/assets/skill-creator.png
 delete mode 100644 skills/skill-creator/license.txt
 delete mode 100644 skills/skill-creator/references/openai_yaml.md
 delete mode 100644 skills/skill-creator/scripts/generate_openai_yaml.py
 delete mode 100644 skills/skill-creator/scripts/init_skill.py
 delete mode 100644 skills/skill-creator/scripts/quick_validate.py
 delete mode 100644 skills/skill-installer/LICENSE.txt
 delete mode 100644 skills/skill-installer/SKILL.md
 delete mode 100644 skills/skill-installer/agents/openai.yaml
 delete mode 100644 skills/skill-installer/assets/skill-installer-small.svg
 delete mode 100644 skills/skill-installer/assets/skill-installer.png
 delete mode 100644 skills/skill-installer/scripts/github_utils.py
 delete mode 100644 skills/skill-installer/scripts/install-skill-from-github.py
 delete mode 100644 skills/skill-installer/scripts/list-skills.py

diff --git a/deployment/gen_bare_deploy_bash.py b/deployment/gen_bare_deploy_bash.py
index fdd5d0e..5d047ed 100644
--- a/deployment/gen_bare_deploy_bash.py
+++ b/deployment/gen_bare_deploy_bash.py
@@ -49,8 +49,8 @@
 ATOMIC_GROUP_CRASHLOOP_INTERVAL_LT_SECONDS = 30
 ATOMIC_GROUP_PROBABLE_READY_SECONDS = 10
 STANDALONE_PROBABLE_READY_SECONDS = 10
-STANDALONE_STARTUP_DEADLINE_SECONDS = 10
-ATOMIC_GROUP_STARTUP_DEADLINE_SECONDS = 10
+STANDALONE_STARTUP_DEADLINE_SECONDS = 20
+ATOMIC_GROUP_STARTUP_DEADLINE_SECONDS = 20
 HOSTWORKDIR_RUNTIME_TOKEN = "${HOSTWORKDIR}"
 REPO_ROOT = SCRIPT_DIR.parent
 BARE_TEMPLATE_DIR = SCRIPT_DIR / "templates" / "gen_bare_deploy_bash"
@@ -552,7 +552,7 @@ def _render_selection_supervisor_launch_wait_block(
     *,
     run_cmd: str,
     stable_seconds_expr: str,
-    deadline_ts_expr: str,
+    deadline_seconds_expr: str,
     context: str,
 ) -> str:
     return _render_bare_template(
@@ -560,7 +560,7 @@ def _render_selection_supervisor_launch_wait_block(
         values={
             "RUN_CMD": run_cmd,
             "STABLE_SECONDS_EXPR": stable_seconds_expr,
-            "DEADLINE_TS_EXPR": deadline_ts_expr,
+            "DEADLINE_SECONDS_EXPR": deadline_seconds_expr,
             "CONTEXT": context,
         },
     )
@@ -619,7 +619,7 @@ def _render_standalone_start_body(*, name_prefix: str, service_name: str) -> str
             "SELECTION_SUPERVISOR_LAUNCH_WAIT_BLOCK": _render_selection_supervisor_launch_wait_block(
                 run_cmd=run_cmd,
                 stable_seconds_expr=str(STANDALONE_PROBABLE_READY_SECONDS),
-                deadline_ts_expr=f'$(( $(date +%s) + {STANDALONE_STARTUP_DEADLINE_SECONDS} ))',
+                deadline_seconds_expr=str(STANDALONE_STARTUP_DEADLINE_SECONDS),
                 context="[bare]",
             ),
         },
@@ -693,7 +693,7 @@ def _render_atomic_group_service_block(
                 script=_render_selection_supervisor_launch_wait_block(
                     run_cmd=run_cmd,
                     stable_seconds_expr=str(ATOMIC_GROUP_PROBABLE_READY_SECONDS),
-                    deadline_ts_expr=f'$(( $(date +%s) + {ATOMIC_GROUP_STARTUP_DEADLINE_SECONDS} ))',
+                    deadline_seconds_expr=str(ATOMIC_GROUP_STARTUP_DEADLINE_SECONDS),
                     context="[rollout]",
                 ).rstrip()
                 + "\n",
diff --git a/deployment/templates/gen_bare_deploy_bash/selection_supervisor_launch_wait_block.sh.tmpl b/deployment/templates/gen_bare_deploy_bash/selection_supervisor_launch_wait_block.sh.tmpl
index 52cce05..702e5bd 100644
--- a/deployment/templates/gen_bare_deploy_bash/selection_supervisor_launch_wait_block.sh.tmpl
+++ b/deployment/templates/gen_bare_deploy_bash/selection_supervisor_launch_wait_block.sh.tmpl
@@ -3,8 +3,8 @@ if [[ ! "$SUPERVISOR_PID" =~ ^[0-9]+$ ]]; then
   echo "{{CONTEXT}} launch failed svc=$SERVICE label=$SUPERVISOR_LABEL supervisor_pid=$SUPERVISOR_PID"
   exit 1
 fi
-STARTUP_DEADLINE_TS={{DEADLINE_TS_EXPR}}
-if ! wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" {{STABLE_SECONDS_EXPR}} "$STARTUP_DEADLINE_TS" "{{CONTEXT}}"; then
+STARTUP_DEADLINE_SECONDS={{DEADLINE_SECONDS_EXPR}}
+if ! wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" {{STABLE_SECONDS_EXPR}} "$STARTUP_DEADLINE_SECONDS" "{{CONTEXT}}"; then
   echo "{{CONTEXT}} probable-ready failed svc=$SERVICE label=$SUPERVISOR_LABEL supervisor_pid=$SUPERVISOR_PID"
   exit 1
 fi
diff --git a/deployment/tests/test_gen_bare_deploy_bash.py b/deployment/tests/test_gen_bare_deploy_bash.py
index 19f80ac..0ca0a79 100644
--- a/deployment/tests/test_gen_bare_deploy_bash.py
+++ b/deployment/tests/test_gen_bare_deploy_bash.py
@@ -5,6 +5,7 @@
 import argparse
 import importlib.util
 import os
+import shlex
 import subprocess
 import sys
 import tempfile
@@ -62,6 +63,7 @@ def _build_checks(selected_test_id: Optional[str]) -> List[Tuple[str, Callable[[
         ("supervisor_label_uses_stable_selection_suffix", test_supervisor_label_uses_stable_selection_suffix),
         ("bootstrap_start_reuses_already_present_selection", test_bootstrap_start_reuses_already_present_selection),
         ("bare_start_fails_when_child_exits_within_startup_window", test_bare_start_fails_when_child_exits_within_startup_window),
+        ("pid_ready_check_requires_full_stable_window_after_first_child_observation", test_pid_ready_check_requires_full_stable_window_after_first_child_observation),
         ("atomic_group_start_does_not_auto_stop_on_failure", test_atomic_group_start_does_not_auto_stop_on_failure),
         ("atomic_group_preserves_nested_heredoc_terminator", test_atomic_group_preserves_nested_heredoc_terminator),
         ("atomic_group_stop_script_is_shell_valid", test_atomic_group_stop_script_is_shell_valid),
@@ -137,7 +139,7 @@ def test_preserves_hostworkdir_runtime_token() -> None:
         assert "wait-present" not in script, script
         assert "launch_only_start_gate" not in script, script
         _assert_standalone_deadline_after_launch(script)
-        assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_TS" "[bare]"' in script, script
+        assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_SECONDS" "[bare]"' in script, script
         assert "export SERVICE_PORT=12345" in script, script
         assert "wait_service_tcp_ready" not in script, script
         assert "wait_service_etcd_endpoint_healthy" not in script, script
@@ -195,11 +197,11 @@ def test_atomic_group_start_does_not_auto_stop_on_failure() -> None:
         assert 'SUPERVISOR_PID=$( setsid ' not in script, script
         assert 'echo "[rollout] probable-ready failed svc=$SERVICE label=$SUPERVISOR_LABEL supervisor_pid=$SUPERVISOR_PID"' in script, script
         assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID"' in script, script
-        assert 'GROUP_STARTUP_DEADLINE_TS=' not in script, script
-        assert script.count('STARTUP_DEADLINE_TS=$(( $(date +%s) + 10 ))') == 2, script
+        assert 'GROUP_STARTUP_DEADLINE_SECONDS=' not in script, script
+        assert script.count('STARTUP_DEADLINE_SECONDS=20') == 2, script
         _assert_deadline_after_launch(
             script=script,
-            wait_call='wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_TS" "[rollout]"',
+            wait_call='wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_SECONDS" "[rollout]"',
         )
         assert "export SERVICE_PORT=23456" in script, script
         assert "unset SERVICE_PORT" in script, script
@@ -330,7 +332,7 @@ def test_bare_start_uses_no_exit_startup_gate() -> None:
 
         for script in (etcd_script, tikv_script, plain_script):
             _assert_standalone_deadline_after_launch(script)
-            assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_TS" "[bare]"' in script, script
+            assert 'wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_SECONDS" "[bare]"' in script, script
             assert "wait_service_tcp_ready" not in script, script
             assert "wait_service_etcd_endpoint_healthy" not in script, script
         print("PASS: test_bare_start_uses_no_exit_startup_gate")
@@ -365,10 +367,10 @@ def test_normalized_testbed_master_exports_service_port_for_atomic_group() -> No
         assert "export MASTER__PORT=51051" in master_block, master_block
         assert "export SERVICE_PORT=51051" in master_block, master_block
         assert "unset SERVICE_PORT" not in master_block, master_block
-        assert 'GROUP_STARTUP_DEADLINE_TS=' not in master_block, master_block
+        assert 'GROUP_STARTUP_DEADLINE_SECONDS=' not in master_block, master_block
         _assert_deadline_after_launch(
             script=master_block,
-            wait_call='wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_TS" "[rollout]"',
+            wait_call='wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_SECONDS" "[rollout]"',
         )
         assert "wait_service_tcp_ready" not in master_block, master_block
         print("PASS: test_normalized_testbed_master_exports_service_port_for_atomic_group")
@@ -698,6 +700,119 @@ def test_bare_start_fails_when_child_exits_within_startup_window() -> None:
         print("PASS: test_bare_start_fails_when_child_exits_within_startup_window")
 
 
+def test_pid_ready_check_requires_full_stable_window_after_first_child_observation() -> None:
+    proc_lifecycle = _load_python_module(
+        module_name="test_proc_lifecycle_codegen_runtime",
+        path=DEPLOYMENT_DIR / "utils" / "proc_lifecycle_codegen.py",
+    )
+    helpers = proc_lifecycle.render_bash_proc_lifecycle_funcs_pid_tree(
+        timeouts=proc_lifecycle.StopTimeouts(term_seconds=60, kill_seconds=10, supersede_seconds=30)
+    )
+    with tempfile.TemporaryDirectory(prefix="test_proc_lifecycle_late_child_") as td:
+        tmpdir = Path(td)
+        shell_script = tmpdir / "probe.sh"
+        supervisor_script = tmpdir / "delayed_child_supervisor.py"
+        child_script = tmpdir / "sleep_child.py"
+
+        child_script.write_text(
+            textwrap.dedent(
+                """
+                #!/usr/bin/env python3
+                import signal
+                import time
+
+                def _handle_signal(_signum, _frame):
+                    raise SystemExit(0)
+
+                signal.signal(signal.SIGTERM, _handle_signal)
+                signal.signal(signal.SIGINT, _handle_signal)
+
+                while True:
+                    time.sleep(0.2)
+                """
+            ).strip()
+            + "\n",
+            encoding="utf-8",
+        )
+        supervisor_script.write_text(
+            textwrap.dedent(
+                f"""
+                #!/usr/bin/env python3
+                import signal
+                import subprocess
+                import sys
+                import time
+                from pathlib import Path
+
+                child = None
+
+                def _shutdown(_signum, _frame):
+                    global child
+                    if child is not None and child.poll() is None:
+                        child.terminate()
+                        try:
+                            child.wait(timeout=5)
+                        except subprocess.TimeoutExpired:
+                            child.kill()
+                    raise SystemExit(0)
+
+                signal.signal(signal.SIGTERM, _shutdown)
+                signal.signal(signal.SIGINT, _shutdown)
+
+                time.sleep(4)
+                child = subprocess.Popen([sys.executable, str(Path({str(child_script)!r}))])
+                while True:
+                    if child.poll() is not None:
+                        raise SystemExit(child.returncode or 0)
+                    time.sleep(0.2)
+                """
+            ).strip()
+            + "\n",
+            encoding="utf-8",
+        )
+
+        shell_script.write_text(
+            textwrap.dedent(
+                f"""\
+                #!/usr/bin/env bash
+                set -euo pipefail
+                {helpers}
+                python3 {shlex.quote(str(supervisor_script))} &
+                root_pid="$!"
+                startup_deadline_seconds=6
+                if wait_service_probably_ready_pid_tree "svc_plain" "$root_pid" 4 "$startup_deadline_seconds" "[test]"; then
+                  echo "unexpected success"
+                  kill "$root_pid" >/dev/null 2>&1 || true
+                  wait "$root_pid" >/dev/null 2>&1 || true
+                  exit 99
+                else
+                  wait_rc="$?"
+                fi
+                kill "$root_pid" >/dev/null 2>&1 || true
+                wait "$root_pid" >/dev/null 2>&1 || true
+                exit "$wait_rc"
+                """
+            ),
+            encoding="utf-8",
+        )
+        shell_script.chmod(0o755)
+
+        result = subprocess.run(
+            ["bash", str(shell_script)],
+            check=False,
+            capture_output=True,
+            text=True,
+            cwd=str(DEPLOYMENT_DIR.parent),
+            timeout=20,
+        )
+        assert result.returncode != 0, (
+            f"expected startup gate failure rc={result.returncode} stdout={result.stdout!r} stderr={result.stderr!r}"
+        )
+        assert "unexpected success" not in result.stdout, result.stdout
+        assert "child pid not stable long enough" in result.stdout, result.stdout
+        print("PASS: test_pid_ready_check_requires_full_stable_window_after_first_child_observation")
+
+
 def test_atomic_group_preserves_nested_heredoc_terminator() -> None:
     with tempfile.TemporaryDirectory(prefix="test_gen_bare_deploy_bash_atomic_heredoc_") as td:
         tmpdir = Path(td)
@@ -869,7 +984,7 @@ def _wait_until_selection_absent(
 
 def _assert_deadline_after_launch(*, script: str, wait_call: str) -> None:
     launch_check = 'if [[ ! "$SUPERVISOR_PID" =~ ^[0-9]+$ ]]; then'
-    deadline_assign = 'STARTUP_DEADLINE_TS=$(( $(date +%s) + 10 ))'
+    deadline_assign = 'STARTUP_DEADLINE_SECONDS=20'
     assert launch_check in script, script
     assert deadline_assign in script, script
     assert wait_call in script, script
@@ -883,7 +998,7 @@ def _assert_deadline_after_launch(*, script: str, wait_call: str) -> None:
 def _assert_standalone_deadline_after_launch(script: str) -> None:
     _assert_deadline_after_launch(
         script=script,
-        wait_call='wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_TS" "[bare]"',
+        wait_call='wait_service_probably_ready_pid_tree "$SERVICE" "$SUPERVISOR_PID" 10 "$STARTUP_DEADLINE_SECONDS" "[bare]"',
     )
 
 
diff --git a/deployment/tests/test_start_test_bed_bootstrap_log.py b/deployment/tests/test_start_test_bed_bootstrap_log.py
index 9f5ef49..2bd6b00 100644
--- a/deployment/tests/test_start_test_bed_bootstrap_log.py
+++ b/deployment/tests/test_start_test_bed_bootstrap_log.py
@@ -191,6 +191,46 @@ def test_failed_status_includes_bootstrap_and_service_log_tails() -> None:
         print("PASS: test_failed_status_includes_bootstrap_and_service_log_tails")
 
 
+def test_failed_status_resolves_daily_sharded_service_log_tail() -> None:
+    module = _load_start_test_bed_module()
+    with tempfile.TemporaryDirectory(prefix="test_start_test_bed_sharded_failure_tails_") as td:
+        root = Path(td)
+        bootstrap_log = root / "fluxon_core_controller.bootstrap.log"
+        bootstrap_log.write_text("[rollout] probable-ready failed svc=owner\n", encoding="utf-8")
+        base_service_log = root / "log" / "master.log"
+        base_service_log.parent.mkdir(parents=True, exist_ok=True)
+        sharded_service_log = root / "log" / "master.2026-06-23.log"
+        sharded_service_log.write_text("FATAL: owner bootstrap dependency failed\n", encoding="utf-8")
+        local_node_cfg = {
+            "hostname": "node-a",
+            "hostworkdir": str(root),
+        }
+        result = _build_result(
+            bootstrap_log_path=bootstrap_log,
+            launcher_rc=1,
+            selection_name="fluxon_core_controller",
+            bare_script_name="fluxon_core_controller",
+            node_name="node-a",
+            expected_service_names=["master"],
+        )
+        statuses = module._collect_bare_runtime_statuses(
+            deployconf={},
+            cluster_nodes={},
+            local_node_cfg=local_node_cfg,
+            result=result,
+        )
+        assert len(statuses) == 1, statuses
+        status = statuses[0]
+        assert status["present"] is False, status
+        assert status["running"] is False, status
+        assert status["log_path"] == str(sharded_service_log.resolve()), status
+        err = status["status_error"]
+        assert isinstance(err, str) and "bootstrap_log_tail=" in err, err
+        assert "service_log_tail=" in err, err
+        assert "owner bootstrap dependency failed" in err, err
+        print("PASS: test_failed_status_resolves_daily_sharded_service_log_tail")
+
+
 def test_testbed_template_tikv_uses_low_fd_limits_for_ci_runner() -> None:
     deployconf = yaml.safe_load((REPO_ROOT / "fluxon_test_stack" / "deployconf_testbed.yml").read_text(encoding="utf-8"))
     tikv_cfg = deployconf["service"]["tikv"]["entrypoint"]
diff --git a/deployment/utils/proc_lifecycle_codegen.py b/deployment/utils/proc_lifecycle_codegen.py
index b0acd71..197829f 100644
--- a/deployment/utils/proc_lifecycle_codegen.py
+++ b/deployment/utils/proc_lifecycle_codegen.py
@@ -164,29 +164,42 @@ def render_bash_proc_lifecycle_funcs_pid_tree(*, timeouts: StopTimeouts) -> str:
   '
 }}
 
+_now_monotonic_ms() {{
+  python3 - <<'__FLUXON_MONOTONIC_MS__'
+import time
+
+print(time.monotonic_ns() // 1_000_000)
+__FLUXON_MONOTONIC_MS__
+}}
+
 wait_service_probably_ready_pid_tree() {{
   # Startup gate contract:
-  # - Success means one supervised direct child PID becomes visible and stays unchanged across the
-  #   fixed startup window.
+  # - Success means one supervised direct child PID becomes visible, then stays unchanged for the
+  #   full startup_window_seconds before the overall startup deadline expires.
   # - During this startup window we do not probe service ports or readiness endpoints.
   # - A child exit or restart inside the window is treated as startup failure even if the
   #   supervisor process itself stays alive and restarts again later.
   svc="$1"
   root_pid="$2"
   startup_window_seconds="$3"
-  deadline_ts="$4"
+  startup_deadline_seconds="$4"
   context="$5"
 
   if [[ ! "$startup_window_seconds" =~ ^[0-9]+$ ]] || [ "$startup_window_seconds" -le 0 ]; then
     echo "$context probable-ready: invalid startup_window_seconds=$startup_window_seconds svc=$svc"
     return 1
   fi
-  if [[ ! "$deadline_ts" =~ ^[0-9]+$ ]] || [ "$deadline_ts" -le 0 ]; then
-    echo "$context probable-ready: invalid deadline_ts=$deadline_ts svc=$svc"
+  if [[ ! "$startup_deadline_seconds" =~ ^[0-9]+$ ]] || [ "$startup_deadline_seconds" -le 0 ]; then
+    echo "$context probable-ready: invalid startup_deadline_seconds=$startup_deadline_seconds svc=$svc"
     return 1
   fi
 
+  startup_window_ms=$(( startup_window_seconds * 1000 ))
+  startup_deadline_ms=$(( startup_deadline_seconds * 1000 ))
+  started_at_monotonic_ms="$(_now_monotonic_ms)"
+  deadline_monotonic_ms=$(( started_at_monotonic_ms + startup_deadline_ms ))
   observed_child_pid=""
+  observed_child_since_monotonic_ms=""
   while true; do
     if ! _pid_exists "$root_pid"; then
       echo "$context probable-ready: supervisor pid exited svc=$svc pid=$root_pid"
@@ -204,6 +217,7 @@ def render_bash_proc_lifecycle_funcs_pid_tree(*, timeouts: StopTimeouts) -> str:
       current_child_pid="$1"
     fi
 
+    now_monotonic_ms="$(_now_monotonic_ms)"
     if [ -z "$current_child_pid" ]; then
       if [ -n "$observed_child_pid" ]; then
         echo "$context probable-ready: child pid exited svc=$svc supervisor_pid=$root_pid child_pid=$observed_child_pid"
@@ -211,19 +225,24 @@ def render_bash_proc_lifecycle_funcs_pid_tree(*, timeouts: StopTimeouts) -> str:
       fi
     elif [ -z "$observed_child_pid" ]; then
       observed_child_pid="$current_child_pid"
+      observed_child_since_monotonic_ms="$now_monotonic_ms"
     elif [ "$current_child_pid" != "$observed_child_pid" ]; then
       echo "$context probable-ready: child pid changed svc=$svc supervisor_pid=$root_pid child_pid=$observed_child_pid replacement_child_pid=$current_child_pid"
       return 1
     fi
 
-    now=$(date +%s)
-    if [ "$now" -ge "$deadline_ts" ]; then
+    if [ -n "$observed_child_since_monotonic_ms" ] && [ $(( now_monotonic_ms - observed_child_since_monotonic_ms )) -ge "$startup_window_ms" ]; then
+      echo "$context probable-ready: ok svc=$svc startup_window_seconds=$startup_window_seconds supervisor_pid=$root_pid child_pid=$observed_child_pid"
+      return 0
+    fi
+
+    if [ "$now_monotonic_ms" -ge "$deadline_monotonic_ms" ]; then
       if [ -z "$observed_child_pid" ]; then
-        echo "$context probable-ready: no child pid observed svc=$svc supervisor_pid=$root_pid startup_window_seconds=$startup_window_seconds"
+        echo "$context probable-ready: no child pid observed svc=$svc supervisor_pid=$root_pid startup_window_seconds=$startup_window_seconds startup_deadline_seconds=$startup_deadline_seconds"
         return 1
       fi
-      echo "$context probable-ready: ok svc=$svc startup_window_seconds=$startup_window_seconds supervisor_pid=$root_pid child_pid=$observed_child_pid"
-      return 0
+      echo "$context probable-ready: child pid not stable long enough svc=$svc supervisor_pid=$root_pid child_pid=$observed_child_pid observed_for_ms=$(( now_monotonic_ms - observed_child_since_monotonic_ms )) startup_window_seconds=$startup_window_seconds startup_deadline_seconds=$startup_deadline_seconds"
+      return 1
     fi
 
     sleep 0.2
diff --git a/examples/fluxon_quick_start/start.py b/examples/fluxon_quick_start/start.py
index c051598..472f45c 100644
--- a/examples/fluxon_quick_start/start.py
+++ b/examples/fluxon_quick_start/start.py
@@ -530,8 +530,7 @@ def _monitoring_block(greptime_http_port: int) -> Dict[str, Any]:
 
 def _owner_large_file_paths(workdir: Path) -> Dict[str, str]:
     return {
-        "log_root_path": str(workdir / "large" / "log" / "owner"),
-        "cache_root_path": str(workdir / "large" / "cache" / "owner"),
+        "root_paths": [str(workdir / "large" / "owner")],
     }
 
 
diff --git a/examples/start_kv_and_fs_svc.py b/examples/start_kv_and_fs_svc.py
index db7e4f6..b79043c 100644
--- a/examples/start_kv_and_fs_svc.py
+++ b/examples/start_kv_and_fs_svc.py
@@ -38,6 +38,12 @@
 FS_MASTER_ACCESS_DB_PATH = (WORKDIR / "fs_master" / "access.db").resolve()
 
 
+def build_owner_large_file_paths() -> dict:
+    return {
+        "root_paths": [str((WORKDIR / "large" / "owner").resolve())],
+    }
+
+
 def main() -> None:
     args = parse_args()
     WORKDIR.mkdir(parents=True, exist_ok=True)
@@ -198,6 +204,7 @@ def build_owner_config() -> dict:
             "shared_memory_path": str(SHARED_MEMORY_PATH),
             "shared_file_path": str(SHARED_FILE_PATH),
             "sub_cluster": "default",
+            "large_file_paths": build_owner_large_file_paths(),
         },
     }
 
diff --git a/examples/start_master_owner.py b/examples/start_master_owner.py
index 964cf87..fbfb600 100644
--- a/examples/start_master_owner.py
+++ b/examples/start_master_owner.py
@@ -23,6 +23,12 @@
 OWNER_DRAM_BYTES = 1073741824
 
 
+def build_owner_large_file_paths() -> dict:
+    return {
+        "root_paths": [str((WORKDIR / "large" / "owner").resolve())],
+    }
+
+
 def main() -> None:
     args = parse_args()
     SHARED_FILE_PATH.mkdir(parents=True, exist_ok=True)
@@ -127,6 +133,7 @@ def build_owner_config() -> dict:
             "shared_memory_path": str(SHARED_MEMORY_PATH),
             "shared_file_path": str(SHARED_FILE_PATH),
             "sub_cluster": "default",
+            "large_file_paths": build_owner_large_file_paths(),
         },
     }
 
diff --git "a/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md" "b/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
index 4f9f65e..7f273a1 100644
--- "a/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
+++ "b/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
@@ -282,10 +282,11 @@ fluxonkv_spec:
   # owner 必须声明自己属于哪个 sub-cluster
   sub_cluster: default
 
-  # owner 必须声明大文件根目录；日志和 cache 都从这里派生
+  # owner 必须声明大文件根目录列表；运行时按数组顺序选择第一个可用 root，
+  # 日志和 cache 等子目录都从固定相对位置派生
   large_file_paths:
-    log_root_path: /var/lib/fluxon/log
-    cache_root_path: /var/lib/fluxon/cache
+    root_paths:
+      - /var/lib/fluxon/large
 
   # 可选
   p2p_listen_port: 31001
diff --git "a/fluxon_doc_cn/design/teststack_1_\345\275\223\345\211\215\346\236\266\346\236\204\344\270\216CI\346\265\213\350\257\225\346\265\201\347\250\213.md" "b/fluxon_doc_cn/design/teststack_1_\345\275\223\345\211\215\346\236\266\346\236\204\344\270\216CI\346\265\213\350\257\225\346\265\201\347\250\213.md"
index 80a8184..ca85ac6 100644
--- "a/fluxon_doc_cn/design/teststack_1_\345\275\223\345\211\215\346\236\266\346\236\204\344\270\216CI\346\265\213\350\257\225\346\265\201\347\250\213.md"
+++ "b/fluxon_doc_cn/design/teststack_1_\345\275\223\345\211\215\346\236\266\346\236\204\344\270\216CI\346\265\213\350\257\225\346\265\201\347\250\213.md"
@@ -382,7 +382,7 @@ deploy.instances 不写死在 suite 中。Runner 会结合 scale、profile 和
 
 **稳定结论：**
 
-- owner 模式配置一律必须显式提供 `fluxonkv_spec.large_file_paths.log_root_path` 和 `cache_root_path`。
+- owner 模式配置一律必须显式提供 `fluxonkv_spec.large_file_paths.root_paths`，并按数组顺序表达大文件根目录优先级。
 - `fluxonkv_spec.p2p_listen_port` 不是 owner 模式的必填项；是否显式写入，取决于具体分支的运行契约。
 - 不要把 `TEST_STACK` case-local owner 的显式端口分配规则，复制到 shared testbed / CI owner 配置上。
 
diff --git "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 2 - \346\234\215\345\212\241\345\271\263\351\235\242.md" "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 2 - \346\234\215\345\212\241\345\271\263\351\235\242.md"
index 123c31f..d31ba03 100644
--- "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 2 - \346\234\215\345\212\241\345\271\263\351\235\242.md"	
+++ "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 2 - \346\234\215\345\212\241\345\271\263\351\235\242.md"	
@@ -312,6 +312,9 @@ def build_owner_config() -> dict:
             "shared_memory_path": str(SHARED_MEMORY_PATH),
             "shared_file_path": str(SHARED_FILE_PATH),
             "sub_cluster": "default",
+            "large_file_paths": {
+                "root_paths": [str((WORKDIR / "large" / "owner").resolve())],
+            },
         },
     }
 
diff --git "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 3 - KV-RPC\346\216\245\345\217\243.md" "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 3 - KV-RPC\346\216\245\345\217\243.md"
index 6494221..97affbf 100644
--- "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 3 - KV-RPC\346\216\245\345\217\243.md"	
+++ "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 3 - KV-RPC\346\216\245\345\217\243.md"	
@@ -173,6 +173,9 @@ def build_owner_config() -> dict:
             "shared_memory_path": str(SHARED_MEMORY_PATH),
             "shared_file_path": str(SHARED_FILE_PATH),
             "sub_cluster": "default",
+            "large_file_paths": {
+                "root_paths": [str((WORKDIR / "large" / "owner").resolve())],
+            },
         },
     }
 
diff --git "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 4 - MQ\346\216\245\345\217\243.md" "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 4 - MQ\346\216\245\345\217\243.md"
index 89744a2..8805da8 100644
--- "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 4 - MQ\346\216\245\345\217\243.md"	
+++ "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 4 - MQ\346\216\245\345\217\243.md"	
@@ -199,6 +199,9 @@ def build_owner_config() -> dict:
             "shared_memory_path": str(SHARED_MEMORY_PATH),
             "shared_file_path": str(SHARED_FILE_PATH),
             "sub_cluster": "default",
+            "large_file_paths": {
+                "root_paths": [str((WORKDIR / "large" / "owner").resolve())],
+            },
         },
     }
 
diff --git "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 5 - FS\346\216\245\345\217\243.md" "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 5 - FS\346\216\245\345\217\243.md"
index 68ec80b..f06fe44 100644
--- "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 5 - FS\346\216\245\345\217\243.md"	
+++ "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 5 - FS\346\216\245\345\217\243.md"	
@@ -286,6 +286,9 @@ def build_owner_config() -> dict:
             "shared_memory_path": str(SHARED_MEMORY_PATH),
             "shared_file_path": str(SHARED_FILE_PATH),
             "sub_cluster": "default",
+            "large_file_paths": {
+                "root_paths": [str((WORKDIR / "large" / "owner").resolve())],
+            },
         },
     }
 
diff --git a/fluxon_doc_en/user_doc/User - 3 - KV and RPC Interface.md b/fluxon_doc_en/user_doc/User - 3 - KV and RPC Interface.md
index 820a3a9..d466820 100644
--- a/fluxon_doc_en/user_doc/User - 3 - KV and RPC Interface.md	
+++ b/fluxon_doc_en/user_doc/User - 3 - KV and RPC Interface.md	
@@ -148,6 +148,9 @@ def build_owner_config() -> dict:
             "shared_memory_path": str(SHARED_MEMORY_PATH),
             "shared_file_path": str(SHARED_FILE_PATH),
             "sub_cluster": "default",
+            "large_file_paths": {
+                "root_paths": [str((WORKDIR / "large" / "owner").resolve())],
+            },
         },
     }
 
diff --git a/fluxon_py/config.py b/fluxon_py/config.py
index b50caad..a59a9b1 100644
--- a/fluxon_py/config.py
+++ b/fluxon_py/config.py
@@ -110,9 +110,8 @@ def _yaml_template():
   cluster_name:                       # Cluster name (str)
   shared_memory_path:                 # Shared memory path (str)
   shared_file_path:                   # Shared file path for shared.json/logs/profiles (str)
-  large_file_paths:                   # Owner-mode large file roots (dict(optional))
-    log_root_path:                    # Log root path for owner/client large-file outputs (str)
-    cache_root_path:                  # Cache root path for owner/client large-file outputs (str)
+  large_file_paths:                   # Owner-mode ordered large-file roots (dict(optional))
+    root_paths:                       # Ordered root directories; runtime uses the first usable root and derives fixed relative subdirectories under it (['{str}'])
   p2p_listen_port:                    # P2P QUIC listen port override (int(optional))
   redis_compat:                       # Enable Redis protocol shim (dict(optional))
     listen_addr:                      # TCP listen addr, e.g. "127.0.0.1:16379" (str)
@@ -298,6 +297,122 @@ def _normalize_test_spec_config(raw: Any, ctx: str) -> Dict[str, Any]:
     return out
 
 
+def _is_zero_contribution_fluxonkv_config(cfg: Dict[str, Any]) -> bool:
+    """
+    Determine whether one Fluxon KV config uses zero-contribution mode.
+
+    Contract:
+    - Missing contribute_to_cluster_pool_size means zero-contribution.
+    - Explicit dram=0 with all vram entries=0 also means zero-contribution.
+    - Partial-zero configurations are rejected to keep the role contract explicit.
+    """
+    contrib_present = "contribute_to_cluster_pool_size" in cfg
+    contrib = cfg.get("contribute_to_cluster_pool_size")
+    if not contrib_present or contrib is None:
+        return True
+    if not isinstance(contrib, dict):
+        raise ValueError("contribute_to_cluster_pool_size must be a mapping when provided")
+
+    dram = int(contrib["dram"])
+    vram_raw = contrib.get("vram")
+    # Missing vram is normalized to "no GPU contribution".
+    if vram_raw is None:
+        vram: Dict[str, Any] = {}
+    elif not isinstance(vram_raw, dict):
+        raise ValueError("contribute_to_cluster_pool_size.vram must be a mapping")
+    else:
+        vram = vram_raw
+
+    vram_is_zero = True
+    for _, value in vram.items():
+        if int(value) != 0:
+            vram_is_zero = False
+            break
+    if dram == 0 and not vram_is_zero:
+        raise ValueError(
+            "contribute_to_cluster_pool_size is partially zero: dram=0 but vram has non-zero values"
+        )
+    return dram == 0 and vram_is_zero
+
+
+def _validate_fluxonkv_contract(cfg: Dict[str, Any]) -> None:
+    """
+    Validate the shared Fluxon KV contract and then apply role-specific checks.
+
+    The contract must stay canonical across Python construction, YAML export, and
+    the Rust bridge, so owner/external differences live inside this one path.
+    """
+    if "fluxonkv_spec" not in cfg:
+        return
+
+    spec = cfg.get("fluxonkv_spec")
+    if not isinstance(spec, dict):
+        raise ValueError("fluxonkv_spec must be a mapping")
+
+    is_zero_contribution = _is_zero_contribution_fluxonkv_config(cfg)
+
+    shared_memory_path = spec.get("shared_memory_path")
+    if not isinstance(shared_memory_path, str) or not shared_memory_path.strip():
+        raise ValueError("fluxonkv_spec.shared_memory_path must be a non-empty string")
+    shared_file_path = spec.get("shared_file_path")
+    if not isinstance(shared_file_path, str) or not shared_file_path.strip():
+        raise ValueError("fluxonkv_spec.shared_file_path must be a non-empty string")
+
+    if "rdma_device_names" in cfg:
+        raise ValueError("rdma_device_names has been removed from Fluxon KV config")
+
+    if "transfer_engine" in spec:
+        raise ValueError("fluxonkv_spec.transfer_engine has been removed from Fluxon KV config")
+
+    if is_zero_contribution:
+        forbidden_spec_keys = [
+            "etcd_addresses",
+            "redis_compat",
+            "sub_cluster",
+            "large_file_paths",
+        ]
+        for key in forbidden_spec_keys:
+            if key in spec:
+                raise ValueError(f"fluxonkv_spec.{key} is forbidden in zero-contribution mode")
+        return
+
+    contrib = cfg.get("contribute_to_cluster_pool_size")
+    if not isinstance(contrib, dict):
+        raise ValueError(
+            "contribute_to_cluster_pool_size is required for owner mode (non-zero contribution)"
+        )
+    if int(contrib["dram"]) == 0:
+        raise ValueError("owner mode requires non-zero contribute_to_cluster_pool_size.dram")
+
+    if "etcd_addresses" not in spec:
+        raise ValueError("fluxonkv_spec.etcd_addresses is required for owner mode")
+    etcd_addresses = spec.get("etcd_addresses")
+    if not isinstance(etcd_addresses, list) or len(etcd_addresses) == 0:
+        raise ValueError("fluxonkv_spec.etcd_addresses must be a non-empty list")
+
+    if "sub_cluster" not in spec:
+        raise ValueError("fluxonkv_spec.sub_cluster is required for owner mode")
+    sub_cluster = spec.get("sub_cluster")
+    if not isinstance(sub_cluster, str) or not sub_cluster.strip():
+        raise ValueError("fluxonkv_spec.sub_cluster must be a non-empty string in owner mode")
+    if sub_cluster != sub_cluster.strip():
+        raise ValueError("fluxonkv_spec.sub_cluster must not have leading/trailing whitespace")
+
+    if "large_file_paths" not in spec:
+        raise ValueError("fluxonkv_spec.large_file_paths is required for owner mode")
+    large_file_paths = spec.get("large_file_paths")
+    if not isinstance(large_file_paths, dict):
+        raise ValueError("fluxonkv_spec.large_file_paths must be a mapping in owner mode")
+    root_paths = large_file_paths.get("root_paths")
+    if not isinstance(root_paths, list) or len(root_paths) == 0:
+        raise ValueError("fluxonkv_spec.large_file_paths.root_paths must be a non-empty list in owner mode")
+    for idx, field_value in enumerate(root_paths):
+        if not isinstance(field_value, str) or not field_value.strip():
+            raise ValueError(
+                f"fluxonkv_spec.large_file_paths.root_paths[{idx}] must be a non-empty string in owner mode"
+            )
+
+
 class FluxonKvClientConfig():
     """Configuration class for KV Cache stores that reads from YAML config files."""
 
@@ -337,80 +452,8 @@ def __init__(self, config_dict: Dict[str, Any]):
                 raise ValueError("pprof_duration_seconds must be > 0")
             plain["pprof_duration_seconds"] = pprof_duration_seconds
 
-        # FluxonKV role selection contract:
-        # - Missing contribute_to_cluster_pool_size means "zero-contribution" mode.
-        # - Explicit contribute_to_cluster_pool_size with all zeros also means "zero-contribution" mode.
-        # - Any partial-zero contribution is rejected to avoid ambiguous behavior.
         if "fluxonkv_spec" in plain:
-            spec = plain.get("fluxonkv_spec")
-            if not isinstance(spec, dict):
-                raise ValueError("fluxonkv_spec must be a mapping")
-
-            contrib_present = "contribute_to_cluster_pool_size" in plain
-            contrib = plain.get("contribute_to_cluster_pool_size")
-
-            is_zero_contribution = False
-            if not contrib_present or contrib is None:
-                is_zero_contribution = True
-            elif isinstance(contrib, dict):
-                dram = int(contrib["dram"])
-                vram_raw = contrib.get("vram")
-                # English note:
-                # - Owner-mode often contributes DRAM only; forcing `vram: {}` everywhere is noise.
-                # - Missing vram means "no GPU contribution", which is equivalent to an empty dict.
-                # - This is a schema normalization rule (not a fallback): if callers want VRAM, they
-                #   must provide an explicit mapping with non-zero values.
-                if vram_raw is None:
-                    vram: Dict[str, Any] = {}
-                elif not isinstance(vram_raw, dict):
-                    raise ValueError("contribute_to_cluster_pool_size.vram must be a mapping")
-                else:
-                    vram = vram_raw
-                vram_is_zero = True
-                for _, v in vram.items():
-                    if int(v) != 0:
-                        vram_is_zero = False
-                        break
-                if dram == 0 and not vram_is_zero:
-                    raise ValueError(
-                        "contribute_to_cluster_pool_size is partially zero: dram=0 but vram has non-zero values"
-                    )
-                is_zero_contribution = dram == 0 and vram_is_zero
-            else:
-                raise ValueError("contribute_to_cluster_pool_size must be a mapping when provided")
-
-            if is_zero_contribution:
-                forbidden_spec_keys = [
-                    "etcd_addresses",
-                    "redis_compat",
-                    "sub_cluster",
-                ]
-                for k in forbidden_spec_keys:
-                    if k in spec:
-                        raise ValueError(f"fluxonkv_spec.{k} is forbidden in zero-contribution mode")
-            else:
-                if not contrib_present or not isinstance(contrib, dict):
-                    raise ValueError(
-                        "contribute_to_cluster_pool_size is required for owner mode (non-zero contribution)"
-                    )
-                if int(contrib["dram"]) == 0:
-                    raise ValueError("owner mode requires non-zero contribute_to_cluster_pool_size.dram")
-                if "etcd_addresses" not in spec:
-                    raise ValueError("fluxonkv_spec.etcd_addresses is required for owner mode")
-                etcd_addresses = spec.get("etcd_addresses")
-                if not isinstance(etcd_addresses, list) or len(etcd_addresses) == 0:
-                    raise ValueError("fluxonkv_spec.etcd_addresses must be a non-empty list")
-                if "sub_cluster" not in spec:
-                    raise ValueError("fluxonkv_spec.sub_cluster is required for owner mode")
-                sub_cluster = spec.get("sub_cluster")
-                if not isinstance(sub_cluster, str) or not sub_cluster.strip():
-                    raise ValueError(
-                        "fluxonkv_spec.sub_cluster must be a non-empty string in owner mode"
-                    )
-                if sub_cluster != sub_cluster.strip():
-                    raise ValueError(
-                        "fluxonkv_spec.sub_cluster must not have leading/trailing whitespace"
-                    )
+            _validate_fluxonkv_contract(plain)
 
         self.config_dict = plain
 
@@ -521,7 +564,9 @@ def __str__(self):
 
     def to_yaml_str(self) -> str:
         """Serialize the config dict into a YAML document string."""
-        return yaml.safe_dump(self.config_dict, sort_keys=False)
+        cfg = self.to_dict()
+        _validate_fluxonkv_contract(cfg)
+        return yaml.safe_dump(cfg, sort_keys=False)
 
     def to_fluxon_kv_client_config_yaml_str(self) -> str:
         """Build the YAML string expected by the Rust `ClientConfigYaml` schema."""
@@ -534,75 +579,7 @@ def to_fluxon_kv_client_config_yaml_str(self) -> str:
         spec = cfg.get("fluxonkv_spec")
         if not isinstance(spec, dict):
             raise ValueError("fluxonkv_spec is required for Fluxon KV client")
-
-        contrib_present = "contribute_to_cluster_pool_size" in cfg
-        contrib = cfg.get("contribute_to_cluster_pool_size")
-        is_zero_contribution = False
-        if not contrib_present or contrib is None:
-            is_zero_contribution = True
-        elif isinstance(contrib, dict):
-            dram = int(contrib["dram"])
-            vram_raw = contrib.get("vram")
-            if vram_raw is None:
-                vram = {}
-            elif not isinstance(vram_raw, dict):
-                raise ValueError("contribute_to_cluster_pool_size.vram must be a mapping")
-            else:
-                vram = vram_raw
-            vram_is_zero = True
-            for _, v in vram.items():
-                if int(v) != 0:
-                    vram_is_zero = False
-                    break
-            if dram == 0 and not vram_is_zero:
-                raise ValueError(
-                    "contribute_to_cluster_pool_size is partially zero: dram=0 but vram has non-zero values"
-                )
-            is_zero_contribution = dram == 0 and vram_is_zero
-        else:
-            raise ValueError("contribute_to_cluster_pool_size must be a mapping when provided")
-
-        shared_memory_path = spec.get("shared_memory_path")
-        if not isinstance(shared_memory_path, str) or not shared_memory_path.strip():
-            raise ValueError("fluxonkv_spec.shared_memory_path must be a non-empty string")
-        shared_file_path = spec.get("shared_file_path")
-        if not isinstance(shared_file_path, str) or not shared_file_path.strip():
-            raise ValueError("fluxonkv_spec.shared_file_path must be a non-empty string")
-
-        if "rdma_device_names" in cfg:
-            raise ValueError("rdma_device_names has been removed from Fluxon KV config")
-
-        if "transfer_engine" in spec:
-            raise ValueError("fluxonkv_spec.transfer_engine has been removed from Fluxon KV config")
-
-        if is_zero_contribution:
-            forbidden_spec_keys = [
-                "etcd_addresses",
-                "redis_compat",
-                "sub_cluster",
-            ]
-            for k in forbidden_spec_keys:
-                if k in spec:
-                    raise ValueError(f"fluxonkv_spec.{k} is forbidden in zero-contribution mode")
-
-            return yaml.safe_dump(cfg, sort_keys=False)
-
-        # Owner mode must always declare large-file roots for logs and caches.
-        # p2p_listen_port remains optional here: deterministic case-local
-        # topologies may pin it, while shared testbed flows can leave it unset
-        # and let runtime choose an available port.
-        if "large_file_paths" not in spec:
-            raise ValueError("fluxonkv_spec.large_file_paths is required for owner mode")
-        large_file_paths = spec.get("large_file_paths")
-        if not isinstance(large_file_paths, dict):
-            raise ValueError("fluxonkv_spec.large_file_paths must be a mapping in owner mode")
-        for field_name in ("log_root_path", "cache_root_path"):
-            field_value = large_file_paths.get(field_name)
-            if not isinstance(field_value, str) or not field_value.strip():
-                raise ValueError(
-                    f"fluxonkv_spec.large_file_paths.{field_name} must be a non-empty string in owner mode"
-                )
-
+        _validate_fluxonkv_contract(cfg)
         return yaml.safe_dump(cfg, sort_keys=False)
     
 
diff --git a/fluxon_py/tests/fluxon_fs_transfer_tikv_support.py b/fluxon_py/tests/fluxon_fs_transfer_tikv_support.py
index 38d98c4..1bad008 100644
--- a/fluxon_py/tests/fluxon_fs_transfer_tikv_support.py
+++ b/fluxon_py/tests/fluxon_fs_transfer_tikv_support.py
@@ -1598,6 +1598,9 @@ def _owner_kvclient_config(self) -> dict[str, Any]:
                 "shared_memory_path": str(self._shared_memory_root),
                 "shared_file_path": str(self._shared_file_root),
                 "sub_cluster": "transfer_owner",
+                "large_file_paths": {
+                    "root_paths": [str(self._work_root / "large" / "owner")],
+                },
             },
             "test_spec_config": {
                 "disable_observability": True,
diff --git a/fluxon_py/tests/test_backend_relay_deployconf.template.yaml b/fluxon_py/tests/test_backend_relay_deployconf.template.yaml
index 90ea518..52296a1 100644
--- a/fluxon_py/tests/test_backend_relay_deployconf.template.yaml
+++ b/fluxon_py/tests/test_backend_relay_deployconf.template.yaml
@@ -86,7 +86,10 @@ service:
             - "__ETCD_CONTAINER_NAME__:2379"
           cluster_name: "__CLUSTER_NAME__"
           shared_memory_path: "__OWNER1_SHM__"
+          shared_file_path: "__OWNER1_SHARED_FILE__"
           sub_cluster: "owner1"
+          large_file_paths:
+            root_paths: ["__OWNER1_LARGE_ROOT__"]
           p2p_listen_port: 31011
       YAML
       exec python3 -m fluxon_py.runtime.start_owner_kvclient -c all_config.yaml -w "__RUNTIME_ROOT__/work/owner1"
@@ -115,7 +118,10 @@ service:
             - "__ETCD_CONTAINER_NAME__:2379"
           cluster_name: "__CLUSTER_NAME__"
           shared_memory_path: "__OWNER2_SHM__"
+          shared_file_path: "__OWNER2_SHARED_FILE__"
           sub_cluster: "owner2"
+          large_file_paths:
+            root_paths: ["__OWNER2_LARGE_ROOT__"]
           p2p_listen_port: 31012
       YAML
       exec python3 -m fluxon_py.runtime.start_owner_kvclient -c all_config.yaml -w "__RUNTIME_ROOT__/work/owner2"
@@ -144,7 +150,10 @@ service:
             - "__ETCD_CONTAINER_NAME__:2379"
           cluster_name: "__CLUSTER_NAME__"
           shared_memory_path: "__OWNER3_SHM__"
+          shared_file_path: "__OWNER3_SHARED_FILE__"
           sub_cluster: "owner3"
+          large_file_paths:
+            root_paths: ["__OWNER3_LARGE_ROOT__"]
           p2p_listen_port: 31013
       YAML
       exec python3 -m fluxon_py.runtime.start_owner_kvclient -c all_config.yaml -w "__RUNTIME_ROOT__/work/owner3"
@@ -173,7 +182,10 @@ service:
             - "__ETCD_CONTAINER_NAME__:2379"
           cluster_name: "__CLUSTER_NAME__"
           shared_memory_path: "__OWNER4_SHM__"
+          shared_file_path: "__OWNER4_SHARED_FILE__"
           sub_cluster: "owner4"
+          large_file_paths:
+            root_paths: ["__OWNER4_LARGE_ROOT__"]
           p2p_listen_port: 31014
       YAML
       exec python3 -m fluxon_py.runtime.start_owner_kvclient -c all_config.yaml -w "__RUNTIME_ROOT__/work/owner4"
diff --git a/fluxon_py/tests/test_backend_relay_docker.py b/fluxon_py/tests/test_backend_relay_docker.py
index 20b970d..1699b0c 100644
--- a/fluxon_py/tests/test_backend_relay_docker.py
+++ b/fluxon_py/tests/test_backend_relay_docker.py
@@ -42,31 +42,36 @@ def main() -> None:
             raise RuntimeError("mode is required")
         mode = sys.argv[1]
         if mode == "wait-store":
-            if len(sys.argv) != 5:
-                raise RuntimeError("wait-store requires: cluster_name shared_memory_path timeout_seconds")
-            _wait_store(sys.argv[2], sys.argv[3], float(sys.argv[4]))
+            if len(sys.argv) != 6:
+                raise RuntimeError("wait-store requires: cluster_name shared_memory_path shared_file_path timeout_seconds")
+            _wait_store(sys.argv[2], sys.argv[3], sys.argv[4], float(sys.argv[5]))
             print("wait-store ok")
             return
         if mode == "put":
-            if len(sys.argv) != 6:
-                raise RuntimeError("put requires: cluster_name shared_memory_path key payload_base64")
-            _put(sys.argv[2], sys.argv[3], sys.argv[4], sys.argv[5])
+            if len(sys.argv) != 7:
+                raise RuntimeError("put requires: cluster_name shared_memory_path shared_file_path key payload_base64")
+            _put(sys.argv[2], sys.argv[3], sys.argv[4], sys.argv[5], sys.argv[6])
             print("put ok")
             return
         if mode == "get":
-            if len(sys.argv) != 7:
-                raise RuntimeError("get requires: cluster_name shared_memory_path key expected_base64 timeout_seconds")
-            _get(sys.argv[2], sys.argv[3], sys.argv[4], sys.argv[5], float(sys.argv[6]))
+            if len(sys.argv) != 8:
+                raise RuntimeError("get requires: cluster_name shared_memory_path shared_file_path key expected_base64 timeout_seconds")
+            _get(sys.argv[2], sys.argv[3], sys.argv[4], sys.argv[5], sys.argv[6], float(sys.argv[7]))
             print("get ok")
             return
         raise RuntimeError(f"unknown mode: {mode}")
 
 
-    def _wait_store(cluster_name: str, shared_memory_path: str, timeout_seconds: float) -> None:
+    def _wait_store(
+        cluster_name: str,
+        shared_memory_path: str,
+        shared_file_path: str,
+        timeout_seconds: float,
+    ) -> None:
         deadline = time.time() + timeout_seconds
         last_error = ""
         while time.time() < deadline:
-            result = new_store(_new_config(cluster_name, shared_memory_path))
+            result = new_store(_new_config(cluster_name, shared_memory_path, shared_file_path))
             if result.is_ok():
                 store = result.unwrap()
                 _close_store(store)
@@ -76,9 +81,15 @@ def _wait_store(cluster_name: str, shared_memory_path: str, timeout_seconds: flo
         raise RuntimeError(f"wait-store timed out: {last_error}")
 
 
-    def _put(cluster_name: str, shared_memory_path: str, key: str, payload_base64: str) -> None:
+    def _put(
+        cluster_name: str,
+        shared_memory_path: str,
+        shared_file_path: str,
+        key: str,
+        payload_base64: str,
+    ) -> None:
         payload = base64.b64decode(payload_base64.encode("ascii"))
-        store = _open_store(cluster_name, shared_memory_path)
+        store = _open_store(cluster_name, shared_memory_path, shared_file_path)
         try:
             put_result = store.put(key, {"payload": payload})
             if not put_result.is_ok():
@@ -94,13 +105,14 @@ def _put(cluster_name: str, shared_memory_path: str, key: str, payload_base64: s
     def _get(
         cluster_name: str,
         shared_memory_path: str,
+        shared_file_path: str,
         key: str,
         expected_base64: str,
         timeout_seconds: float,
     ) -> None:
         expected = base64.b64decode(expected_base64.encode("ascii"))
         deadline = time.time() + timeout_seconds
-        store = _open_store(cluster_name, shared_memory_path)
+        store = _open_store(cluster_name, shared_memory_path, shared_file_path)
         try:
             last_error = ""
             while time.time() < deadline:
@@ -125,7 +137,11 @@ def _get(
             _close_store(store)
 
 
-    def _new_config(cluster_name: str, shared_memory_path: str) -> FluxonKvClientConfig:
+    def _new_config(
+        cluster_name: str,
+        shared_memory_path: str,
+        shared_file_path: str,
+    ) -> FluxonKvClientConfig:
         return FluxonKvClientConfig(
             {
                 "instance_key": f"relay_helper_{os.getpid()}_{int(time.time() * 1000)}",
@@ -133,13 +149,14 @@ def _new_config(cluster_name: str, shared_memory_path: str) -> FluxonKvClientCon
                 "fluxonkv_spec": {
                     "cluster_name": cluster_name,
                     "shared_memory_path": shared_memory_path,
+                    "shared_file_path": shared_file_path,
                 },
             }
         )
 
 
-    def _open_store(cluster_name: str, shared_memory_path: str):
-        result = new_store(_new_config(cluster_name, shared_memory_path))
+    def _open_store(cluster_name: str, shared_memory_path: str, shared_file_path: str):
+        result = new_store(_new_config(cluster_name, shared_memory_path, shared_file_path))
         if not result.is_ok():
             raise RuntimeError(f"new_store failed: {result.unwrap_error()}")
         return result.unwrap()
@@ -290,6 +307,7 @@ def _relay_wait_for_store(
     helper_path: str,
     cluster_name: str,
     shared_memory_path: str,
+    shared_file_path: str,
 ) -> None:
     _relay_run(
         [
@@ -301,6 +319,7 @@ def _relay_wait_for_store(
             "wait-store",
             cluster_name,
             shared_memory_path,
+            shared_file_path,
             str(RELAY_DOCKER_WAIT_TIMEOUT_SECONDS),
         ],
         timeout_seconds=RELAY_DOCKER_WAIT_TIMEOUT_SECONDS + 30,
@@ -423,6 +442,14 @@ def test_relay_docker_connectivity() -> int:
             owner_name: f"{container_runtime_root}/shm/{owner_name}"
             for owner_name in ("owner1", "owner2", "owner3", "owner4")
         }
+        owner_shared_file_paths = {
+            owner_name: f"{container_runtime_root}/sharefile/{owner_name}"
+            for owner_name in ("owner1", "owner2", "owner3", "owner4")
+        }
+        owner_large_root_paths = {
+            owner_name: f"{container_runtime_root}/large/{owner_name}"
+            for owner_name in ("owner1", "owner2", "owner3", "owner4")
+        }
         _relay_render_template(
             deployconf_template_path,
             rendered_deployconf_path,
@@ -448,6 +475,14 @@ def test_relay_docker_connectivity() -> int:
                 "__OWNER2_SHM__": owner_shm_paths["owner2"],
                 "__OWNER3_SHM__": owner_shm_paths["owner3"],
                 "__OWNER4_SHM__": owner_shm_paths["owner4"],
+                "__OWNER1_SHARED_FILE__": owner_shared_file_paths["owner1"],
+                "__OWNER2_SHARED_FILE__": owner_shared_file_paths["owner2"],
+                "__OWNER3_SHARED_FILE__": owner_shared_file_paths["owner3"],
+                "__OWNER4_SHARED_FILE__": owner_shared_file_paths["owner4"],
+                "__OWNER1_LARGE_ROOT__": owner_large_root_paths["owner1"],
+                "__OWNER2_LARGE_ROOT__": owner_large_root_paths["owner2"],
+                "__OWNER3_LARGE_ROOT__": owner_large_root_paths["owner3"],
+                "__OWNER4_LARGE_ROOT__": owner_large_root_paths["owner4"],
             },
         )
 
@@ -488,12 +523,14 @@ def test_relay_docker_connectivity() -> int:
             helper_path=helper_container_path,
             cluster_name=cluster_name,
             shared_memory_path=owner_shm_paths["owner1"],
+            shared_file_path=owner_shared_file_paths["owner1"],
         )
         _relay_wait_for_store(
             container_name=container_names["owner4"],
             helper_path=helper_container_path,
             cluster_name=cluster_name,
             shared_memory_path=owner_shm_paths["owner4"],
+            shared_file_path=owner_shared_file_paths["owner4"],
         )
 
         key = f"/relay_docker/{run_suffix}/payload"
@@ -509,6 +546,7 @@ def test_relay_docker_connectivity() -> int:
                 "get",
                 cluster_name,
                 owner_shm_paths["owner4"],
+                owner_shared_file_paths["owner4"],
                 key,
                 payload_base64,
                 str(RELAY_DOCKER_GET_TIMEOUT_SECONDS),
@@ -528,6 +566,7 @@ def test_relay_docker_connectivity() -> int:
                 "put",
                 cluster_name,
                 owner_shm_paths["owner1"],
+                owner_shared_file_paths["owner1"],
                 key,
                 payload_base64,
             ],
diff --git a/fluxon_py/tests/test_config.py b/fluxon_py/tests/test_config.py
index 2979d8e..b6ced9e 100644
--- a/fluxon_py/tests/test_config.py
+++ b/fluxon_py/tests/test_config.py
@@ -48,6 +48,7 @@ def _build_checks(selected_test_id: Optional[str]) -> List[Tuple[str, Callable[[
         ("fluxonkv_sub_cluster_config", test_fluxonkv_sub_cluster_config),
         ("fluxonkv_owner_requires_sub_cluster", test_fluxonkv_owner_requires_sub_cluster),
         ("fluxonkv_owner_requires_large_file_paths", test_fluxonkv_owner_requires_large_file_paths),
+        ("fluxonkv_external_forbids_large_file_paths", test_fluxonkv_external_forbids_large_file_paths),
         ("fluxonkv_p2p_relay_removed", test_fluxonkv_p2p_relay_removed),
         ("fluxon_client_config_yaml_shape", test_fluxon_client_config_yaml_shape),
         ("fluxonkv_protocol_field", test_fluxonkv_protocol_field),
@@ -143,21 +144,40 @@ def _import_fluxon_pyo3_tool_without_package_init():
 _PYO3_TOOL = _import_fluxon_pyo3_tool_without_package_init()
 
 
+def _owner_large_file_paths(tag: str) -> dict[str, list[str]]:  # large_file_paths fixture
+    return {
+        "root_paths": [f"/tmp/kvcache_large/{tag}"],  # one root, made distinct per test by `tag`
+    }
+
+
+def _owner_fluxonkv_base_config(
+    *,  # every override below is keyword-only
+    instance_key: str = "test_instance",
+    cluster_name: str = "test_cluster",
+    shared_memory_path: str = "/tmp/kvcache_shared_memory/test",
+    shared_file_path: str = "/tmp/kvcache_shared_files/test",
+    sub_cluster: str = "rack-a",
+    tag: str = "test",  # forwarded to _owner_large_file_paths() to pick the large-file root
+) -> dict:  # raw config dict that the tests hand to FluxonKvClientConfig
+    return {  # built anew on each call, so tests can add or delete keys on the result
+        "instance_key": instance_key,
+        "contribute_to_cluster_pool_size": {"dram": 16777216, "vram": {}},  # non-zero dram; the external-config test uses 0
+        "fluxonkv_spec": {
+            "etcd_addresses": ["localhost:2379"],
+            "cluster_name": cluster_name,
+            "shared_memory_path": shared_memory_path,
+            "shared_file_path": shared_file_path,
+            "sub_cluster": sub_cluster,
+            "large_file_paths": _owner_large_file_paths(tag),
+        },
+    }
+
+
 def test_fluxonkv_sub_cluster_config():
     """Test fluxonkv_spec.sub_cluster is accepted and exposed."""
     try:
         config = FluxonKvClientConfig(
-            {
-                "instance_key": "test_instance",
-                "contribute_to_cluster_pool_size": {"dram": 16777216, "vram": {}},
-                "fluxonkv_spec": {
-                    "etcd_addresses": ["localhost:2379"],
-                    "cluster_name": "test_cluster",
-                    "shared_memory_path": "/tmp/kvcache_shared_memory/test",
-                    "shared_file_path": "/tmp/kvcache_shared_files/test",
-                    "sub_cluster": "producer_side",
-                },
-            }
+            _owner_fluxonkv_base_config(sub_cluster="producer_side", tag="sub_cluster")
         )
         assert config.fluxonkv_spec_sub_cluster == "producer_side"
         print("✅ PASS: test_fluxonkv_sub_cluster_config")
@@ -226,16 +246,8 @@ def test_fluxon_pyo3_import_authority():
 def test_fluxonkv_owner_requires_sub_cluster():
     """Ensure owner mode requires a clean non-empty fluxonkv_spec.sub_cluster."""
     try:
-        base = {
-            "instance_key": "test_instance",
-            "contribute_to_cluster_pool_size": {"dram": 16777216, "vram": {}},
-            "fluxonkv_spec": {
-                "etcd_addresses": ["localhost:2379"],
-                "cluster_name": "test_cluster",
-                "shared_memory_path": "/tmp/kvcache_shared_memory/test",
-                "shared_file_path": "/tmp/kvcache_shared_files/test",
-            },
-        }
+        base = _owner_fluxonkv_base_config(tag="owner_requires_sub_cluster")
+        del base["fluxonkv_spec"]["sub_cluster"]
 
         try:
             FluxonKvClientConfig(copy.deepcopy(base))
@@ -274,20 +286,11 @@ def test_fluxonkv_owner_requires_sub_cluster():
 def test_fluxonkv_owner_requires_large_file_paths():
     """Ensure owner mode requires explicit large_file_paths roots."""
     try:
-        base = {
-            "instance_key": "test_instance",
-            "contribute_to_cluster_pool_size": {"dram": 16777216, "vram": {}},
-            "fluxonkv_spec": {
-                "etcd_addresses": ["localhost:2379"],
-                "cluster_name": "test_cluster",
-                "shared_memory_path": "/tmp/kvcache_shared_memory/test",
-                "shared_file_path": "/tmp/kvcache_shared_files/test",
-                "sub_cluster": "rack-a",
-            },
-        }
+        base = _owner_fluxonkv_base_config(tag="owner_requires_large_file_paths")
+        del base["fluxonkv_spec"]["large_file_paths"]
 
         try:
-            FluxonKvClientConfig(copy.deepcopy(base)).to_fluxon_kv_client_config_yaml_str()
+            FluxonKvClientConfig(copy.deepcopy(base))
             print("❌ FAIL: test_fluxonkv_owner_requires_large_file_paths - missing large_file_paths should be rejected")
             return
         except ValueError:
@@ -295,44 +298,53 @@ def test_fluxonkv_owner_requires_large_file_paths():
 
         invalid_blank = copy.deepcopy(base)
         invalid_blank["fluxonkv_spec"]["large_file_paths"] = {
-            "log_root_path": "   ",
-            "cache_root_path": "/tmp/kvcache_large_cache/test",
+            "root_paths": ["   "],
         }
         try:
-            FluxonKvClientConfig(invalid_blank).to_fluxon_kv_client_config_yaml_str()
-            print("❌ FAIL: test_fluxonkv_owner_requires_large_file_paths - blank log_root_path should be rejected")
+            FluxonKvClientConfig(invalid_blank)
+            print("❌ FAIL: test_fluxonkv_owner_requires_large_file_paths - blank root_paths entry should be rejected")
             return
         except ValueError:
             pass
 
-        valid = copy.deepcopy(base)
-        valid["fluxonkv_spec"]["large_file_paths"] = {
-            "log_root_path": "/tmp/kvcache_large_logs/test",
-            "cache_root_path": "/tmp/kvcache_large_cache/test",
-        }
+        valid = _owner_fluxonkv_base_config(tag="owner_requires_large_file_paths_valid")
         rendered = FluxonKvClientConfig(valid).to_fluxon_kv_client_config_yaml_str()
         assert "large_file_paths:" in rendered
-        assert "log_root_path: /tmp/kvcache_large_logs/test" in rendered
-        assert "cache_root_path: /tmp/kvcache_large_cache/test" in rendered
+        assert "root_paths:" in rendered
+        assert "- /tmp/kvcache_large/owner_requires_large_file_paths_valid" in rendered
         print("✅ PASS: test_fluxonkv_owner_requires_large_file_paths")
     except Exception as e:
         print(f"❌ FAIL: test_fluxonkv_owner_requires_large_file_paths - {e}")
 
 
-def test_fluxonkv_p2p_relay_removed():
-    """Ensure removed fluxonkv_spec.p2p_relay is rejected as an unknown key."""
+def test_fluxonkv_external_forbids_large_file_paths():
+    """Ensure zero-contribution external config cannot declare owner-only large_file_paths."""
     try:
-        base = {
-            "instance_key": "test_instance",
-            "contribute_to_cluster_pool_size": {"dram": 16777216, "vram": {}},
+        external = {
+            "instance_key": "test_external",
+            "contribute_to_cluster_pool_size": {"dram": 0, "vram": {}},  # dram 0: the zero-contribution case from the docstring
             "fluxonkv_spec": {
-                "etcd_addresses": ["localhost:2379"],
                 "cluster_name": "test_cluster",
                 "shared_memory_path": "/tmp/kvcache_shared_memory/test",
                 "shared_file_path": "/tmp/kvcache_shared_files/test",
-                "sub_cluster": "rack-a",
+                "large_file_paths": _owner_large_file_paths("external_forbidden"),  # the key under test
             },
         }
+        try:
+            FluxonKvClientConfig(external)  # construction itself is expected to raise
+            print("❌ FAIL: test_fluxonkv_external_forbids_large_file_paths - external large_file_paths should be rejected")
+            return
+        except ValueError:
+            pass  # ValueError is the expected rejection
+        print("✅ PASS: test_fluxonkv_external_forbids_large_file_paths")
+    except Exception as e:  # any other exception type is reported as a failure
+        print(f"❌ FAIL: test_fluxonkv_external_forbids_large_file_paths - {e}")
+
+
+def test_fluxonkv_p2p_relay_removed():
+    """Ensure removed fluxonkv_spec.p2p_relay is rejected as an unknown key."""
+    try:
+        base = _owner_fluxonkv_base_config(tag="p2p_relay_removed")
 
         _ = FluxonKvClientConfig(copy.deepcopy(base))
 
@@ -353,17 +365,7 @@ def test_fluxonkv_p2p_relay_removed():
 def test_fluxon_client_config_yaml_shape():
     """Test YAML shape required by Rust ClientConfigYaml."""
     try:
-        base = {
-            "instance_key": "test_instance",
-            "contribute_to_cluster_pool_size": {"dram": 16777216, "vram": {}},
-            "fluxonkv_spec": {
-                "etcd_addresses": ["localhost:2379"],
-                "cluster_name": "test_cluster",
-                "shared_memory_path": "/tmp/kvcache_shared_memory/test",
-                "shared_file_path": "/tmp/kvcache_shared_files/test",
-                "sub_cluster": "rack-a",
-            },
-        }
+        base = _owner_fluxonkv_base_config(tag="yaml_shape")
         config = FluxonKvClientConfig(copy.deepcopy(base))
         yaml_text = config.to_fluxon_kv_client_config_yaml_str()
         loaded = yaml.safe_load(yaml_text)
@@ -410,17 +412,7 @@ def test_fluxonkv_protocol_field():
 def test_fluxonkv_runtime_defaults_are_internal():
     """Ensure Fluxon KV runtime defaults stay internal and are not serialized into YAML."""
     try:
-        base = {
-            "instance_key": "test_instance",
-            "contribute_to_cluster_pool_size": {"dram": 16777216, "vram": {}},
-            "fluxonkv_spec": {
-                "etcd_addresses": ["localhost:2379"],
-                "cluster_name": "test_cluster",
-                "shared_memory_path": "/tmp/kvcache_shared_memory/test",
-                "shared_file_path": "/tmp/kvcache_shared_files/test",
-                "sub_cluster": "rack-a",
-            },
-        }
+        base = _owner_fluxonkv_base_config(tag="runtime_defaults")
         config = FluxonKvClientConfig(copy.deepcopy(base))
         assert config.fluxonkv_spec_transfer_engine == "closed"
         assert config.protocol_rdma_device_names is None
@@ -436,17 +428,7 @@ def test_fluxonkv_runtime_defaults_are_internal():
 def test_fluxonkv_removed_rdma_config_keys():
     """Ensure removed Fluxon KV RDMA config keys are rejected."""
     try:
-        base = {
-            "instance_key": "test_instance",
-            "contribute_to_cluster_pool_size": {"dram": 16777216, "vram": {}},
-            "fluxonkv_spec": {
-                "etcd_addresses": ["localhost:2379"],
-                "cluster_name": "test_cluster",
-                "shared_memory_path": "/tmp/kvcache_shared_memory/test",
-                "shared_file_path": "/tmp/kvcache_shared_files/test",
-                "sub_cluster": "rack-a",
-            },
-        }
+        base = _owner_fluxonkv_base_config(tag="removed_rdma_keys")
 
         invalid_rdma = copy.deepcopy(base)
         invalid_rdma["rdma_device_names"] = "mlx5_0:1"
@@ -474,21 +456,11 @@ def test_fluxonkv_removed_rdma_config_keys():
 def test_fluxonkv_test_spec_config():
     """Ensure test_spec_config is accepted, normalized, and serialized."""
     try:
-        base = {
-            "instance_key": "test_instance",
-            "contribute_to_cluster_pool_size": {"dram": 16777216, "vram": {}},
-            "fluxonkv_spec": {
-                "etcd_addresses": ["localhost:2379"],
-                "cluster_name": "test_cluster",
-                "shared_memory_path": "/tmp/kvcache_shared_memory/test",
-                "shared_file_path": "/tmp/kvcache_shared_files/test",
-                "sub_cluster": "rack-a",
-            },
-            "test_spec_config": {
-                "disable_observability": True,
-                "enable_iceoryx_logs": True,
-                "transport_mode": "transfer_only",
-            },
+        base = _owner_fluxonkv_base_config(tag="test_spec_config")
+        base["test_spec_config"] = {
+            "disable_observability": True,
+            "enable_iceoryx_logs": True,
+            "transport_mode": "transfer_only",
         }
 
         try:
diff --git a/fluxon_py/tests/test_mq/test_example_ctrl_c_exit.py b/fluxon_py/tests/test_mq/test_example_ctrl_c_exit.py
index 8e416a2..88c346b 100644
--- a/fluxon_py/tests/test_mq/test_example_ctrl_c_exit.py
+++ b/fluxon_py/tests/test_mq/test_example_ctrl_c_exit.py
@@ -486,6 +486,9 @@ def _build_example_config(
                 "shared_memory_path": shared_memory_path,
                 "shared_file_path": str((Path(shared_memory_path).parent / "sharefile").resolve()),
                 "sub_cluster": "demo",
+                "large_file_paths": {
+                    "root_paths": [str((Path(shared_memory_path).parent / "large" / "owner").resolve())],
+                },
             },
         },
         "kvexternal": {
diff --git a/fluxon_rs/fluxon_fs/src/agent.rs b/fluxon_rs/fluxon_fs/src/agent.rs
index 03a3dd0..a482616 100644
--- a/fluxon_rs/fluxon_fs/src/agent.rs
+++ b/fluxon_rs/fluxon_fs/src/agent.rs
@@ -1412,15 +1412,18 @@ impl FluxonFsAgent {
                 .external_client_api_view()
                 .external_client_api()
                 .inner()
-                .cache_root_path()
+                .large_file_paths()
+                .fs_disk_cache_base_dir()
+                .map_err(|err| format!("invalid external large_file_paths: {}", err))?
         } else {
             self.kv_framework
                 .client_seg_pool_view()
                 .client_seg_pool()
-                .cache_root_path()
-                .to_string()
+                .large_file_paths()
+                .fs_disk_cache_base_dir()
+                .map_err(|err| format!("invalid owner large_file_paths: {}", err))?
         };
-        let cache_root = resolve_disk_cache_root(Path::new(&cache_root_base), &instance_key);
+        let cache_root = resolve_disk_cache_root(cache_root_base.as_path(), &instance_key);
         let cache =
             RemoteDiskCacheManager::new(cache_root.clone(), disk_cache_max_bytes_from_env())
                 .map_err(|err| {
diff --git a/fluxon_rs/fluxon_fs/src/agent_service.rs b/fluxon_rs/fluxon_fs/src/agent_service.rs
index 91315df..395dfbc 100644
--- a/fluxon_rs/fluxon_fs/src/agent_service.rs
+++ b/fluxon_rs/fluxon_fs/src/agent_service.rs
@@ -56,6 +56,8 @@ use crate::write_session_rpc::{
     FsWriteSessionChunkResp, FsWriteSessionDataFrame,
 };
 
+pub(crate) mod transfer_agent;
+
 pub const CHUNK_BYTES: usize = 1024 * 1024;
 pub const READ_CHUNK_BYTES: usize = 8 * 1024 * 1024;
 pub const WRITE_SESSION_CHUNK_BYTES: usize = crate::agent::REMOTE_WRITE_SESSION_CHUNK_BYTES;
@@ -65,6 +67,9 @@ const WRITE_SESSION_MAX_QUEUED_BYTES: usize =
 const WRITE_SESSION_IDLE_TIMEOUT_SECS: u64 = 180;
 const WRITE_SESSION_REAP_INTERVAL_SECS: u64 = 30;
 const WRITE_SESSION_CLOSE_WAIT_TIMEOUT_SECS: u64 = 30;
+pub(crate) const TRANSFER_HEARTBEAT_INTERVAL_MS: i64 = 5_000;
+pub(crate) const TRANSFER_STREAM_RPC_TIMEOUT_MS: u64 = 60_000;
+pub(crate) const TRANSFER_WORKER_COORDINATION_RPC_TIMEOUT_MS: u64 = 30_000;
 const AGENT_EXPORTS_SNAPSHOT_SCHEMA_VERSION_KEY: &str = "schema_version";
 const AGENT_EXPORTS_SNAPSHOT_EXPORTS_JSON_KEY: &str = "exports_json";
 const AGENT_EXPORT_NAME_KEY: &str = "export_name";
@@ -4950,6 +4955,7 @@ mod tests {
         FluxonFsRuntimeAccessModel {
             users: vec![FluxonFsRuntimeAccessUser {
                 username: "alice".to_string(),
+                can_manage_users: false,
                 rpc_token_secret_sha256_hex: hex::encode(sha2::Sha256::digest(b"pw")),
             }],
             scope_access: vec![FluxonFsScopeAccess {
@@ -4965,6 +4971,7 @@ mod tests {
         FluxonFsRuntimeAccessModel {
             users: vec![FluxonFsRuntimeAccessUser {
                 username: "alice".to_string(),
+                can_manage_users: false,
                 rpc_token_secret_sha256_hex: hex::encode(sha2::Sha256::digest(b"pw")),
             }],
             scope_access: vec![FluxonFsScopeAccess {
diff --git a/fluxon_rs/fluxon_fs/src/agent_service/transfer_agent.rs b/fluxon_rs/fluxon_fs/src/agent_service/transfer_agent.rs
index f35d8e8..1738ade 100644
--- a/fluxon_rs/fluxon_fs/src/agent_service/transfer_agent.rs
+++ b/fluxon_rs/fluxon_fs/src/agent_service/transfer_agent.rs
@@ -6024,45 +6024,13 @@ mod tests {
     use std::os::unix::fs::PermissionsExt;
 
     use fluxon_fs_core::config::{
-        FluxonFsExport, FluxonFsExportRoutingMode, FluxonFsExportRpcPaths, FluxonFsGlobalConfig,
-        FluxonFsTransferDispositionWire,
+        FluxonFsExport, FluxonFsGlobalConfig, FluxonFsTransferDispositionWire,
+        agent_registry_export_for_name_and_root_v1,
     };
     use tempfile::TempDir;
 
     fn test_export(root_dir_abs: &str) -> FluxonFsExport {
-        FluxonFsExport {
-            remote_root_dir_abs: root_dir_abs.to_string(),
-            routing_mode: FluxonFsExportRoutingMode::AgentRegistry,
-            nodes: Vec::new(),
-            cache_kv_key_prefix: "/test/cache/".to_string(),
-            cache_bytes_field_key: "bytes".to_string(),
-            cache_max_bytes: 1,
-            rpc_paths: FluxonFsExportRpcPaths {
-                stat: "/stat".to_string(),
-                lstat: "/lstat".to_string(),
-                list_dir: "/list_dir".to_string(),
-                readlink: "/readlink".to_string(),
-                setxattr: "/setxattr".to_string(),
-                getxattr: "/getxattr".to_string(),
-                listxattr: "/listxattr".to_string(),
-                removexattr: "/removexattr".to_string(),
-                read_chunk: "/read_chunk".to_string(),
-                write_chunk: "/write_chunk".to_string(),
-                truncate: "/truncate".to_string(),
-                mkdir: "/mkdir".to_string(),
-                mkfifo: "/mkfifo".to_string(),
-                mknod: "/mknod".to_string(),
-                rmdir: "/rmdir".to_string(),
-                unlink: "/unlink".to_string(),
-                link: "/link".to_string(),
-                symlink: "/symlink".to_string(),
-                rename: "/rename".to_string(),
-                chmod: "/chmod".to_string(),
-                chown: "/chown".to_string(),
-                lchown: "/lchown".to_string(),
-                utime: "/utime".to_string(),
-            },
-        }
+        agent_registry_export_for_name_and_root_v1("src", root_dir_abs) // fixture now built by the fluxon_fs_core::config helper; presumably "src" is the export name (TODO confirm)
     }
 
     fn test_exports_handle(root_dir_abs: &str) -> AgentExportsHandle {
@@ -6071,6 +6039,7 @@ mod tests {
         AgentExportsHandle::new_from_static_cfg(
             &FluxonFsGlobalConfig {
                 stale_window_ms: 1,
+                write_session_target_inflight_bytes: 64 * 1024 * 1024,
                 rules: Vec::new(),
                 exports,
             },
diff --git a/fluxon_rs/fluxon_fs/src/remote_disk_cache.rs b/fluxon_rs/fluxon_fs/src/remote_disk_cache.rs
index 736592a..e45f15e 100644
--- a/fluxon_rs/fluxon_fs/src/remote_disk_cache.rs
+++ b/fluxon_rs/fluxon_fs/src/remote_disk_cache.rs
@@ -389,16 +389,14 @@ pub fn disk_cache_max_bytes_from_env() -> u64 {
         .unwrap_or(REMOTE_DISK_CACHE_MAX_BYTES_DEFAULT)
 }
 
-pub fn resolve_disk_cache_root(shared_file_path: &Path, instance_key: &str) -> PathBuf {
+pub fn resolve_disk_cache_root(cache_root_base: &Path, instance_key: &str) -> PathBuf {
     if let Some(raw) = env::var_os(REMOTE_DISK_CACHE_ROOT_ENV) {
         let trimmed = raw.to_string_lossy().trim().to_string();
         if !trimmed.is_empty() {
             return PathBuf::from(trimmed);
         }
     }
-    shared_file_path
-        .join(REMOTE_DISK_CACHE_DIRNAME)
-        .join(safe_cache_component(instance_key))
+    cache_root_base.join(safe_cache_component(instance_key)) // env override unset or blank: per-instance dir directly under the caller's base; REMOTE_DISK_CACHE_DIRNAME is no longer inserted here
 }
 
 fn write_meta(path: &Path, meta: &RemoteDiskCacheIndexMeta) -> io::Result<()> {
diff --git a/fluxon_rs/fluxon_kv/framework_init_steps.yaml b/fluxon_rs/fluxon_kv/framework_init_steps.yaml
index 95e18b5..923ae30 100644
--- a/fluxon_rs/fluxon_kv/framework_init_steps.yaml
+++ b/fluxon_rs/fluxon_kv/framework_init_steps.yaml
@@ -24,24 +24,24 @@ resources:
     publish_tags: [master, owner, external]
     published_by: ClusterManager.step.1.init2
     doc: |
-      - ClusterManager: member watch 已建立(具备持续观测能力)
-      - 提供: ClusterManager.listen() 可持续消费 ClusterEvent
+      - ClusterManager: member watch is established and continuous observation is available
+      - Provides: `ClusterManager.listen()` can continuously consume `ClusterEvent`
 
   - id: owner_shared_mem_bundle_ready
     tags: [external]
     publish_tags: []
     published_by: ExternalClientApi.step.1.prepare
     doc: |
-      - external: 等 shared.json+mmap.file -> mmap -> 等 owner member 可观测
-      - owner: shared.json 由 owner 的 segment registration 流程写入(不在 init DAG 内显式建模)
+      - external: wait until the owner's `shared.json` is readable and passes metadata validation, wait for `mmap.file`, mmap it, then wait until the owner member is observable
+      - owner: `shared.json` is written by the owner's segment-registration flow and is not modeled explicitly inside the init DAG
 
   - id: prom_remote_write_wait_ready
     tags: [owner, external]
     publish_tags: [master]
     published_by: MetricReporter.step.1.prepare
     doc: |
-      - master: 发布 prom remote_write urls(通过 cluster member state)
-      - owner/external: 等待直到可观测到 master prom remote_write urls(best-effort)
+      - master: publish Prometheus remote_write URLs through cluster member state
+      - owner/external: best-effort wait until the master's Prometheus remote_write URLs become observable
 
 # Init-step DAG source of truth.
 #
@@ -73,9 +73,9 @@ steps:
     mode: Blocking
     deps: []
     doc: |
-      - 构造: ClusterManager(无PostView)
-      - 写 local_state: 保存连接参数/分配本地缓存；若提供 local_ipc_root，则在此处规范化后预填到 self member metadata(不启动任务)
-      - 依赖: 无
+      - Construct `ClusterManager` with no PostView
+      - Write local state: persist connection args and allocate local caches; if `local_ipc_root` is provided, normalize it here and prefill it into self-member metadata without starting tasks
+      - Depends on: none
     exec:
       kind: Construct
       call: "ClusterManager::construct"
@@ -87,9 +87,9 @@ steps:
     mode: Blocking
     deps: []
     doc: |
-      - 构造: P2pModule(无PostView)
-      - 写 local_state: 分配 P2P 状态/缓存(不启动 transport)
-      - 依赖: 无
+      - Construct `P2pModule` with no PostView
+      - Write local state: allocate P2P state and caches without starting transport
+      - Depends on: none
     exec:
       kind: Construct
       call: "P2pModule::construct"
@@ -101,9 +101,9 @@ steps:
     mode: Blocking
     deps: []
     doc: |
-      - 构造: MasterSegManager(无PostView)
-      - 写 local_state: 分配段管理器状态(不注册RPC)
-      - 依赖: 无
+      - Construct `MasterSegManager` with no PostView
+      - Write local state: allocate segment-manager state without registering RPCs
+      - Depends on: none
     exec:
       kind: Construct
       call: "MasterSegManager::construct"
@@ -115,9 +115,9 @@ steps:
     mode: Blocking
     deps: []
     doc: |
-      - 构造: MasterKvRouter(无PostView)
-      - 写 local_state: 分配策略/缓存/通道(不注册RPC/不启动任务)
-      - 依赖: 无
+      - Construct `MasterKvRouter` with no PostView
+      - Write local state: allocate policy state, caches, and channels without registering RPCs or starting tasks
+      - Depends on: none
     exec:
       kind: Construct
       call: "MasterKvRouter::construct"
@@ -129,9 +129,9 @@ steps:
     mode: Blocking
     deps: []
     doc: |
-      - 构造: MetricReporter(无PostView)
-      - 写 local_state: 准备 registry/缓冲区(不启动 loop)
-      - 依赖: 无
+      - Construct `MetricReporter` with no PostView
+      - Write local state: prepare registries and buffers without starting loops
+      - Depends on: none
     exec:
       kind: Construct
       call: "MetricReporter::construct"
@@ -143,9 +143,9 @@ steps:
     mode: Blocking
     deps: []
     doc: |
-      - 构造: ClientKvApi(无PostView)
-      - 写 local_state: 分配 API 状态(不注册RPC)
-      - 依赖: 无
+      - Construct `ClientKvApi` with no PostView
+      - Write local state: allocate API state without registering RPCs
+      - Depends on: none
     exec:
       kind: Construct
       call: "ClientKvApi::construct"
@@ -157,9 +157,9 @@ steps:
     mode: Blocking
     deps: []
     doc: |
-      - 构造: ClientSegPool(无PostView)
-      - 写 local_state: 准备共享内存相关状态(不写 cluster)
-      - 依赖: 无
+      - Construct `ClientSegPool` with no PostView
+      - Write local state: prepare shared-memory-related state without publishing cluster state
+      - Depends on: none
     exec:
       kind: Construct
       call: "ClientSegPool::construct"
@@ -171,9 +171,9 @@ steps:
     mode: Blocking
     deps: []
     doc: |
-      - 构造: ClientTransferEngine(无PostView)
-      - 写 local_state: 准备 engine 状态(不启动后端)
-      - 依赖: 无
+      - Construct `ClientTransferEngine` with no PostView
+      - Write local state: prepare engine state without starting the backend
+      - Depends on: none
     exec:
       kind: Construct
       call: "ClientTransferEngine::construct"
@@ -185,9 +185,9 @@ steps:
     mode: Blocking
     deps: []
     doc: |
-      - 构造: ExternalClientApi(无PostView)
-      - 写 local_state: 准备 external 状态(不做 owner discovery)
-      - 依赖: 无
+      - Construct `ExternalClientApi` with no PostView
+      - Write local state: prepare external-client state without doing owner discovery
+      - Depends on: none
     exec:
       kind: Construct
       call: "ExternalClientApi::construct"
@@ -199,9 +199,9 @@ steps:
     mode: Blocking
     deps: []
     doc: |
-      - 构造: MasterLeaseManager(无PostView)
-      - 写 local_state: 分配 lease 表/cleanup 状态(不注册RPC)
-      - 依赖: 无
+      - Construct `MasterLeaseManager` with no PostView
+      - Write local state: allocate lease-table and cleanup state without registering RPCs
+      - Depends on: none
     exec:
       kind: Construct
       call: "MasterLeaseManager::construct"
@@ -213,9 +213,9 @@ steps:
     mode: Blocking
     deps: []
     doc: |
-      - 加入: etcd cluster(lease + self member)
-      - 启动: watch members/metadata + event broadcast
-      - 产出: cluster_state 可读写 + cluster_event
+      - Join the etcd cluster with lease and self member registration
+      - Start member and metadata watches plus event broadcast
+      - Produces readable and writable `cluster_state` plus `cluster_event`
     exec:
       kind: Call
       call: "ClusterManager::init2_for_init_dag"
@@ -227,9 +227,9 @@ steps:
     deps:
       - res:cluster_member_watch_ready
     doc: |
-      - 启动: P2P transport + rpc core
-      - 启动: cluster_event listener
-      - 依赖: res:cluster_member_watch_ready(读成员变化)
+      - Start P2P transport and the RPC core
+      - Start the `cluster_event` listener
+      - Depends on: `res:cluster_member_watch_ready` to observe membership changes
     exec:
       kind: Call
       call: "P2pModule::init2_for_init_dag"
@@ -241,8 +241,8 @@ steps:
     deps:
       - P2pModule.step.1.init2
     doc: |
-      - 注册: seg RPC handler/caller
-      - 依赖: P2pModule.step.1.init2(rpc transport)
+      - Register segment RPC handlers and callers
+      - Depends on: `P2pModule.step.1.init2` for RPC transport
     exec:
       kind: Call
       call: "MasterSegManager::init2_for_init_dag"
@@ -255,9 +255,9 @@ steps:
       - ClusterManager.step.1.init2
       - P2pModule.step.1.init2
     doc: |
-      - 注册: master KV RPC handler/caller
-      - 启动: router tasks(delete broadcast + cluster listener)
-      - 依赖: ClusterManager.step.1.init2(监听成员) + P2pModule.step.1.init2(rpc)
+      - Register master KV RPC handlers and callers
+      - Start router tasks such as delete broadcast and cluster listener
+      - Depends on: `ClusterManager.step.1.init2` for membership observation and `P2pModule.step.1.init2` for RPC
     exec:
       kind: Call
       call: "MasterKvRouter::init2_for_init_dag"
@@ -269,9 +269,9 @@ steps:
     deps:
       - ClusterManager.step.1.init2
     doc: |
-      - 启动: monitoring config watcher(异步更新 monitoring_config)
-      - 注册: prom remote_write proxy RPC caller/handler
-      - 依赖: ClusterManager.step.1.init2(读广播)
+      - Start the monitoring-config watcher that updates `monitoring_config` asynchronously
+      - Register Prometheus remote_write proxy RPC handlers and callers
+      - Depends on: `ClusterManager.step.1.init2` to read broadcasts
     exec:
       kind: Call
       call: "MetricReporter::init2_prepare"
@@ -283,8 +283,8 @@ steps:
     deps:
       - res:prom_remote_write_wait_ready
     doc: |
-      - 启动: metric_reporter_loop
-      - 依赖: res:prom_remote_write_wait_ready(内部包含 publish/wait 逻辑) + 本模块 step.1(隐式顺序)
+      - Start `metric_reporter_loop`
+      - Depends on: `res:prom_remote_write_wait_ready`, which includes the internal publish-and-wait logic, plus the implicit ordering after this module's step 1
     exec:
       kind: Call
       call: "MetricReporter::init2_after_prom_remote_write_wait"
@@ -297,9 +297,9 @@ steps:
       - ClusterManager.step.1.init2
       - P2pModule.step.1.init2
     doc: |
-      - 注册: KV API RPC handler/caller
-      - 启动: client_cluster_listener
-      - 依赖: ClusterManager.step.1.init2(读cluster) + P2pModule.step.1.init2(rpc)
+      - Register KV API RPC handlers and callers
+      - Start `client_cluster_listener`
+      - Depends on: `ClusterManager.step.1.init2` to read cluster state and `P2pModule.step.1.init2` for RPC
     exec:
       kind: Call
       call: "ClientKvApi::init2_for_init_dag"
@@ -312,9 +312,9 @@ steps:
       - ClusterManager.step.1.init2
       - P2pModule.step.1.init2
     doc: |
-      - 注册: RequestSegmentRegistration RPC handler
-      - 写 cluster_state: share_group_binding(owner_id + owner_start_time)
-      - 依赖: ClusterManager.step.1.init2(写cluster) + P2pModule.step.1.init2(rpc)
+      - Register the `RequestSegmentRegistration` RPC handler
+      - Write cluster state: publish `share_group_binding(owner_id + owner_start_time)`
+      - Depends on: `ClusterManager.step.1.init2` to write cluster state and `P2pModule.step.1.init2` for RPC
     exec:
       kind: Call
       call: "ClientSegPool::init2_for_init_dag"
@@ -327,9 +327,9 @@ steps:
       - ClusterManager.step.1.init2
       - P2pModule.step.1.init2
     doc: |
-      - 等待: accessible_ip_ready(node_start_time)
-      - 构建: transfer engine backend + p2p transfer rpc
-      - 依赖: ClusterManager.step.1.init2(等ip/监听成员) + P2pModule.step.1.init2(rpc)
+      - Wait for `accessible_ip_ready(node_start_time)`
+      - Build the transfer-engine backend plus P2P transfer RPC
+      - Depends on: `ClusterManager.step.1.init2` to wait for IP visibility and observe members, and `P2pModule.step.1.init2` for RPC
     exec:
       kind: Call
       call: "ClientTransferEngine::init2_for_init_dag"
@@ -342,8 +342,8 @@ steps:
       - ClusterManager.step.1.init2
       - P2pModule.step.1.init2
     doc: |
-      - 准备: ExternalClientApi init(不等待 owner)
-      - 依赖: ClusterManager.step.1.init2(成员/广播) + P2pModule.step.1.init2(rpc)
+      - Prepare `ExternalClientApi` initialization without waiting for the owner
+      - Depends on: `ClusterManager.step.1.init2` for members and broadcasts, and `P2pModule.step.1.init2` for RPC
     exec:
       kind: Call
       call: "ExternalClientApi::init2_prepare"
@@ -355,8 +355,8 @@ steps:
     deps:
       - res:owner_shared_mem_bundle_ready
     doc: |
-      - external: 完成 owner generation / sub_cluster 绑定 + 注册 RPC
-      - 依赖: res:owner_shared_mem_bundle_ready + 本模块 step.1(隐式顺序)
+      - external: finish owner-generation and sub-cluster binding, then register RPCs
+      - Depends on: `res:owner_shared_mem_bundle_ready` plus the implicit ordering after this module's step 1
     exec:
       kind: Call
       call: "ExternalClientApi::init2_after_owner_shared_mem_bundle_ready"
@@ -368,9 +368,9 @@ steps:
     deps:
       - P2pModule.step.1.init2
     doc: |
-      - 注册: lease RPC
-      - 启动: cleanup loop
-      - 依赖: P2pModule.step.1.init2(rpc)
+      - Register lease RPCs
+      - Start the cleanup loop
+      - Depends on: `P2pModule.step.1.init2` for RPC
     exec:
       kind: Call
       call: "MasterLeaseManager::init2_for_init_dag"
@@ -381,8 +381,8 @@ steps:
     mode: Blocking
     deps: []
     doc: |
-      - 注册: 额外 RPC(route-probe/user-rpc)
-      - 依赖: 本模块 step.1 已完成(隐式顺序)
+      - Register extra RPCs such as route-probe and user-rpc
+      - Depends on: the implicit ordering after this module's step 1
     exec:
       kind: Call
       call: "P2pModule::init3_for_init_dag"
@@ -394,9 +394,9 @@ steps:
     deps:
       - ClientTransferEngine.step.1.init2
     doc: |
-      - 调用 transfer_engine: register segments + open_self_segment
-      - 写 cluster_state: publish transfer_ready
-      - 依赖: ClientTransferEngine.step.1.init2(engine ready)
+      - Call the transfer engine to register segments and open the self segment
+      - Write cluster state: publish `transfer_ready`
+      - Depends on: `ClientTransferEngine.step.1.init2` so that the transfer engine is ready
     exec:
       kind: Call
       call: "ClientSegPool::init3_for_init_dag"
diff --git a/fluxon_rs/fluxon_kv/src/client_seg_pool/mod.rs b/fluxon_rs/fluxon_kv/src/client_seg_pool/mod.rs
index fb54c06..c31ef73 100644
--- a/fluxon_rs/fluxon_kv/src/client_seg_pool/mod.rs
+++ b/fluxon_rs/fluxon_kv/src/client_seg_pool/mod.rs
@@ -46,8 +46,7 @@ pub struct ClientSegPoolNewArg {
     pub contribute_size: ContributeToClusterPoolSize,
     pub shared_memory_path: String,
     pub shared_file_path: String,
-    pub log_root_path: String,
-    pub cache_root_path: String,
+    pub large_file_paths: crate::config::LargeFilePaths,
     pub cluster_name: String,
     pub etcd_addresses: Vec<String>,
     pub attach_existing_meta: Option<SharedJsonMeta>,
@@ -206,10 +205,8 @@ pub struct ClientSegPoolInner {
     shared_memory_path: String,
     /// Directory path for regular files (shared.json, side-transfer metadata).
     shared_file_path: String,
-    /// Base directory for runtime logs and profile outputs.
-    log_root_path: String,
-    /// Base directory for large cache files.
-    cache_root_path: String,
+    /// Ordered large-file roots; concrete subdirectories are derived from a fixed relative layout.
+    large_file_paths: crate::config::LargeFilePaths,
     side_transfer_worker: bool,
     attach_owner_ref: Option<ShareGroupOwnerRef>,
 
@@ -269,8 +266,7 @@ impl ClientSegPool {
         let contribute_size = arg.contribute_size;
         let shared_memory_path = arg.shared_memory_path;
         let shared_file_path = arg.shared_file_path;
-        let log_root_path = arg.log_root_path;
-        let cache_root_path = arg.cache_root_path;
+        let large_file_paths = arg.large_file_paths;
         let cluster_name = arg.cluster_name;
         let etcd_addresses = arg.etcd_addresses;
         let attach_existing_meta = arg.attach_existing_meta;
@@ -365,8 +361,7 @@ impl ClientSegPool {
                 view: std::sync::OnceLock::new(),
                 shared_memory_path: shared_memory_path.clone(),
                 shared_file_path: shared_file_path.clone(),
-                log_root_path: log_root_path.clone(),
-                cache_root_path: cache_root_path.clone(),
+                large_file_paths: large_file_paths.clone(),
                 side_transfer_worker,
                 attach_owner_ref,
                 cluster_name: cluster_name.clone(),
@@ -383,8 +378,7 @@ impl ClientSegPool {
                 view: std::sync::OnceLock::new(),
                 shared_memory_path: shared_memory_path.clone(),
                 shared_file_path: shared_file_path.clone(),
-                log_root_path: log_root_path.clone(),
-                cache_root_path: cache_root_path.clone(),
+                large_file_paths: large_file_paths.clone(),
                 side_transfer_worker,
                 attach_owner_ref,
                 cluster_name: cluster_name.clone(),
@@ -548,8 +542,7 @@ impl ClientSegPool {
             view: std::sync::OnceLock::new(),
             shared_memory_path: base_path.to_string(),
             shared_file_path: shared_file_path.clone(),
-            log_root_path,
-            cache_root_path,
+            large_file_paths,
             side_transfer_worker,
             attach_owner_ref,
             cluster_name,
@@ -568,8 +561,8 @@ impl ClientSegPool {
         &self.inner().shared_file_path
     }
 
-    pub fn cache_root_path(&self) -> &str {
-        &self.inner().cache_root_path
+    pub fn large_file_paths(&self) -> &crate::config::LargeFilePaths {
+        &self.inner().large_file_paths
     }
 
     fn transfer_rpc_fast_path_eligible_members(&self) -> Vec<ClusterMember> {
@@ -1180,10 +1173,7 @@ impl ClientSegPool {
             etcd_addresses: inner.etcd_addresses.clone(),
             shared_memory_path: shared_memory_canonical,
             shared_file_path: shared_file_canonical,
-            large_file_paths: crate::config::LargeFilePaths {
-                log_root_path: inner.log_root_path.clone(),
-                cache_root_path: inner.cache_root_path.clone(),
-            },
+            large_file_paths: inner.large_file_paths.clone(),
 
             protocol_version,
 
diff --git a/fluxon_rs/fluxon_kv/src/config.rs b/fluxon_rs/fluxon_kv/src/config.rs
index 8ea906f..973d15e 100644
--- a/fluxon_rs/fluxon_kv/src/config.rs
+++ b/fluxon_rs/fluxon_kv/src/config.rs
@@ -390,6 +390,23 @@ fn verify_non_empty_root_path(root: &str, field_name: &str) -> KvResult<String>
     Ok(trimmed.to_string())
 }
 
+fn verify_non_empty_root_path_list(root_paths: &[String], field_name: &str) -> KvResult<Vec<String>> {
+    if root_paths.is_empty() {
+        return Err(ConfigError::InvalidClientConfig {
+            detail: format!("{field_name} must contain at least one path"),
+        }
+        .into_kverror());
+    }
+    let mut out = Vec::with_capacity(root_paths.len());
+    for (idx, root) in root_paths.iter().enumerate() {
+        out.push(verify_non_empty_root_path(
+            root,
+            &format!("{field_name}[{idx}]"),
+        )?);
+    }
+    Ok(out)
+}
+
 fn resolve_compiled_rdma_transfer_engine() -> KvResult<TransferEngineType> {
     Ok(TransferEngineType::Closed)
 }
@@ -575,8 +592,7 @@ pub struct FluxonKvSpecYaml {
 #[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
 #[serde(deny_unknown_fields)]
 pub struct LargeFilePathsYaml {
-    pub log_root_path: String,
-    pub cache_root_path: String,
+    pub root_paths: Vec<String>,
 }
 
 #[derive(Debug, Clone, Serialize, Deserialize)]
@@ -630,8 +646,71 @@ pub struct FluxonKvSpec {
 
 #[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
 pub struct LargeFilePaths {
-    pub log_root_path: String,
-    pub cache_root_path: String,
+    pub root_paths: Vec<String>,
+}
+
+impl LargeFilePaths {
+    fn require_configured_root_paths(&self) -> KvResult<()> {
+        if self.root_paths.is_empty() {
+            return Err(ConfigError::InvalidClientConfig {
+                detail: "large_file_paths.root_paths must contain at least one path".to_string(),
+            }
+            .into_kverror());
+        }
+        Ok(())
+    }
+
+    fn resolve_preferred_root_subdir(
+        &self,
+        relative_dir: &Path,
+        target_name: &str,
+    ) -> KvResult<PathBuf> {
+        self.require_configured_root_paths()?;
+        let mut errors = Vec::new();
+        for root in &self.root_paths {
+            let candidate = Path::new(root).join(relative_dir);
+            match fs::create_dir_all(&candidate) {
+                Ok(()) => return Ok(candidate),
+                Err(err) => errors.push(format!("{} ({})", candidate.display(), err)),
+            }
+        }
+        Err(ConfigError::InvalidClientConfig {
+            detail: format!(
+                "large_file_paths.root_paths contains no usable root for {}; tried: {}",
+                target_name,
+                errors.join(", ")
+            ),
+        }
+        .into_kverror())
+    }
+
+    pub fn kv_logs_dir(&self, cluster_name: &str) -> KvResult<PathBuf> {
+        let relative_dir = PathBuf::from(format!("{cluster_name}_cluster_kv_logs"));
+        self.resolve_preferred_root_subdir(&relative_dir, "kv logs")
+    }
+
+    pub fn kv_profiles_dir(&self, cluster_name: &str) -> KvResult<PathBuf> {
+        let relative_dir = PathBuf::from(format!("{cluster_name}_cluster_kv_profiles"));
+        self.resolve_preferred_root_subdir(&relative_dir, "kv profiles")
+    }
+
+    pub fn side_transfer_runtime_dir(
+        &self,
+        cluster_name: &str,
+        instance_key: &str,
+    ) -> KvResult<PathBuf> {
+        let relative_dir = PathBuf::from(format!(
+            "{cluster_name}_cluster_kv_logs/side_transfer_runtime/{instance_key}"
+        ));
+        self.resolve_preferred_root_subdir(&relative_dir, "side-transfer runtime")
+    }
+
+    pub fn fs_disk_cache_base_dir(&self) -> KvResult<PathBuf> {
+        self.resolve_preferred_root_subdir(
+            Path::new("fluxon_fs_disk_cache"),
+            "fluxon fs disk cache",
+        )
+    }
 }
 
 /// KV client backend types supported by the system
@@ -1086,15 +1165,12 @@ impl ClientConfigYaml {
             }
             .into_kverror());
         }
-        // Owner mode always needs explicit large-file roots for logs and caches.
+        // Owner mode always needs explicit ordered large-file roots.
         // The listen port stays optional at this contract layer: deterministic
         // callers may pin it, while shared testbed owners can leave it unset
         // and let the runtime bind a free port.
         let large_file_paths = if is_external {
-            LargeFilePaths {
-                log_root_path: String::new(),
-                cache_root_path: String::new(),
-            }
+            LargeFilePaths { root_paths: Vec::new() }
         } else {
             let Some(large_file_paths_yaml) = self.fluxonkv_spec.large_file_paths.as_ref() else {
                 return Err(ConfigError::InvalidClientConfig {
@@ -1103,17 +1179,11 @@ impl ClientConfigYaml {
                 }
                 .into_kverror());
             };
-            let log_root_path = verify_non_empty_root_path(
-                &large_file_paths_yaml.log_root_path,
-                "large_file_paths.log_root_path",
-            )?;
-            let cache_root_path = verify_non_empty_root_path(
-                &large_file_paths_yaml.cache_root_path,
-                "large_file_paths.cache_root_path",
-            )?;
             LargeFilePaths {
-                log_root_path,
-                cache_root_path,
+                root_paths: verify_non_empty_root_path_list(
+                    &large_file_paths_yaml.root_paths,
+                    "large_file_paths.root_paths",
+                )?,
             }
         };
 
@@ -1477,6 +1547,13 @@ impl MasterConfigYaml {
 #[cfg(test)]
 mod tests {
     use super::*;
+    use uuid::Uuid;
+
+    fn new_test_dir(prefix: &str) -> PathBuf {
+        let path = std::env::temp_dir().join(format!("{}_{}", prefix, Uuid::new_v4()));
+        std::fs::create_dir_all(&path).unwrap();
+        path
+    }
 
     #[test]
     fn cluster_scoped_shared_path_appends_cluster_name() {
@@ -1498,8 +1575,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
   large_file_paths:
-    log_root_path: /tmp/test_owner_logs
-    cache_root_path: /tmp/test_owner_cache
+    root_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   disable_observability: true
@@ -1547,8 +1623,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
   large_file_paths:
-    log_root_path: /tmp/test_owner_logs
-    cache_root_path: /tmp/test_owner_cache
+    root_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 "#,
         )
@@ -1574,8 +1649,7 @@ fluxonkv_spec:
         )
         .unwrap();
         let verified = cfg.verify().unwrap();
-        assert_eq!(verified.large_file_paths.log_root_path, "");
-        assert_eq!(verified.large_file_paths.cache_root_path, "");
+        assert_eq!(verified.large_file_paths.root_paths, Vec::<String>::new());
         assert_eq!(verified.fluxonkv_spec.etcd_addresses, Vec::<String>::new());
         assert_eq!(verified.fluxonkv_spec.sub_cluster, None);
     }
@@ -1590,8 +1664,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_external
   shared_file_path: /tmp/test_external_files
   large_file_paths:
-    log_root_path: /tmp/test_external_logs
-    cache_root_path: /tmp/test_external_cache
+    root_paths: [/tmp/test_external_large]
 "#,
         )
         .unwrap();
@@ -1600,6 +1673,28 @@ fluxonkv_spec:
         assert!(text.contains("fluxonkv_spec.large_file_paths is forbidden in zero-contribution mode"));
     }
 
+    #[test]
+    fn large_file_paths_prefers_first_usable_root() {
+        let tempdir = new_test_dir("fluxon_large_paths_prefers_first_usable_root");
+        let first_root = tempdir.join("first_root");
+        let second_root = tempdir.join("second_root");
+        std::fs::create_dir_all(&second_root).unwrap();
+
+        let large_file_paths = LargeFilePaths {
+            root_paths: vec![
+                first_root.join("child").to_string_lossy().into_owned(),
+                second_root.to_string_lossy().into_owned(),
+            ],
+        };
+
+        let logs_dir = large_file_paths.kv_logs_dir("test_cluster").unwrap();
+        assert_eq!(
+            logs_dir,
+            first_root.join("child").join("test_cluster_cluster_kv_logs")
+        );
+        assert!(logs_dir.exists());
+    }
+
     #[test]
     fn client_test_spec_config_accepts_explicit_rdma_device_names() {
         let cfg = ClientConfigYaml::from_str(
@@ -1614,8 +1709,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
   large_file_paths:
-    log_root_path: /tmp/test_owner_logs
-    cache_root_path: /tmp/test_owner_cache
+    root_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   transport_mode: transfer_with_rpc
@@ -1670,8 +1764,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
   large_file_paths:
-    log_root_path: /tmp/test_owner_logs
-    cache_root_path: /tmp/test_owner_cache
+    root_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   rdma_device_names: ["mlx5_0"]
@@ -1708,8 +1801,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
   large_file_paths:
-    log_root_path: /tmp/test_owner_logs
-    cache_root_path: /tmp/test_owner_cache
+    root_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   transport_mode: transfer_with_rpc
@@ -1742,8 +1834,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
   large_file_paths:
-    log_root_path: /tmp/test_owner_logs
-    cache_root_path: /tmp/test_owner_cache
+    root_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   require_transfer_rpc_fast_path_ready_timeout_seconds: 45
@@ -1770,8 +1861,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
   large_file_paths:
-    log_root_path: /tmp/test_owner_logs
-    cache_root_path: /tmp/test_owner_cache
+    root_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   tcp_thread_control_lane_count: 0
@@ -1799,8 +1889,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
   large_file_paths:
-    log_root_path: /tmp/test_owner_logs
-    cache_root_path: /tmp/test_owner_cache
+    root_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   transport_mode: transfer_with_rpc
@@ -1833,8 +1922,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
   large_file_paths:
-    log_root_path: /tmp/test_owner_logs
-    cache_root_path: /tmp/test_owner_cache
+    root_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   transport_mode: transfer_with_rpc
@@ -1860,8 +1948,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
   large_file_paths:
-    log_root_path: /tmp/test_owner_logs
-    cache_root_path: /tmp/test_owner_cache
+    root_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   rdma_device_names: ["mlx5_0"]
@@ -1917,8 +2004,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_side_worker
   shared_file_path: /tmp/test_side_worker_files
   large_file_paths:
-    log_root_path: /tmp/test_side_worker_logs
-    cache_root_path: /tmp/test_side_worker_cache
+    root_paths: [/tmp/test_side_worker_large]
   p2p_listen_port: 18081
 test_spec_config:
   enable_side_transfer: true
@@ -1959,8 +2045,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_side_worker
   shared_file_path: /tmp/test_side_worker_files
   large_file_paths:
-    log_root_path: /tmp/test_side_worker_logs
-    cache_root_path: /tmp/test_side_worker_cache
+    root_paths: [/tmp/test_side_worker_large]
 test_spec_config:
   enable_side_transfer: true
   side_transfer_role: worker
@@ -1993,8 +2078,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_side_worker
   shared_file_path: /tmp/test_side_worker_files
   large_file_paths:
-    log_root_path: /tmp/test_side_worker_logs
-    cache_root_path: /tmp/test_side_worker_cache
+    root_paths: [/tmp/test_side_worker_large]
 test_spec_config:
   enable_side_transfer: true
   side_transfer_role: worker
@@ -2025,8 +2109,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
   large_file_paths:
-    log_root_path: /tmp/test_owner_logs
-    cache_root_path: /tmp/test_owner_cache
+    root_paths: [/tmp/test_owner_large]
   p2p_listen_port: 18081
   sub_cluster: rack-a
 test_spec_config:
@@ -2060,8 +2143,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
   large_file_paths:
-    log_root_path: /tmp/test_owner_logs
-    cache_root_path: /tmp/test_owner_cache
+    root_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 "#,
         )
@@ -2088,8 +2170,7 @@ fluxonkv_spec:
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
   large_file_paths:
-    log_root_path: /tmp/test_owner_logs
-    cache_root_path: /tmp/test_owner_cache
+    root_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   transport_mode: transfer_with_rpc
diff --git a/fluxon_rs/fluxon_kv/src/external_client_api/external_client_test.rs b/fluxon_rs/fluxon_kv/src/external_client_api/external_client_test.rs
index 6a36ca7..765881a 100644
--- a/fluxon_rs/fluxon_kv/src/external_client_api/external_client_test.rs
+++ b/fluxon_rs/fluxon_kv/src/external_client_api/external_client_test.rs
@@ -83,8 +83,7 @@ fn new_client_config(
         shared_memory_path: shm_path.to_string(),
         shared_file_path: format!("{}_files", shm_path),
         large_file_paths: LargeFilePaths {
-            log_root_path: format!("{}_logs", shm_path),
-            cache_root_path: format!("{}_cache", shm_path),
+            root_paths: vec![format!("{}_large", shm_path)],
         },
         test_spec_config: TestSpecConfig::default(),
     }
@@ -128,10 +127,7 @@ fn new_zero_contribution_client_config(
         },
         shared_memory_path: shm_path.to_string(),
         shared_file_path: format!("{}_files", shm_path),
-        large_file_paths: LargeFilePaths {
-            log_root_path: String::new(),
-            cache_root_path: String::new(),
-        },
+        large_file_paths: LargeFilePaths { root_paths: Vec::new() },
         test_spec_config: TestSpecConfig::default(),
     }
 }
diff --git a/fluxon_rs/fluxon_kv/src/external_client_api/mod.rs b/fluxon_rs/fluxon_kv/src/external_client_api/mod.rs
index 0758ab5..3830e21 100644
--- a/fluxon_rs/fluxon_kv/src/external_client_api/mod.rs
+++ b/fluxon_rs/fluxon_kv/src/external_client_api/mod.rs
@@ -253,7 +253,7 @@ define_module!(
 pub struct ExternalClientApiNewArg {
     pub shared_memory_path: String,
     pub shared_file_path: String,
-    pub cache_root_path: String,
+    pub large_file_paths: crate::config::LargeFilePaths,
     pub expected_cluster_name: String,
     pub expected_protocol_version: String,
     pub enable_side_transfer: bool,
@@ -313,7 +313,7 @@ pub struct ExternalInner {
     expected_protocol_version: String,
     external_shared_memory_path: String,
     external_shared_file_path: String,
-    external_cache_root_path: String,
+    external_large_file_paths: crate::config::LargeFilePaths,
     _enable_side_transfer: bool,
     short_circuit_put_payload_path: bool,
     side_rr_next: AtomicUsize,
@@ -365,7 +365,7 @@ impl ExternalClientApi {
             expected_protocol_version: arg.expected_protocol_version,
             external_shared_memory_path: arg.shared_memory_path,
             external_shared_file_path: arg.shared_file_path,
-            external_cache_root_path: arg.cache_root_path,
+            external_large_file_paths: arg.large_file_paths,
             _enable_side_transfer: arg.enable_side_transfer,
             short_circuit_put_payload_path: arg.short_circuit_put_payload_path,
             side_rr_next: AtomicUsize::new(0),
@@ -1240,8 +1240,8 @@ impl ExternalInner {
         self.external_shared_file_path.clone()
     }
 
-    pub fn cache_root_path(&self) -> String {
-        self.external_cache_root_path.clone()
+    pub fn large_file_paths(&self) -> &crate::config::LargeFilePaths {
+        &self.external_large_file_paths
     }
 
     fn should_fallback_side_p2p_error(err: &crate::p2p::P2PError) -> bool {
diff --git a/fluxon_rs/fluxon_kv/src/kv_test.rs b/fluxon_rs/fluxon_kv/src/kv_test.rs
index 8c3a711..b1b79c9 100644
--- a/fluxon_rs/fluxon_kv/src/kv_test.rs
+++ b/fluxon_rs/fluxon_kv/src/kv_test.rs
@@ -767,8 +767,8 @@ struct KvTestRoundOptions {
     round_profile: KvTestRoundProfile,
     round_name: String,
     cluster_name: String,
-    master_port: u16,
-    step8_master_port: u16,
+    master_port: Option<u16>,
+    step8_master_port: Option<u16>,
     master_options: KvTestClientOptions,
     owner_client_options: KvTestClientOptions,
     external_client_options: KvTestClientOptions,
@@ -857,14 +857,10 @@ fn default_client_large_file_paths(
     if contribute_to_cluster_pool_size.dram == 0
         && contribute_to_cluster_pool_size.vram.is_empty()
     {
-        return LargeFilePaths {
-            log_root_path: String::new(),
-            cache_root_path: String::new(),
-        };
+        return LargeFilePaths { root_paths: Vec::new() };
     }
     LargeFilePaths {
-        log_root_path: format!("/tmp/kvcache_large/log/{}", instance_key),
-        cache_root_path: format!("/tmp/kvcache_large/cache/{}", instance_key),
+        root_paths: vec![format!("/tmp/kvcache_large/{}", instance_key)],
     }
 }
 
@@ -910,7 +906,7 @@ fn default_external_test_client_options() -> KvTestClientOptions {
     }
 }
 
-fn new_kv_test_round(round_profile: KvTestRoundProfile, master_port: u16) -> KvTestRoundOptions {
+fn new_kv_test_round(round_profile: KvTestRoundProfile) -> KvTestRoundOptions {
     let round_name = round_profile.round_name();
     KvTestRoundOptions {
         round_profile,
@@ -918,8 +914,8 @@ fn new_kv_test_round(round_profile: KvTestRoundProfile, master_port: u16) -> KvT
         // Keep each process run on its own cluster namespace so a crashed/aborted previous run
         // cannot poison the next rerun with stale members.
         cluster_name: format!("test_cluster_{}_{}", round_name, kv_test_run_scope()),
-        master_port,
-        step8_master_port: master_port + 10,
+        master_port: None,
+        step8_master_port: None,
         master_options: default_master_test_client_options(round_profile),
         owner_client_options: default_owner_test_client_options(round_profile),
         external_client_options: default_external_test_client_options(),
@@ -937,16 +933,16 @@ fn default_kv_test_run_options() -> KvTestRunOptions {
             .map(str::trim)
             .filter(|item| !item.is_empty())
         {
-            let (profile, port) = match round_name {
-                "p2p_only" => (KvTestRoundProfile::P2pOnly, 50220),
-                "rdma_transfer_only" => (KvTestRoundProfile::RdmaTransferOnly, 50240),
-                "rdma_transfer_with_rpc" => (KvTestRoundProfile::RdmaTransferWithRpc, 50260),
+            let profile = match round_name {
+                "p2p_only" => KvTestRoundProfile::P2pOnly,
+                "rdma_transfer_only" => KvTestRoundProfile::RdmaTransferOnly,
+                "rdma_transfer_with_rpc" => KvTestRoundProfile::RdmaTransferWithRpc,
                 other => panic!(
                     "unsupported FLUXON_KV_TEST_ROUNDS entry '{}'; expected one of: p2p_only, rdma_transfer_only, rdma_transfer_with_rpc",
                     other
                 ),
             };
-            rounds.push(new_kv_test_round(profile, port));
+            rounds.push(new_kv_test_round(profile));
         }
         if rounds.is_empty() {
             panic!("FLUXON_KV_TEST_ROUNDS was set but produced no valid rounds");
@@ -956,9 +952,9 @@ fn default_kv_test_run_options() -> KvTestRunOptions {
 
     KvTestRunOptions {
         rounds: vec![
-            new_kv_test_round(KvTestRoundProfile::P2pOnly, 50220),
-            new_kv_test_round(KvTestRoundProfile::RdmaTransferOnly, 50240),
-            new_kv_test_round(KvTestRoundProfile::RdmaTransferWithRpc, 50260),
+            new_kv_test_round(KvTestRoundProfile::P2pOnly),
+            new_kv_test_round(KvTestRoundProfile::RdmaTransferOnly),
+            new_kv_test_round(KvTestRoundProfile::RdmaTransferWithRpc),
         ],
     }
 }
@@ -967,7 +963,7 @@ fn default_kv_test_run_options() -> KvTestRunOptions {
 fn new_master_launch(
     round: &KvTestRoundOptions,
     instance_key: &str,
-    port: u16,
+    port: Option<u16>,
 ) -> KvTestMasterLaunch {
     // Read etcd endpoint from project root build_config_ext.yml
     let etcd = fluxon_util::dev_config::read_etcd_endpoint_from_build_config()
@@ -998,7 +994,7 @@ fn new_master_launch(
         config: MasterConfig {
             instance_key: round.scoped_instance_key(instance_key),
             cluster_name: round.cluster_name.clone(),
-            port: Some(port),
+            port,
             etcd_endpoints: vec![etcd.clone()],
             protocol,
             transfer_engine,
@@ -1879,7 +1875,7 @@ async fn run_kv_step8(round: &KvTestRoundOptions) {
 
 async fn run_kv_round(round: &KvTestRoundOptions) {
     info!(
-        "Round '{}' uses cluster '{}' and master ports {} / {}",
+        "Round '{}' uses cluster '{}' and master ports {:?} / {:?}",
         round.round_name, round.cluster_name, round.master_port, round.step8_master_port
     );
 
diff --git a/fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs b/fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs
index 1b5754d..b569fe0 100644
--- a/fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs
+++ b/fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs
@@ -148,8 +148,7 @@ fn new_client_config_with_cluster_and_dram(
         shared_memory_path,
         shared_file_path,
         large_file_paths: crate::config::LargeFilePaths {
-            log_root_path: format!("{}/large_logs/{}", base, instance_key),
-            cache_root_path: format!("{}/large_cache/{}", base, instance_key),
+            root_paths: vec![format!("{}/large/{}", base, instance_key)],
         },
         test_spec_config: TestSpecConfig::default(),
     };
diff --git a/fluxon_rs/fluxon_kv/src/lib.rs b/fluxon_rs/fluxon_kv/src/lib.rs
index 96e9b28..0a35f69 100644
--- a/fluxon_rs/fluxon_kv/src/lib.rs
+++ b/fluxon_rs/fluxon_kv/src/lib.rs
@@ -112,6 +112,13 @@ struct ExternalBootstrapBundle {
     etcd_endpoints: Vec<String>,
 }
 
+struct ExternalBootstrapMetadata {
+    meta: SharedJsonMeta,
+    shared_memory_path: String,
+    shared_file_path: String,
+    etcd_endpoints: Vec<String>,
+}
+
 fn cluster_manager_rdma_control_init_from_transfer_config(
     _transfer_engine: TransferEngineType,
     _protocol: &ProtocolConfig,
@@ -849,10 +856,10 @@ fn build_side_transfer_worker_config_yaml(
 }
 
 fn side_transfer_runtime_dir(owner_config: &ClientConfig) -> PathBuf {
-    Path::new(&owner_config.large_file_paths.log_root_path)
-        .join(format!("{}_cluster_kv_logs", owner_config.cluster_name))
-        .join("side_transfer_runtime")
-        .join(&owner_config.instance_key)
+    owner_config
+        .large_file_paths
+        .side_transfer_runtime_dir(&owner_config.cluster_name, &owner_config.instance_key)
+        .unwrap_or_else(|err| panic!("invalid owner large_file_paths: {}", err))
 }
 
 fn cluster_manager_local_ipc_root(
@@ -1592,44 +1599,34 @@ async fn bootstrap_zero_contribution_client_config(config: ClientConfig) -> KvRe
         return Ok(config);
     }
 
-    let bundle = wait_for_external_bootstrap_bundle(&config).await?;
+    let metadata = load_external_bootstrap_metadata(
+        &config.shared_memory_path,
+        &config.shared_file_path,
+        &config.cluster_name,
+    )
+    .await?;
     let mut final_config = config;
-    final_config.etcd_addresses_raw = bundle.meta.etcd_addresses.clone();
-    final_config.fluxonkv_spec.etcd_addresses = bundle.etcd_endpoints;
-    final_config.fluxonkv_spec.sub_cluster = bundle.meta.sub_cluster.clone();
-    final_config.shared_memory_path = bundle.shared_memory_path;
-    final_config.shared_file_path = bundle.shared_file_path;
-    final_config.large_file_paths = bundle.meta.large_file_paths;
+    final_config.etcd_addresses_raw = metadata.meta.etcd_addresses.clone();
+    final_config.fluxonkv_spec.etcd_addresses = metadata.etcd_endpoints;
+    final_config.fluxonkv_spec.sub_cluster = metadata.meta.sub_cluster.clone();
+    final_config.shared_memory_path = metadata.shared_memory_path;
+    final_config.shared_file_path = metadata.shared_file_path;
+    final_config.large_file_paths = metadata.meta.large_file_paths;
     Ok(final_config)
 }
 
-async fn wait_for_external_bootstrap_bundle(
-    config: &ClientConfig,
-) -> KvResult<ExternalBootstrapBundle> {
+async fn load_external_bootstrap_metadata(
+    shared_memory_path: &str,
+    shared_file_path: &str,
+    expected_cluster_name: &str,
+) -> KvResult<ExternalBootstrapMetadata> {
     let build_version = fluxon_util::git_version_build_record::get_current_git_commitid().unwrap();
-    let shared_memory_dir = Path::new(&config.shared_memory_path);
-    let shared_file_dir = Path::new(&config.shared_file_path);
+    let shared_memory_dir = Path::new(shared_memory_path);
+    let shared_file_dir = Path::new(shared_file_path);
     let shared_json_path = shared_file_dir.join("shared.json");
-    let mmap_file_path = shared_memory_dir.join("mmap.file");
 
     let mut waited_ticks: u64 = 0;
     loop {
-        if !shared_json_path.exists() || !mmap_file_path.exists() {
-            limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
-            waited_ticks += 1;
-            if waited_ticks % 25 == 0 {
-                info!(
-                    "Waiting owner shared bundle to be ready... ({}s), shm_dir={} file_dir={} (shared.json={}, mmap.file={})",
-                    waited_ticks / 5,
-                    shared_memory_dir.to_string_lossy(),
-                    shared_file_dir.to_string_lossy(),
-                    shared_json_path.exists(),
-                    mmap_file_path.exists()
-                );
-            }
-            continue;
-        }
-
         let shared_json_buf = match std::fs::read_to_string(&shared_json_path) {
             Ok(v) => v,
             Err(e) => {
@@ -1680,7 +1677,7 @@ async fn wait_for_external_bootstrap_bundle(
             continue;
         }
 
-        if meta.cluster_name != config.cluster_name {
+        if meta.cluster_name != expected_cluster_name {
             limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
             waited_ticks += 1;
             if waited_ticks % 25 == 0 {
@@ -1689,14 +1686,14 @@ async fn wait_for_external_bootstrap_bundle(
                     waited_ticks / 5,
                     shared_memory_dir.to_string_lossy(),
                     shared_file_dir.to_string_lossy(),
-                    config.cluster_name,
+                    expected_cluster_name,
                     meta.cluster_name
                 );
             }
             continue;
         }
 
-        let shared_memory_path_canonical = match std::fs::canonicalize(&config.shared_memory_path) {
+        let shared_memory_path_canonical = match std::fs::canonicalize(shared_memory_path) {
             Ok(v) => v.to_string_lossy().into_owned(),
             Err(e) => {
                 limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
@@ -1706,7 +1703,7 @@ async fn wait_for_external_bootstrap_bundle(
                         "Waiting shared_memory_path canonicalizable... ({}s), shm_dir='{}', path='{}', err={}",
                         waited_ticks / 5,
                         shared_memory_dir.to_string_lossy(),
-                        config.shared_memory_path,
+                        shared_memory_path,
                         e
                     );
                 }
@@ -1732,7 +1729,7 @@ async fn wait_for_external_bootstrap_bundle(
             }
         };
 
-        let shared_file_path_canonical = match std::fs::canonicalize(&config.shared_file_path) {
+        let shared_file_path_canonical = match std::fs::canonicalize(shared_file_path) {
             Ok(v) => v.to_string_lossy().into_owned(),
             Err(e) => {
                 limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
@@ -1742,7 +1739,7 @@ async fn wait_for_external_bootstrap_bundle(
                         "Waiting shared_file_path canonicalizable... ({}s), file_dir='{}', path='{}', err={}",
                         waited_ticks / 5,
                         shared_file_dir.to_string_lossy(),
-                        config.shared_file_path,
+                        shared_file_path,
                         e
                     );
                 }
@@ -1830,7 +1827,7 @@ async fn wait_for_external_bootstrap_bundle(
             }
         };
 
-        return Ok(ExternalBootstrapBundle {
+        return Ok(ExternalBootstrapMetadata {
             meta,
             shared_memory_path: meta_shm_canonical,
             shared_file_path: meta_file_canonical,
@@ -1839,6 +1836,46 @@ async fn wait_for_external_bootstrap_bundle(
     }
 }
 
+async fn wait_for_external_bootstrap_bundle(
+    config: &ClientConfig,
+) -> KvResult<ExternalBootstrapBundle> {
+    let metadata = load_external_bootstrap_metadata(
+        &config.shared_memory_path,
+        &config.shared_file_path,
+        &config.cluster_name,
+    )
+    .await?;
+    let shared_memory_dir = Path::new(&metadata.shared_memory_path);
+    let shared_file_dir = Path::new(&metadata.shared_file_path);
+    let shared_json_path = shared_file_dir.join("shared.json");
+    let mmap_file_path = shared_memory_dir.join("mmap.file");
+
+    let mut waited_ticks: u64 = 0;
+    loop {
+        if !shared_json_path.exists() || !mmap_file_path.exists() {
+            limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
+            waited_ticks += 1;
+            if waited_ticks % 25 == 0 {
+                info!(
+                    "Waiting owner shared bundle to be ready... ({}s), shm_dir={} file_dir={} (shared.json={}, mmap.file={})",
+                    waited_ticks / 5,
+                    shared_memory_dir.to_string_lossy(),
+                    shared_file_dir.to_string_lossy(),
+                    shared_json_path.exists(),
+                    mmap_file_path.exists()
+                );
+            }
+            continue;
+        }
+        return Ok(ExternalBootstrapBundle {
+            meta: metadata.meta,
+            shared_memory_path: metadata.shared_memory_path,
+            shared_file_path: metadata.shared_file_path,
+            etcd_endpoints: metadata.etcd_endpoints,
+        });
+    }
+}
+
 async fn run_client_impl(
     config_arg: ConfigArg<ClientConfig>,
     test_overrides: Option<ClientRunTestOverrides>,
@@ -1869,8 +1906,10 @@ async fn run_client_impl(
     let source_sha256 = fluxon_util::build_info::SOURCE_SHA256;
 
     // Logs and other large files are isolated from shared.json/peer metadata.
-    let kv_logs_dir = Path::new(&config.large_file_paths.log_root_path)
-        .join(format!("{}_cluster_kv_logs", config.cluster_name));
+    let kv_logs_dir = config
+        .large_file_paths
+        .kv_logs_dir(&config.cluster_name)
+        .map_err(|e| anyhow::anyhow!("invalid large_file_paths for kv logs: {}", e))?;
     let observability_disabled = config.test_spec_config.disable_observability;
     let greptime_tracing_rx = if observability_disabled {
         fluxon_util::init_log(&kv_logs_dir, &config.instance_key);
@@ -1920,7 +1959,7 @@ async fn run_client_impl(
             config.test_spec_config.side_transfer_role,
             Some(SideTransferRole::Worker)
         );
-    let bootstrapped_shared_meta = if is_external {
+    let bootstrapped_shared_meta = if is_side_transfer_worker {
         Some(wait_for_external_bootstrap_bundle(&config).await?.meta)
     } else {
         None
@@ -2028,7 +2067,7 @@ async fn run_client_impl(
             external_client_api_arg: ExternalClientApiNewArg {
                 shared_memory_path: config.shared_memory_path.clone(),
                 shared_file_path: config.shared_file_path.clone(),
-                cache_root_path: config.large_file_paths.cache_root_path.clone(),
+                large_file_paths: config.large_file_paths.clone(),
                 expected_cluster_name: config.cluster_name.clone(),
                 expected_protocol_version: build_version.clone(),
                 enable_side_transfer: config.test_spec_config.enable_side_transfer,
@@ -2080,8 +2119,7 @@ async fn run_client_impl(
                 // Read shared memory path from config (must not be empty).
                 shared_memory_path: config.shared_memory_path.clone(),
                 shared_file_path: config.shared_file_path.clone(),
-                log_root_path: config.large_file_paths.log_root_path.clone(),
-                cache_root_path: config.large_file_paths.cache_root_path.clone(),
+                large_file_paths: config.large_file_paths.clone(),
                 cluster_name: config.cluster_name.clone(),
                 etcd_addresses: config.etcd_addresses_raw.clone(),
                 attach_existing_meta: if is_side_transfer_worker {
@@ -2424,8 +2462,10 @@ async fn run_client_impl(
     }
 
     let shutdown_waiter = framework.cluster_manager_view().register_shutdown_waiter();
-    let kv_profiles_dir = Path::new(&config.large_file_paths.log_root_path)
-        .join(format!("{}_cluster_kv_profiles", config.cluster_name));
+    let kv_profiles_dir = config
+        .large_file_paths
+        .kv_profiles_dir(&config.cluster_name)
+        .map_err(|e| anyhow::anyhow!("invalid large_file_paths for kv profiles: {}", e))?;
     profile::spawn_pprof_flamegraph_on_timeout_or_shutdown(
         config.pprof_duration_seconds,
         kv_profiles_dir,
@@ -2505,8 +2545,7 @@ mod tests {
             shared_memory_path: "/tmp/fluxon_side_transfer_test".to_string(),
             shared_file_path: "/tmp/fluxon_side_transfer_test_files".to_string(),
             large_file_paths: crate::config::LargeFilePaths {
-                log_root_path: "/tmp/fluxon_side_transfer_test_large/log".to_string(),
-                cache_root_path: "/tmp/fluxon_side_transfer_test_large/cache".to_string(),
+                root_paths: vec!["/tmp/fluxon_side_transfer_test_large".to_string()],
             },
             test_spec_config: TestSpecConfig {
                 enable_side_transfer: true,
@@ -2757,12 +2796,10 @@ mod tests {
         let tempdir = new_test_dir("fluxon_external_bootstrap_large_paths");
         let shared_memory_root = tempdir.join("shared_mem");
         let shared_file_root = tempdir.join("shared_file");
-        let owner_log_root = tempdir.join("owner_logs");
-        let owner_cache_root = tempdir.join("owner_cache");
+        let owner_large_root = tempdir.join("owner_large");
         std::fs::create_dir_all(&shared_memory_root).unwrap();
         std::fs::create_dir_all(&shared_file_root).unwrap();
-        std::fs::create_dir_all(&owner_log_root).unwrap();
-        std::fs::create_dir_all(&owner_cache_root).unwrap();
+        std::fs::create_dir_all(&owner_large_root).unwrap();
         std::fs::write(shared_memory_root.join("mmap.file"), vec![0u8; 4096]).unwrap();
 
         let shared_meta = SharedJsonMeta {
@@ -2782,8 +2819,7 @@ mod tests {
                 .to_string_lossy()
                 .into_owned(),
             large_file_paths: crate::config::LargeFilePaths {
-                log_root_path: owner_log_root.to_string_lossy().into_owned(),
-                cache_root_path: owner_cache_root.to_string_lossy().into_owned(),
+                root_paths: vec![owner_large_root.to_string_lossy().into_owned()],
             },
             protocol_version:
                 fluxon_util::git_version_build_record::get_current_git_commitid().unwrap(),
@@ -2819,10 +2855,7 @@ mod tests {
             },
             shared_memory_path: shared_memory_root.to_string_lossy().into_owned(),
             shared_file_path: shared_file_root.to_string_lossy().into_owned(),
-            large_file_paths: crate::config::LargeFilePaths {
-                log_root_path: String::new(),
-                cache_root_path: String::new(),
-            },
+            large_file_paths: crate::config::LargeFilePaths { root_paths: Vec::new() },
             test_spec_config: TestSpecConfig::default(),
         };
 
@@ -2830,12 +2863,8 @@ mod tests {
             .await
             .expect("bootstrap zero-contribution config");
         assert_eq!(
-            bootstrapped.large_file_paths.log_root_path,
-            owner_log_root.to_string_lossy()
-        );
-        assert_eq!(
-            bootstrapped.large_file_paths.cache_root_path,
-            owner_cache_root.to_string_lossy()
+            bootstrapped.large_file_paths.root_paths,
+            vec![owner_large_root.to_string_lossy().into_owned()]
         );
         assert_eq!(
             bootstrapped.fluxonkv_spec.sub_cluster,
diff --git a/fluxon_rs/fluxon_kv/src/memholder/memholder_test.rs b/fluxon_rs/fluxon_kv/src/memholder/memholder_test.rs
index 5b260c3..625cb91 100644
--- a/fluxon_rs/fluxon_kv/src/memholder/memholder_test.rs
+++ b/fluxon_rs/fluxon_kv/src/memholder/memholder_test.rs
@@ -95,8 +95,7 @@ fn new_client_config_with_size(
         shared_memory_path: format!("/tmp/kvcache_shared_memory/{}", instance_key),
         shared_file_path: format!("/tmp/kvcache_shared_files/{}", instance_key),
         large_file_paths: crate::config::LargeFilePaths {
-            log_root_path: format!("/tmp/kvcache_large_logs/{}", instance_key),
-            cache_root_path: format!("/tmp/kvcache_large_cache/{}", instance_key),
+            root_paths: vec![format!("/tmp/kvcache_large/{}", instance_key)],
         },
         test_spec_config: TestSpecConfig::default(),
     }
@@ -131,10 +130,7 @@ fn new_zero_contribution_client_config(
         },
         shared_memory_path: format!("/tmp/kvcache_shared_memory/{}", owner_instance_key),
         shared_file_path: format!("/tmp/kvcache_shared_files/{}", owner_instance_key),
-        large_file_paths: crate::config::LargeFilePaths {
-            log_root_path: String::new(),
-            cache_root_path: String::new(),
-        },
+        large_file_paths: crate::config::LargeFilePaths { root_paths: Vec::new() },
         test_spec_config: TestSpecConfig::default(),
     }
 }
diff --git a/fluxon_rs/fluxon_util/src/log.rs b/fluxon_rs/fluxon_util/src/log.rs
index 648650f..fc6066f 100644
--- a/fluxon_rs/fluxon_util/src/log.rs
+++ b/fluxon_rs/fluxon_util/src/log.rs
@@ -342,13 +342,17 @@ pub fn latest_existing_daily_sharded_log_path(base_path: &Path) -> Option<PathBu
     let mut latest: Option<(chrono::NaiveDate, PathBuf)> = None;
     let entries = std::fs::read_dir(parent).ok()?;
     for entry in entries {
-        let entry = entry.ok()?;
+        let Ok(entry) = entry else {
+            continue;
+        };
         let path = entry.path();
         if !path.is_file() {
             continue;
         }
         let entry_name = entry.file_name();
-        let entry_name = entry_name.to_str()?;
+        let Some(entry_name) = entry_name.to_str() else {
+            continue;
+        };
         if !entry_name.starts_with(prefix.as_str()) || !entry_name.ends_with(".log") {
             continue;
         }
@@ -356,7 +360,9 @@ pub fn latest_existing_daily_sharded_log_path(base_path: &Path) -> Option<PathBu
             continue;
         }
         let date_text = &entry_name[prefix.len()..entry_name.len() - ".log".len()];
-        let date = chrono::NaiveDate::parse_from_str(date_text, "%Y-%m-%d").ok()?;
+        let Ok(date) = chrono::NaiveDate::parse_from_str(date_text, "%Y-%m-%d") else {
+            continue;
+        };
         let replace = match latest.as_ref() {
             Some((prev, _)) => date > *prev,
             None => true,
diff --git a/fluxon_rs/fluxon_util/tests/log_mgmt.rs b/fluxon_rs/fluxon_util/tests/log_mgmt.rs
index 03de37c..431c5fc 100644
--- a/fluxon_rs/fluxon_util/tests/log_mgmt.rs
+++ b/fluxon_rs/fluxon_util/tests/log_mgmt.rs
@@ -118,3 +118,17 @@ fn resolve_readable_log_path_ignores_plain_base_log_when_daily_shards_exist() {
     let resolved = fluxon_util::resolve_readable_log_path(&base_path).expect("resolve readable log path");
     assert_eq!(resolved, shard_path);
 }
+
+#[test]
+fn latest_existing_daily_sharded_log_path_skips_invalid_candidates() {
+    let temp_dir = TempDir::new().expect("create temp dir");
+    let base_path = temp_dir.path().join("demo.log");
+    let invalid_shard_path = temp_dir.path().join("demo.not-a-date.log");
+    let valid_shard_path = temp_dir.path().join("demo.2026-06-20.log");
+    fs::write(&invalid_shard_path, "invalid\n").expect("write invalid shard");
+    fs::write(&valid_shard_path, "valid\n").expect("write valid shard");
+
+    let resolved =
+        fluxon_util::latest_existing_daily_sharded_log_path(&base_path).expect("resolve latest shard");
+    assert_eq!(resolved, valid_shard_path);
+}
diff --git a/fluxon_test_stack/start_test_bed.py b/fluxon_test_stack/start_test_bed.py
index d2d2504..2b13d22 100644
--- a/fluxon_test_stack/start_test_bed.py
+++ b/fluxon_test_stack/start_test_bed.py
@@ -1513,6 +1513,23 @@ def _bare_service_runtime_log_path(*, local_node_cfg: dict[str, Any], service_na
     return root / "log" / f"{service_name}.log"
 
 
+def _resolve_bare_service_readable_runtime_log_path(
+    *,
+    local_node_cfg: dict[str, Any],
+    service_name: str,
+) -> Path | None:
+    runtime_log_path = _bare_service_runtime_log_path(
+        local_node_cfg=local_node_cfg,
+        service_name=service_name,
+    )
+    if runtime_log_path is None:
+        return None
+    resolved_log_path = log_shard.resolve_readable_log_path(runtime_log_path)
+    if resolved_log_path is not None:
+        return resolved_log_path
+    return runtime_log_path
+
+
 def _test_runner_ui_health_payload(*, probe_url: str, timeout_seconds: float) -> dict[str, Any] | None:
     req = urllib.request.Request(probe_url.rstrip("/") + "/health", method="GET")
     try:
@@ -3400,7 +3417,7 @@ def _collect_bare_runtime_statuses(
         raise ValueError("bare_launch_result.bootstrap_log_path must be a Path")
     statuses: list[dict[str, Any]] = []
     for service_name in expected_service_names:
-        runtime_log_path = _bare_service_runtime_log_path(
+        runtime_log_path = _resolve_bare_service_readable_runtime_log_path(
             local_node_cfg=local_node_cfg,
             service_name=service_name,
         )
diff --git a/skills/browser-helm/SKILL.md b/skills/browser-helm/SKILL.md
deleted file mode 100644
index dbe1afd..0000000
--- a/skills/browser-helm/SKILL.md
+++ /dev/null
@@ -1,232 +0,0 @@
----
-name: browser-helm
-description: Helm-only browser runtime workflow for operating Browser Helm managed tabs via `browser-helm`, with namespaced `browser` / `tab` / `page` / `picker` / `events` commands and namespaced `.tmp/browser-helm/` output conventions.
-allowed-tools: Bash(*)
----
-
-# 用 `browser-helm` 操作 Browser Helm 受控标签页
-
-当用户想通过 **Helm-only runtime** 操作浏览器，而不是使用通用 `agent-browser` 时，使用这个 skill。
-
-适用场景：
-
-- 需要列出已连接浏览器 / managed tab
-- 需要创建 managed tab 并 attach debugger
-- 需要执行 `page navigate` / `page click` / `page eval` / `page wait` / `page type` / `page press` / `page summary` / `page snapshot` / `page screenshot`
-- 需要通过 picker 获取/清空最近一次选中元素的 metadata（无需用户粘贴 JSON）
-- 需要遵守 `browser-helm` 当前的输出与落盘约定
-
-不适用场景：
-
-- 用户明确要用通用 `agent-browser` / noVNC 工作流
-- 用户只是要解释代码，不需要运行 `browser-helm`
-
-## 默认工作流（新主路径）
-
-默认 Base URL：`http://127.0.0.1:5181`（不需要设置环境变量）。
-
-如需覆盖（可选）：在命令前追加 `--base-url http://127.0.0.1:5181`。
-
-如本机未全局安装 `browser-helm`，也可以用 `node browser-helm/dist/cli.js` 替代下方命令。
-
-## 多人/多 AI 会话（互信）约定（重要）
-
-当前产品定位下，daemon / Web UI / WS **默认不做鉴权**，更偏向“同一局域网多人互信”的协作模型。
-
-但为了避免 **同一台浏览器 + 多个 AI 对话** 时出现“串台/误操作”，推荐强制使用 `session` 做操作隔离：
-
-- 每个 AI 对话固定用一个 `--session <name>`（或设置环境变量 `BROWSER_HELM_SESSION=<name>`）
-- `session` 会隔离：
-  - CLI context 落盘：`.tmp/browser-helm/context.json`（default）或 `.tmp/browser-helm/sessions/<session>/context.json`
-  - CLI 输出落盘：`.tmp/browser-helm/<type>/...`（default）或 `.tmp/browser-helm/sessions/<session>/<type>/...`
-  - `tab create` 会自动加前缀：`[session:<session>] ...`（用于人类/AI 识别归属）
-- `tab list --mine` 只在非 default session 下可用（通过 note 前缀过滤“我这条会话创建的 tab”）
-
-注意：`session` 只是“操作习惯/隔离约定”，**不是安全边界**。知道 `managed-tab-id` 仍然能跨 session 操作；不要把端口暴露到不可信网络。
-
-### 前置（必须）：安装插件并配对
-
-`browser-helm` 的所有浏览器动作都依赖 **Chrome 插件已连接 daemon（WebSocket）**：
-
-- 创建 managed tab 时建议提供 `--note <text>`，用于描述这个 tab 的意图/用途。
-  - 若省略 `--note` 且提供 URL，CLI 会自动生成：`打开页面：<url>`
-
-- 若 `browser-helm browser list` 一直为空，优先判断是「插件未安装/未 Connect」而不是 CLI 出错。
-
-一次性配对步骤：
-
-1) 启动 daemon
-
-```bash
-browser-helm daemon ensure
-```
-
-（可选）如需重启：
-
-```bash
-browser-helm daemon restart
-```
-
-2) 用 Chrome 打开 Web UI（用“Chrome 能访问到的地址”打开）
-
-- Web UI：`http://127.0.0.1:5181`
-- 页面上会显示 `Pairing Code`（推荐）以及 `WS URL`/`Pairing Token`（Advanced）
-
-3) 安装扩展（Unpacked）
-
-- 在 Web UI 点击“下载插件 zip”，解压
-- 打开 `chrome://extensions`，开启开发者模式
-- 点击“加载已解压的扩展程序”，选择解压后的目录
-
-4) 插件配对（Connect）
-
-- 打开扩展弹窗
-- 粘贴 Web UI 中的 `Pairing Code`，点击 `Connect`
-- （可选）点一次 `Status` 确认连接 OK
-- Advanced：也可手填 `WS URL` + `Pairing Token`
-
-5) CLI 验证插件已连接
-
-```bash
-browser-helm browser list
-```
-
-### 默认动作流
-
-1. 确保 `Browser Helm daemon` 已启动（AI 可通过 CLI 直接启动/拉起）
-
-```bash
-browser-helm daemon ensure
-```
-
-注：`daemon ensure` 会启动内置的预编译 daemon（当前提供 `linux-x64`），不要求用户安装 `cargo`。
-
-2. 确认扩展已连接，并列出浏览器
-
-```bash
-browser-helm browser list
-```
-
-（推荐）3. Pin 默认 browser/tab（减少长对话遗忘成本）
-
-```bash
-browser-helm context use-browser <browser-id>
-browser-helm context use-tab <managed-tab-id>
-browser-helm context show
-```
-
-4. 列 tab；如无 tab，则创建新 tab
-
-```bash
-browser-helm browser list
-browser-helm tab list <browser-id>
-browser-helm tab create <browser-id> https://example.com --note "说明这个 tab 的用途"
-```
-
-5. （可选）显式 `tab attach` debugger
-
-`tab create` / `page navigate` 已会自动 ensure debugger attach（用于更早捕获 network/console）。如果你准备在浏览器里手动刷新/导航，也建议先 `tab attach`。
-
-```bash
-browser-helm tab attach <browser-id> <managed-tab-id>
-```
-
-6. 页面分析优先走返回值主路
-
-```bash
-browser-helm page summary <browser-id> <managed-tab-id>
-browser-helm page snapshot <browser-id> <managed-tab-id>
-```
-
-7. 只有在需要留档时才显式保存 `page summary` / `page snapshot`
-
-```bash
-browser-helm --save page summary <browser-id> <managed-tab-id>
-browser-helm --save page snapshot <browser-id> <managed-tab-id>
-```
-
-8. `page screenshot` 默认会落盘；`page click` 会走受控页遮罩下的程序化点击
-
-```bash
-browser-helm page click <browser-id> <managed-tab-id> '#selector'
-browser-helm page click <browser-id> <managed-tab-id> '#selector' --wait-text 'Finished working' --timeout-ms 15000
-browser-helm page eval <browser-id> <managed-tab-id> '1+1'
-browser-helm page wait <browser-id> <managed-tab-id> --until-text 'Finished working' --timeout-ms 15000
-browser-helm page type <browser-id> <managed-tab-id> 'div[aria-label="Composer"]' 'hello'
-browser-helm page press <browser-id> <managed-tab-id> 'Enter'
-browser-helm page screenshot <browser-id> <managed-tab-id>
-```
-
-9. 推荐先 `page snapshot` 生成 `@iN` refs，再用 ref 操作（类似 agent-browser 的 `@eN`）
-
-```bash
-browser-helm page snapshot <browser-id> <managed-tab-id>
-browser-helm page click @i1
-browser-helm page type @i2 'hello'
-```
-
-9. 如用户在 SidePanel 做了元素选择（Start Picking），AI 可直接从 daemon 拉取最近一次选择结果
-
-```bash
-browser-helm picker last
-browser-helm picker clear
-```
-
-### 交互录制（用户手动复现）
-
-当你需要「AI 先打开受控 tab，然后用户自己操作复现问题，再让 AI 回看」时，可以开启交互录制：
-
-```bash
-# 记录起始时间（ms）
-t0=$(date +%s%3N)
-
-# 开始录制（会注入监听脚本，并临时隐藏遮罩，允许用户点击/输入）
-browser-helm recorder start <browser-id> <managed-tab-id>
-
-# ...用户在该 tab 上手动复现...
-
-# 拉取复现阶段的交互/console/network 事件（按 since 过滤）
-browser-helm events interaction <browser-id> <managed-tab-id> --since $t0 --limit 2000
-browser-helm events console <browser-id> <managed-tab-id> --since $t0 --limit 2000
-browser-helm events network <browser-id> <managed-tab-id> --since $t0 --limit 2000
-
-# 停止录制（恢复遮罩）
-browser-helm recorder stop <browser-id> <managed-tab-id>
-```
-
-注意：交互录制会包含 input 的原始 value（不脱敏）。仅建议在互信/本地环境使用。
-
-## 输出与落盘约定
-
-- `page summary`：默认只打印；传 `output-path` 或 `--save` 时，写入 `.tmp/browser-helm/summaries/`
-- `page snapshot`：默认只打印；传 `output-path` 或 `--save` 时，写入 `.tmp/browser-helm/snapshots/`
-- `page screenshot`：默认写入 `.tmp/browser-helm/screenshots/`
-- 若使用 `--session <name>` / `BROWSER_HELM_SESSION=<name>`：上述目录会自动切换到 `.tmp/browser-helm/sessions/<session>/...`
-- 如用户显式提供路径，优先使用用户路径
-
-## 命令参考
-
-详细命令与示例见：[`browser-helm/skills/browser-helm/references/commands.md`]
-
-优先顺序建议：
-
-1. `browser list`
-2. `tab list`
-3. `tab create`（推荐写 `--note`；若省略且提供 URL，则自动生成 note）
-   - 或：`tab adopt-active`（接管当前活动 tab）
-4. `tab attach`
-5. `page navigate`
-6. `page summary` / `page snapshot`
-7. `page click` / `page screenshot`
-
-
-## 目录约定
-
-- 项目内 skill 源目录：[`browser-helm/skills/browser-helm/`]
-- 仓库根入口：[`skills/browser-helm/`]
-
-
-## 命令约定
-
-- 仅支持 namespaced 命令面：`browser list`、`tab create`、`page navigate`、`picker last` 等。
-- 默认文档路径改为 namespaced 形式：`browser list`、`tab create`、`page navigate`、`events console`、`picker last`。
diff --git a/skills/browser-helm/agents/openai.yaml b/skills/browser-helm/agents/openai.yaml
deleted file mode 100644
index 686f428..0000000
--- a/skills/browser-helm/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: Browser Helm
-  short_description: 通过 Browser Helm 操作 Browser Helm 受控标签页流程
-  default_prompt: Use $browser-helm to inspect and operate Browser Helm managed tabs.
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/browser-helm/references/commands.md b/skills/browser-helm/references/commands.md
deleted file mode 100644
index d22d465..0000000
--- a/skills/browser-helm/references/commands.md
+++ /dev/null
@@ -1,131 +0,0 @@
-# `browser-helm` 命令参考
-
-## 前置（必须）：插件安装与配对
-
-CLI 能否操作浏览器，取决于 **Chrome 插件是否已连接 daemon（WebSocket）**。
-
-最小闭环步骤：
-
-```bash
-# 1) 启动/确保 daemon
-browser-helm daemon ensure
-browser-helm daemon status
-browser-helm daemon restart
-
-# 2) 在 Chrome 打开 Web UI（用 Chrome 能访问到的地址打开）
-#    http://127.0.0.1:5181
-#    从页面复制 Pairing Code（推荐；含多网卡候选地址）或 WS URL + Pairing Token（Advanced）
-#
-# 3) 安装扩展（Unpacked）
-#    - Web UI 下载插件 zip -> 解压
-#    - chrome://extensions 开启开发者模式 -> 加载已解压扩展
-#
-# 4) 插件弹窗填 Pairing Code -> Connect
-
-# 5) 验证浏览器已连接
-browser-helm browser list
-```
-
-## 基础命令（新主路径）
-
-```bash
-browser-helm daemon status
-browser-helm daemon ensure
-browser-helm daemon stop
-browser-helm daemon restart
-browser-helm status
-browser-helm browser list
-browser-helm tab list [browser-id] [--mine]
-browser-helm recorder start [browser-id] [managed-tab-id]
-browser-helm recorder stop [browser-id] [managed-tab-id]
-```
-
-## 受控 tab 生命周期
-
-```bash
-browser-helm tab create [browser-id] [url] [--note <text>]
-browser-helm tab adopt-active [browser-id] [--note <text>]
-browser-helm tab attach [browser-id] [managed-tab-id]
-browser-helm page navigate [browser-id] [managed-tab-id] <url>
-```
-
-## 交互与分析
-
-```bash
-browser-helm page click [browser-id] [managed-tab-id] <selector> [--wait-(selector|text|js) <value>] [--timeout-ms <n>] [--interval-ms <n>]
-browser-helm page eval [browser-id] [managed-tab-id] <expression>
-browser-helm page wait [browser-id] [managed-tab-id] --until-(selector|text|js) <value> [--timeout-ms <n>] [--interval-ms <n>]
-browser-helm page type [browser-id] [managed-tab-id] <selector> <text>
-browser-helm page press [browser-id] [managed-tab-id] <key>
-browser-helm page summary [browser-id] [managed-tab-id] [output-path]
-browser-helm page snapshot [browser-id] [managed-tab-id] [output-path]
-browser-helm page screenshot [browser-id] [managed-tab-id] [output-path]
-browser-helm events console [browser-id] [managed-tab-id] [--limit <n>] [--since <ms>]
-browser-helm events network [browser-id] [managed-tab-id] [--limit <n>] [--since <ms>]
-browser-helm events interaction [browser-id] [managed-tab-id] [--limit <n>] [--since <ms>]
-browser-helm picker last [browser-id] [managed-tab-id]
-browser-helm picker clear [browser-id] [managed-tab-id]
-```
-
-说明：
-
-- `page snapshot` 会生成可复用的 interactive refs：`@i1/@i2/...`（按 interactives 列表顺序）。
-- `page click/@iN`、`page type/@iN` 会把 ref 解析为 snapshot 中记录的 selector（落盘于 `.tmp/browser-helm/refs/<managed_tab_id>.json`，按 `--session` 隔离）。
-
-## Context（session-like，新主路径）
-
-长对话/长任务里，为了避免反复提供 `browser-id` / `managed-tab-id`，可以把默认对象写入本地 context：
-
-```bash
-browser-helm context use-browser <browser-id>
-browser-helm context use-tab <managed-tab-id>
-browser-helm context show
-browser-helm context clear
-```
-
-## 多 AI 对话隔离（推荐）
-
-为了避免“同一浏览器 + 多个 AI 对话”串台，建议为每条对话固定一个 `session`：
-
-```bash
-browser-helm --session chat-a browser list
-browser-helm --session chat-a tab list --mine
-browser-helm --session chat-a tab create <browser-id> https://example.com --note "这条对话的用途说明"
-```
-
-说明：
-
-- `tab create` 会自动加前缀：`[session:chat-a] ...`
-- `tab list --mine` 需要非 default session（否则会报错）
-
-## 输出约定
-
-- `page summary`
-  - 默认只打印
-  - `--save` 时默认落到 [`.tmp/browser-helm/summaries/`]
-- `page snapshot`
-  - 默认只打印
-  - `--save` 时默认落到 [`.tmp/browser-helm/snapshots/`]
-- `page screenshot`
-  - 默认落到 [`.tmp/browser-helm/screenshots/`]
-- 若使用 `--session <name>` / `BROWSER_HELM_SESSION=<name>`：上述目录会自动切换到 [`.tmp/browser-helm/sessions/<session>/...`]
-
-## 推荐示例
-
-```bash
-browser-helm browser list
-browser-helm tab create <browser-id> https://example.com --note "说明这个 tab 的用途"
-browser-helm tab attach <browser-id> <managed-tab-id>
-browser-helm page snapshot <browser-id> <managed-tab-id>
-browser-helm --save page summary <browser-id> <managed-tab-id>
-browser-helm page screenshot <browser-id> <managed-tab-id>
-```
-
-说明：
-
-- `tab create` 若省略 `--note` 且提供 URL，会自动生成：`打开页面：<url>`
-
-## 命令约定
-
-- 仅支持 namespaced 命令面：`browser list`、`tab create`、`tab attach`、`page navigate`、`picker last` 等。
-- 文档与 skill 后续默认都以 namespaced 命令作为主路径。
diff --git a/skills/canvas-dag_organizer-v1/SKILL.md b/skills/canvas-dag_organizer-v1/SKILL.md
deleted file mode 100644
index db3dc0d..0000000
--- a/skills/canvas-dag_organizer-v1/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "canvas-dag_organizer-v1"
-description: "Canvas DAG Organizer v1"
-metadata:
-  short-description: "Canvas DAG Organizer v1"
----
-
-# Canvas DAG Organizer v1
-
-你是「Canvas DAG 可读性优化专家」(canvas_dag_organizer)。\n你的目标：基于当前 canvas 内容与 DAG（causal/timeline edges）结构，决定如何拆分/分组/调整空间布局，以最大化可读性。\n\n硬约束（必须遵守）：\n- 禁止要求用户手工编辑 `.canvas` / `.canvas.ext` JSON。\n- 你不能执行任何命令；你只能输出一个严格 JSON 对象（不要 markdown、不要 code fence、不要额外文本）。\n- 你输出的修改必须是“可复现/确定性”的（同一输入得到同一输出）。\n\n你会收到：\n- path + expectedCanvasSha256（并发保护）\n- scopeNodes / scopeEdges（允许你改动的子图范围）\n- 每个节点的 effective rect（考虑 ext.dx/dy/scale）\n\n你的输出 JSON schema（version=1）：\n{\n  "version": 1,\n  "kind": "canvas_dag_organize_apply_v1",\n  "path": "<same as input.path>",\n  "expectedCanvasSha256": "<same as input.expectedCanvasSha256>",\n  "summary": "一句话总结你做了什么（用于 UI 提示）",\n  "ops": [\n    // CanvasOpsRequestV1.ops: op=upsert_node|delete_node|upsert_edge|delete_edge\n  ]\n}\n\n重要规则：\n- 只允许改动 scope 内的 existing session nodes（移动/尺寸/文本等）与 existing edges。\n- 允许创建 group 节点用于分区（id 必须以 "group-" 开头；type="group"）。\n- 禁止删除任何 session 节点（dever_kind=session）。\n- 如果你删除 node，必须同时删除所有引用它的 edges（否则服务端会拒绝 apply）。\n- 优先做：分组 + 分层/泳道 + 对齐 + 留白；不要盲目网格化。
diff --git a/skills/canvas-dag_organizer-v1/agents/openai.yaml b/skills/canvas-dag_organizer-v1/agents/openai.yaml
deleted file mode 100644
index f7ffc0e..0000000
--- a/skills/canvas-dag_organizer-v1/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "Canvas DAG Organizer v1"
-  short_description: "Canvas DAG Organizer v1"
-  default_prompt: "Use $canvas-dag_organizer-v1."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/canvas-ops-v1/SKILL.md b/skills/canvas-ops-v1/SKILL.md
deleted file mode 100644
index ffa8017..0000000
--- a/skills/canvas-ops-v1/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "canvas-ops-v1"
-description: "Canvas Ops v1"
-metadata:
-  short-description: "Canvas Ops v1"
----
-
-# Canvas Ops v1
-
-你是「Canvas 文件操作助手」(canvas_ops)。\n你的目标：对 `*.canvas` / `*.canvas.ext` 的任何修改，都必须通过项目内的脚本执行；禁止手工编辑 JSON。\n\n唯一允许的执行入口：\n- `.dever/tools/canvas_ops/canvas_ops.sh`\n- 配置：`.dever/tools/canvas_ops/config.json`\n\n硬约束：\n- 你只能生成 `apply` 需要的 request JSON（version=1），并给出一条可执行命令来调用脚本。\n- 禁止直接输出/粘贴完整 `.canvas` 内容作为“修改后的文件”。\n- 如果需要删除 node：必须同时显式删除所有依赖该 node 的 edges（否则脚本会拒绝执行）。\n\n你的输出格式（两段，且仅两段）：\n(1) request JSON（纯 JSON，不要 markdown，不要 code fence）\n(2) 一段 bash 命令（用 heredoc 把 JSON 送进脚本；命令内必须显式传 `-w` 与 `-c`）\n\n命令模板（把 <WORKDIR> 替换为项目根；一般是 `.`）：\n.dever/tools/canvas_ops/canvas_ops.sh apply -w <WORKDIR> -c .dever/tools/canvas_ops/config.json --request-stdin <<'JSON'\n{...}\nJSON\n\n建议（可选）：命令后再跑一次 validate，确认写盘结果可读且 ext sha 一致。
diff --git a/skills/canvas-ops-v1/agents/openai.yaml b/skills/canvas-ops-v1/agents/openai.yaml
deleted file mode 100644
index 5566cff..0000000
--- a/skills/canvas-ops-v1/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: Canvas Ops v1
-  short_description: Canvas Ops v1
-  default_prompt: Use $canvas-ops-v1.
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/canvas-tidy_selection-v1/SKILL.md b/skills/canvas-tidy_selection-v1/SKILL.md
deleted file mode 100644
index 0dbfdf1..0000000
--- a/skills/canvas-tidy_selection-v1/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "canvas-tidy_selection-v1"
-description: "Canvas Tidy Selection v1"
-metadata:
-  short-description: "Canvas Tidy Selection v1"
----
-
-# Canvas Tidy Selection v1
-
-你是「Canvas 会话块整理专家」(canvas_tidy_selection)。\n你的目标：为“画布上选中的会话块”提供一键自动整理（确定性布局、可复现）。\n\n硬约束：\n- 禁止建议用户手工编辑 `.canvas` / `.canvas.ext` JSON。\n- 不要输出“修改后的完整 canvas 文件内容”。\n- 你只能输出（两段，且仅两段）：\n  (1) request JSON（纯 JSON，不要 markdown，不要 code fence）\n  (2) 一条 curl 命令（向 manager 的 tidy_selection API 发请求）。\n\n请求/响应（V1）约定：\n- Endpoint: POST /api/projects/:projectId/canvas/tidy_selection\n- request JSON schema (version=1):\n  - version: 1\n  - path: string  (project root 下的相对路径，必须以 .canvas 结尾)\n  - expectedCanvasSha256: string  (并发保护；必须来自最新 load 响应的 canvas_sha256)\n  - selectedSessionIds: string[]  (选中的会话块 node id 列表；会去重并保持稳定顺序)\n  - layout: { kind: "grid_sqrt_v1"; gapX: number; gapY: number }\n  - anchor: { kind: "keep_bounds_topleft_v1" }\n  - resetConnectedEdgeRoutes: boolean  (true 表示清空相关连线 ext 路由，回到默认路由)\n\ncurl 模板（把 <PROJECT_ID> 替换为实际 id）：\ncurl -sS -X POST 'http://localhost:8788/api/projects/<PROJECT_ID>/canvas/tidy_selection' \\n  -H 'Content-Type: application/json' \\n  -d '<REQUEST_JSON>'\n\n输出策略：\n- 不要向用户提问；基于已给信息直接产出最强可执行请求。\n- 若关键信息缺失（例如 projectId/path/sha/selected ids），在 request JSON 中用空值占位，并在 curl 命令中保留 <...> 占位符。
diff --git a/skills/canvas-tidy_selection-v1/agents/openai.yaml b/skills/canvas-tidy_selection-v1/agents/openai.yaml
deleted file mode 100644
index 120f1ac..0000000
--- a/skills/canvas-tidy_selection-v1/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "Canvas Tidy Selection v1"
-  short_description: "Canvas Tidy Selection v1"
-  default_prompt: "Use $canvas-tidy_selection-v1."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/find-skills/SKILL.md b/skills/find-skills/SKILL.md
deleted file mode 100644
index c797184..0000000
--- a/skills/find-skills/SKILL.md
+++ /dev/null
@@ -1,133 +0,0 @@
----
-name: find-skills
-description: Helps users discover and install agent skills when they ask questions like "how do I do X", "find a skill for X", "is there a skill that can...", or express interest in extending capabilities. This skill should be used when the user is looking for functionality that might exist as an installable skill.
----
-
-# Find Skills
-
-This skill helps you discover and install skills from the open agent skills ecosystem.
-
-## When to Use This Skill
-
-Use this skill when the user:
-
-- Asks "how do I do X" where X might be a common task with an existing skill
-- Says "find a skill for X" or "is there a skill for X"
-- Asks "can you do X" where X is a specialized capability
-- Expresses interest in extending agent capabilities
-- Wants to search for tools, templates, or workflows
-- Mentions they wish they had help with a specific domain (design, testing, deployment, etc.)
-
-## What is the Skills CLI?
-
-The Skills CLI (`npx skills`) is the package manager for the open agent skills ecosystem. Skills are modular packages that extend agent capabilities with specialized knowledge, workflows, and tools.
-
-**Key commands:**
-
-- `npx skills find [query]` - Search for skills interactively or by keyword
-- `npx skills add <package>` - Install a skill from GitHub or other sources
-- `npx skills check` - Check for skill updates
-- `npx skills update` - Update all installed skills
-
-**Browse skills at:** https://skills.sh/
-
-## How to Help Users Find Skills
-
-### Step 1: Understand What They Need
-
-When a user asks for help with something, identify:
-
-1. The domain (e.g., React, testing, design, deployment)
-2. The specific task (e.g., writing tests, creating animations, reviewing PRs)
-3. Whether this is a common enough task that a skill likely exists
-
-### Step 2: Search for Skills
-
-Run the find command with a relevant query:
-
-```bash
-npx skills find [query]
-```
-
-For example:
-
-- User asks "how do I make my React app faster?" → `npx skills find react performance`
-- User asks "can you help me with PR reviews?" → `npx skills find pr review`
-- User asks "I need to create a changelog" → `npx skills find changelog`
-
-The command will return results like:
-
-```
-Install with npx skills add <owner/repo@skill>
-
-vercel-labs/agent-skills@vercel-react-best-practices
-└ https://skills.sh/vercel-labs/agent-skills/vercel-react-best-practices
-```
-
-### Step 3: Present Options to the User
-
-When you find relevant skills, present them to the user with:
-
-1. The skill name and what it does
-2. The install command they can run
-3. A link to learn more at skills.sh
-
-Example response:
-
-```
-I found a skill that might help! The "vercel-react-best-practices" skill provides
-React and Next.js performance optimization guidelines from Vercel Engineering.
-
-To install it:
-npx skills add vercel-labs/agent-skills@vercel-react-best-practices
-
-Learn more: https://skills.sh/vercel-labs/agent-skills/vercel-react-best-practices
-```
-
-### Step 4: Offer to Install
-
-If the user wants to proceed, you can install the skill for them:
-
-```bash
-npx skills add <owner/repo@skill> -g -y
-```
-
-The `-g` flag installs globally (user-level) and `-y` skips confirmation prompts.
-
-## Common Skill Categories
-
-When searching, consider these common categories:
-
-| Category        | Example Queries                          |
-| --------------- | ---------------------------------------- |
-| Web Development | react, nextjs, typescript, css, tailwind |
-| Testing         | testing, jest, playwright, e2e           |
-| DevOps          | deploy, docker, kubernetes, ci-cd        |
-| Documentation   | docs, readme, changelog, api-docs        |
-| Code Quality    | review, lint, refactor, best-practices   |
-| Design          | ui, ux, design-system, accessibility     |
-| Productivity    | workflow, automation, git                |
-
-## Tips for Effective Searches
-
-1. **Use specific keywords**: "react testing" is better than just "testing"
-2. **Try alternative terms**: If "deploy" doesn't work, try "deployment" or "ci-cd"
-3. **Check popular sources**: Many skills come from `vercel-labs/agent-skills` or `ComposioHQ/awesome-claude-skills`
-
-## When No Skills Are Found
-
-If no relevant skills exist:
-
-1. Acknowledge that no existing skill was found
-2. Offer to help with the task directly using your general capabilities
-3. Suggest the user could create their own skill with `npx skills init`
-
-Example:
-
-```
-I searched for skills related to "xyz" but didn't find any matches.
-I can still help you with this task directly! Would you like me to proceed?
-
-If this is something you do often, you could create your own skill:
-npx skills init my-xyz-skill
-```
diff --git a/skills/imagegen/LICENSE.txt b/skills/imagegen/LICENSE.txt
deleted file mode 100644
index 13e25df..0000000
--- a/skills/imagegen/LICENSE.txt
+++ /dev/null
@@ -1,201 +0,0 @@
-Apache License
-Version 2.0, January 2004
-http://www.apache.org/licenses/
-
-TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-1. Definitions.
-
-   "License" shall mean the terms and conditions for use, reproduction,
-   and distribution as defined by Sections 1 through 9 of this document.
-
-   "Licensor" shall mean the copyright owner or entity authorized by
-   the copyright owner that is granting the License.
-
-   "Legal Entity" shall mean the union of the acting entity and all
-   other entities that control, are controlled by, or are under common
-   control with that entity. For the purposes of this definition,
-   "control" means (i) the power, direct or indirect, to cause the
-   direction or management of such entity, whether by contract or
-   otherwise, or (ii) ownership of fifty percent (50%) or more of the
-   outstanding shares, or (iii) beneficial ownership of such entity.
-
-   "You" (or "Your") shall mean an individual or Legal Entity
-   exercising permissions granted by this License.
-
-   "Source" form shall mean the preferred form for making modifications,
-   including but not limited to software source code, documentation
-   source, and configuration files.
-
-   "Object" form shall mean any form resulting from mechanical
-   transformation or translation of a Source form, including but
-   not limited to compiled object code, generated documentation,
-   and conversions to other media types.
-
-   "Work" shall mean the work of authorship, whether in Source or
-   Object form, made available under the License, as indicated by a
-   copyright notice that is included in or attached to the work
-   (an example is provided in the Appendix below).
-
-   "Derivative Works" shall mean any work, whether in Source or Object
-   form, that is based on (or derived from) the Work and for which the
-   editorial revisions, annotations, elaborations, or other modifications
-   represent, as a whole, an original work of authorship. For the purposes
-   of this License, Derivative Works shall not include works that remain
-   separable from, or merely link (or bind by name) to the interfaces of,
-   the Work and Derivative Works thereof.
-
-   "Contribution" shall mean any work of authorship, including
-   the original version of the Work and any modifications or additions
-   to that Work or Derivative Works thereof, that is intentionally
-   submitted to Licensor for inclusion in the Work by the copyright owner
-   or by an individual or Legal Entity authorized to submit on behalf of
-   the copyright owner. For the purposes of this definition, "submitted"
-   means any form of electronic, verbal, or written communication sent
-   to the Licensor or its representatives, including but not limited to
-   communication on electronic mailing lists, source code control systems,
-   and issue tracking systems that are managed by, or on behalf of, the
-   Licensor for the purpose of discussing and improving the Work, but
-   excluding communication that is conspicuously marked or otherwise
-   designated in writing by the copyright owner as "Not a Contribution."
-
-   "Contributor" shall mean Licensor and any individual or Legal Entity
-   on behalf of whom a Contribution has been received by Licensor and
-   subsequently incorporated within the Work.
-
-2. Grant of Copyright License. Subject to the terms and conditions of
-   this License, each Contributor hereby grants to You a perpetual,
-   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-   copyright license to reproduce, prepare Derivative Works of,
-   publicly display, publicly perform, sublicense, and distribute the
-   Work and such Derivative Works in Source or Object form.
-
-3. Grant of Patent License. Subject to the terms and conditions of
-   this License, each Contributor hereby grants to You a perpetual,
-   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-   (except as stated in this section) patent license to make, have made,
-   use, offer to sell, sell, import, and otherwise transfer the Work,
-   where such license applies only to those patent claims licensable
-   by such Contributor that are necessarily infringed by their
-   Contribution(s) alone or by combination of their Contribution(s)
-   with the Work to which such Contribution(s) was submitted. If You
-   institute patent litigation against any entity (including a
-   cross-claim or counterclaim in a lawsuit) alleging that the Work
-   or a Contribution incorporated within the Work constitutes direct
-   or contributory patent infringement, then any patent licenses
-   granted to You under this License for that Work shall terminate
-   as of the date such litigation is filed.
-
-4. Redistribution. You may reproduce and distribute copies of the
-   Work or Derivative Works thereof in any medium, with or without
-   modifications, and in Source or Object form, provided that You
-   meet the following conditions:
-
-   (a) You must give any other recipients of the Work or
-       Derivative Works a copy of this License; and
-
-   (b) You must cause any modified files to carry prominent notices
-       stating that You changed the files; and
-
-   (c) You must retain, in the Source form of any Derivative Works
-       that You distribute, all copyright, patent, trademark, and
-       attribution notices from the Source form of the Work,
-       excluding those notices that do not pertain to any part of
-       the Derivative Works; and
-
-   (d) If the Work includes a "NOTICE" text file as part of its
-       distribution, then any Derivative Works that You distribute must
-       include a readable copy of the attribution notices contained
-       within such NOTICE file, excluding those notices that do not
-       pertain to any part of the Derivative Works, in at least one
-       of the following places: within a NOTICE text file distributed
-       as part of the Derivative Works; within the Source form or
-       documentation, if provided along with the Derivative Works; or,
-       within a display generated by the Derivative Works, if and
-       wherever such third-party notices normally appear. The contents
-       of the NOTICE file are for informational purposes only and
-       do not modify the License. You may add Your own attribution
-       notices within Derivative Works that You distribute, alongside
-       or as an addendum to the NOTICE text from the Work, provided
-       that such additional attribution notices cannot be construed
-       as modifying the License.
-
-   You may add Your own copyright statement to Your modifications and
-   may provide additional or different license terms and conditions
-   for use, reproduction, or distribution of Your modifications, or
-   for any such Derivative Works as a whole, provided Your use,
-   reproduction, and distribution of the Work otherwise complies with
-   the conditions stated in this License.
-
-5. Submission of Contributions. Unless You explicitly state otherwise,
-   any Contribution intentionally submitted for inclusion in the Work
-   by You to the Licensor shall be under the terms and conditions of
-   this License, without any additional terms or conditions.
-   Notwithstanding the above, nothing herein shall supersede or modify
-   the terms of any separate license agreement you may have executed
-   with Licensor regarding such Contributions.
-
-6. Trademarks. This License does not grant permission to use the trade
-   names, trademarks, service marks, or product names of the Licensor,
-   except as required for reasonable and customary use in describing the
-   origin of the Work and reproducing the content of the NOTICE file.
-
-7. Disclaimer of Warranty. Unless required by applicable law or
-   agreed to in writing, Licensor provides the Work (and each
-   Contributor provides its Contributions) on an "AS IS" BASIS,
-   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-   implied, including, without limitation, any warranties or conditions
-   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-   PARTICULAR PURPOSE. You are solely responsible for determining the
-   appropriateness of using or redistributing the Work and assume any
-   risks associated with Your exercise of permissions under this License.
-
-8. Limitation of Liability. In no event and under no legal theory,
-   whether in tort (including negligence), contract, or otherwise,
-   unless required by applicable law (such as deliberate and grossly
-   negligent acts) or agreed to in writing, shall any Contributor be
-   liable to You for damages, including any direct, indirect, special,
-   incidental, or consequential damages of any character arising as a
-   result of this License or out of the use or inability to use the
-   Work (including but not limited to damages for loss of goodwill,
-   work stoppage, computer failure or malfunction, or any and all
-   other commercial damages or losses), even if such Contributor
-   has been advised of the possibility of such damages.
-
-9. Accepting Warranty or Additional Liability. While redistributing
-   the Work or Derivative Works thereof, You may choose to offer,
-   and charge a fee for, acceptance of support, warranty, indemnity,
-   or other liability obligations and/or rights consistent with this
-   License. However, in accepting such obligations, You may act only
-   on Your own behalf and on Your sole responsibility, not on behalf of
-   any other Contributor, and only if You agree to indemnify,
-   defend, and hold each Contributor harmless for any liability
-   incurred by, or claims asserted against, such Contributor by reason
-   of your accepting any such warranty or additional liability.
-
-END OF TERMS AND CONDITIONS
-
-APPENDIX: How to apply the Apache License to your work.
-
-   To apply the Apache License to your work, attach the following
-   boilerplate notice, with the fields enclosed by brackets "[]"
-   replaced with your own identifying information. (Don\'t include
-   the brackets!)  The text should be enclosed in the appropriate
-   comment syntax for the file format. We also recommend that a
-   file or class name and description of purpose be included on the
-   same "printed page" as the copyright notice for easier
-   identification within third-party archives.
-
-Copyright [yyyy] [name of copyright owner]
-
-Licensed under the Apache License, Version 2.0 (the "License");
-you may not use this file except in compliance with the License.
-You may obtain a copy of the License at
-
-    http://www.apache.org/licenses/LICENSE-2.0
-
-Unless required by applicable law or agreed to in writing, software
-distributed under the License is distributed on an "AS IS" BASIS,
-WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-See the License for the specific language governing permissions and
-limitations under the License.
diff --git a/skills/imagegen/SKILL.md b/skills/imagegen/SKILL.md
deleted file mode 100644
index 4285e5e..0000000
--- a/skills/imagegen/SKILL.md
+++ /dev/null
@@ -1,356 +0,0 @@
----
-name: "imagegen"
-description: "Generate or edit raster images when the task benefits from AI-created bitmap visuals such as photos, illustrations, textures, sprites, mockups, or transparent-background cutouts. Use when Codex should create a brand-new image, transform an existing image, or derive visual variants from references, and the output should be a bitmap asset rather than repo-native code or vector. Do not use when the task is better handled by editing existing SVG/vector/code-native assets, extending an established icon or logo system, or building the visual directly in HTML/CSS/canvas."
----
-
-# Image Generation Skill
-
-Generates or edits images for the current project (for example website assets, game assets, UI mockups, product mockups, wireframes, logo design, photorealistic images, or infographics).
-
-## Top-level modes and rules
-
-This skill has exactly two top-level modes:
-
-- **Default built-in tool mode (preferred):** built-in `image_gen` tool for normal image generation, editing, and simple transparent-image requests. Does not require `OPENAI_API_KEY`.
-- **Fallback CLI mode:** `scripts/image_gen.py` CLI. Use when the user explicitly asks for the CLI/API/model path, or after the user explicitly confirms a true model-native transparency fallback with `gpt-image-1.5`. Requires `OPENAI_API_KEY`.
-
-Within CLI fallback, the CLI exposes three subcommands:
-
-- `generate`
-- `edit`
-- `generate-batch`
-
-Rules:
-- Use the built-in `image_gen` tool by default for normal image generation and editing requests.
-- Do not switch to CLI fallback for ordinary quality, size, or file-path control.
-- If the user explicitly asks for a transparent image/background, stay on built-in `image_gen` first: prompt for a flat removable chroma-key background, then remove it locally with the installed helper at `$CODEX_HOME/skills/.system/imagegen/scripts/remove_chroma_key.py`.
-- Never silently switch from built-in `image_gen` or CLI `gpt-image-2` to CLI `gpt-image-1.5`. Treat this as a model/path downgrade and ask the user before doing it, unless the user has already explicitly requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback.
-- If a transparent request appears too complex for clean chroma-key removal, asks for true/native transparency, or local removal fails validation, explain that true transparency requires CLI `gpt-image-1.5 --background transparent --output-format png` because `gpt-image-2` does not support `background=transparent`, then ask whether to proceed. Run the CLI fallback only after the user confirms.
-- The word `batch` by itself does not mean CLI fallback. If the user asks for many assets or says to batch-generate assets without explicitly asking for CLI/API/model controls, stay on the built-in path and issue one built-in call per requested asset or variant.
-- If the built-in tool fails or is unavailable, tell the user the CLI fallback exists and that it requires `OPENAI_API_KEY`. Proceed only if the user explicitly asks for that fallback.
-- If the user explicitly asks for CLI mode, use the bundled `scripts/image_gen.py` workflow. Do not create one-off SDK runners.
-- Never modify `scripts/image_gen.py`. If something is missing, ask the user before doing anything else.
-
-Built-in save-path policy:
-- In built-in tool mode, Codex saves generated images under `$CODEX_HOME/*` by default.
-- Do not describe or rely on OS temp as the default built-in destination.
-- Do not describe or rely on a destination-path argument (if any) on the built-in `image_gen` tool. If a specific location is needed, generate first and then move or copy the selected output from `$CODEX_HOME/generated_images/...`.
-- Save-path precedence in built-in mode:
-  1. If the user names a destination, move or copy the selected output there.
-  2. If the image is meant for the current project, move or copy the final selected image into the workspace before finishing.
-  3. If the image is only for preview or brainstorming, render it inline; the underlying file can remain at the default `$CODEX_HOME/*` path.
-- Never leave a project-referenced asset only at the default `$CODEX_HOME/*` path.
-- Do not overwrite an existing asset unless the user explicitly asked for replacement; otherwise create a sibling versioned filename such as `hero-v2.png` or `item-icon-edited.png`.
-
-Shared prompt guidance for both modes lives in `references/prompting.md` and `references/sample-prompts.md`.
-
-Fallback-only docs/resources for CLI mode:
-- `references/cli.md`
-- `references/image-api.md`
-- `references/codex-network.md`
-- `scripts/image_gen.py`
-
-Local post-processing helper:
-- `$CODEX_HOME/skills/.system/imagegen/scripts/remove_chroma_key.py`: removes a flat chroma-key background from a generated image and writes a PNG/WebP with alpha. Prefer auto-key sampling, soft matte, and despill for antialiased edges.
-
-## When to use
-- Generate a new image (concept art, product shot, cover, website hero)
-- Generate a new image using one or more reference images for style, composition, or mood
-- Edit an existing image (inpainting, lighting or weather transformations, background replacement, object removal, compositing, transparent background)
-- Produce many assets or variants for one task
-
-## When not to use
-- Extending or matching an existing SVG/vector icon set, logo system, or illustration library inside the repo
-- Creating simple shapes, diagrams, wireframes, or icons that are better produced directly in SVG, HTML/CSS, or canvas
-- Making a small project-local asset edit when the source file already exists in an editable native format
-- Any task where the user clearly wants deterministic code-native output instead of a generated bitmap
-
-## Decision tree
-
-Think about two separate questions:
-
-1. **Intent:** is this a new image or an edit of an existing image?
-2. **Execution strategy:** is this one asset or many assets/variants?
-
-Intent:
-- If the user wants to modify an existing image while preserving parts of it, treat the request as **edit**.
-- If the user provides images only as references for style, composition, mood, or subject guidance, treat the request as **generate**.
-- If the user provides no images, treat the request as **generate**.
-
-Built-in edit semantics:
-- Built-in edit mode is for images already visible in the conversation context, such as attached images or images generated earlier in the thread.
-- If the user wants to edit a local image file with the built-in tool, first load it with built-in `view_image` tool so the image is visible in the conversation context, then proceed with the built-in edit flow.
-- Do not promise arbitrary filesystem-path editing through the built-in tool.
-- If a local file still needs direct file-path control, masks, or other explicit CLI-only parameters, use the explicit CLI fallback only when the user asks for it.
-- For edits, preserve invariants aggressively and save non-destructively by default.
-
-Execution strategy:
-- In the built-in default path, produce many assets or variants by issuing one `image_gen` call per requested asset or variant.
-- In the CLI fallback path, use the CLI `generate-batch` subcommand only when the user explicitly chose CLI mode and needs many prompts/assets.
-- For many distinct assets, do not use `n` as a substitute for separate prompts. `n` is for variants of one prompt; distinct assets need distinct built-in calls or distinct CLI `generate-batch` jobs.
-
-Assume the user wants a new image unless they clearly ask to change an existing one.
-
-## Workflow
-1. Decide the top-level mode: built-in by default, including simple transparent-output requests; fallback CLI only if explicitly requested or after the user explicitly confirms a transparent-output fallback.
-2. Decide the intent: `generate` or `edit`.
-3. Decide whether the output is preview-only or meant to be consumed by the current project.
-4. Decide the execution strategy: single asset vs repeated built-in calls vs CLI `generate-batch`.
-5. Collect inputs up front: prompt(s), exact text (verbatim), constraints/avoid list, and any input images.
-6. For every input image, label its role explicitly:
-   - reference image
-   - edit target
-   - supporting insert/style/compositing input
-7. If the edit target is only on the local filesystem and you are staying on the built-in path, inspect it with `view_image` first so the image is available in conversation context.
-8. If the user asked for a photo, illustration, sprite, product image, banner, or other explicitly raster-style asset, use `image_gen` rather than substituting SVG/HTML/CSS placeholders. If the request is for an icon, logo, or UI graphic that should match existing repo-native SVG/vector/code assets, prefer editing those directly instead.
-9. Augment the prompt based on specificity:
-   - If the user's prompt is already specific and detailed, normalize it into a clear spec without adding creative requirements.
-   - If the user's prompt is generic, add tasteful augmentation only when it materially improves output quality.
-10. Use the built-in `image_gen` tool by default.
-11. For transparent-output requests, follow the transparent image guidance below: generate with built-in `image_gen` on a flat chroma-key background, copy the selected output into the workspace or `tmp/imagegen/`, run the installed `$CODEX_HOME/skills/.system/imagegen/scripts/remove_chroma_key.py` helper, and validate the alpha result before using it. If this path looks unsuitable or fails, ask before switching to CLI `gpt-image-1.5`.
-12. Inspect outputs and validate: subject, style, composition, text accuracy, and invariants/avoid items.
-13. Iterate with a single targeted change, then re-check.
-14. For preview-only work, render the image inline; the underlying file may remain at the default `$CODEX_HOME/generated_images/...` path.
-15. For project-bound work, move or copy the selected artifact into the workspace and update any consuming code or references. Never leave a project-referenced asset only at the default `$CODEX_HOME/generated_images/...` path.
-16. For batches or multi-asset requests, persist every requested deliverable final in the workspace unless the user explicitly asked to keep outputs preview-only. Discarded variants do not need to be kept unless requested.
-17. If the user explicitly chooses or confirms the CLI fallback, then use the fallback-only docs for model, quality, size, `input_fidelity`, masks, output format, output paths, and network setup.
-18. Always report the final saved path(s) for any workspace-bound asset(s), plus the final prompt or prompt set and whether the built-in tool or fallback CLI mode was used.
-
-## Transparent image requests
-
-Transparent-image requests still use built-in `image_gen` first. Because the built-in tool does not expose a true transparent-background control, create a removable chroma-key source image and then convert the key color to alpha locally.
-
-Default sequence:
-1. Use built-in `image_gen` to generate the requested subject on a perfectly flat solid chroma-key background.
-2. Choose a key color that is unlikely to appear in the subject: default `#00ff00`, use `#ff00ff` for green subjects, and avoid `#0000ff` for blue subjects.
-3. After generation, move or copy the selected source image from `$CODEX_HOME/generated_images/...` into the workspace or `tmp/imagegen/`.
-4. Run the installed helper path, not a project-relative script path:
-   ```bash
-   python "${CODEX_HOME:-$HOME/.codex}/skills/.system/imagegen/scripts/remove_chroma_key.py" \
-     --input <source> \
-     --out <final.png> \
-     --auto-key border \
-     --soft-matte \
-     --transparent-threshold 12 \
-     --opaque-threshold 220 \
-     --despill
-   ```
-5. Validate that the output has an alpha channel, transparent corners, plausible subject coverage, and no obvious key-color fringe. If a thin fringe remains, retry once with `--edge-contract 1`; use `--edge-feather 0.25` only when the edge is visibly stair-stepped and the subject is not shiny or reflective.
-6. Save the final alpha PNG/WebP in the project if the asset is project-bound. Never leave a project-referenced transparent asset only under `$CODEX_HOME/*`.
-
-Prompt transparent requests like this:
-
-```text
-Create the requested subject on a perfectly flat solid #00ff00 chroma-key background for background removal.
-The background must be one uniform color with no shadows, gradients, texture, reflections, floor plane, or lighting variation.
-Keep the subject fully separated from the background with crisp edges and generous padding.
-Do not use #00ff00 anywhere in the subject.
-No cast shadow, no contact shadow, no reflection, no watermark, and no text unless explicitly requested.
-```
-
-Do not automatically use CLI `gpt-image-1.5 --background transparent --output-format png` instead of chroma keying. Ask the user first when the user asks for true/native transparency, when local removal fails validation, or when the requested image is complex: hair, fur, feathers, smoke, glass, liquids, translucent materials, reflective objects, soft shadows, realistic product grounding, or subject colors that conflict with all practical key colors.
-
-Use a concise confirmation like:
-
-```text
-This likely needs true native transparency. The default built-in path uses a chroma-key background plus local removal, but true transparency requires the CLI fallback with gpt-image-1.5 because gpt-image-2 does not support background=transparent. It also requires OPENAI_API_KEY. Should I proceed with that CLI fallback?
-```
-
-## Prompt augmentation
-
-Reformat user prompts into a structured, production-oriented spec. Make the user's goal clearer and more actionable, but do not blindly add detail.
-
-Treat this as prompt-shaping guidance, not a closed schema. Use only the lines that help, and add a short extra labeled line when it materially improves clarity.
-
-### Specificity policy
-
-Use the user's prompt specificity to decide how much augmentation is appropriate:
-
-- If the prompt is already specific and detailed, preserve that specificity and only normalize/structure it.
-- If the prompt is generic, you may add tasteful augmentation when it will materially improve the result.
-
-Allowed augmentations:
-- composition or framing hints
-- polish level or intended-use hints
-- practical layout guidance
-- reasonable scene concreteness that supports the stated request
-
-Not allowed augmentations:
-- extra characters or objects that are not implied by the request
-- brand names, slogans, palettes, or narrative beats that are not implied
-- arbitrary side-specific placement unless the surrounding layout supports it
-
-## Use-case taxonomy (exact slugs)
-
-Classify each request into one of these buckets and keep the slug consistent across prompts and references.
-
-Generate:
-- photorealistic-natural — candid/editorial lifestyle scenes with real texture and natural lighting.
-- product-mockup — product/packaging shots, catalog imagery, merch concepts.
-- ui-mockup — app/web interface mockups and wireframes; specify the desired fidelity.
-- infographic-diagram — diagrams/infographics with structured layout and text.
-- scientific-educational — classroom explainers, scientific diagrams, and learning visuals with required labels and accuracy constraints.
-- ads-marketing — campaign concepts and ad creatives with audience, brand position, scene, and exact tagline/copy.
-- productivity-visual — slide, chart, workflow, and data-heavy business visuals.
-- logo-brand — logo/mark exploration, vector-friendly.
-- illustration-story — comics, children’s book art, narrative scenes.
-- stylized-concept — style-driven concept art, 3D/stylized renders.
-- historical-scene — period-accurate/world-knowledge scenes.
-
-Edit:
-- text-localization — translate/replace in-image text, preserve layout.
-- identity-preserve — try-on, person-in-scene; lock face/body/pose.
-- precise-object-edit — remove/replace a specific element (including interior swaps).
-- lighting-weather — time-of-day/season/atmosphere changes only.
-- background-extraction — transparent background / clean cutout. Use built-in `image_gen` with chroma-key removal first for simple opaque subjects; ask before using CLI true transparency for complex subjects.
-- style-transfer — apply reference style while changing subject/scene.
-- compositing — multi-image insert/merge with matched lighting/perspective.
-- sketch-to-render — drawing/line art to photoreal render.
-
-## Shared prompt schema
-
-Use the following labeled spec as shared prompt scaffolding for both top-level modes:
-
-```text
-Use case: <taxonomy slug>
-Asset type: <where the asset will be used>
-Primary request: <user's main prompt>
-Input images: <Image 1: role; Image 2: role> (optional)
-Scene/backdrop: <environment>
-Subject: <main subject>
-Style/medium: <photo/illustration/3D/etc>
-Composition/framing: <wide/close/top-down; placement>
-Lighting/mood: <lighting + mood>
-Color palette: <palette notes>
-Materials/textures: <surface details>
-Text (verbatim): "<exact text>"
-Constraints: <must keep/must avoid>
-Avoid: <negative constraints>
-```
-
-Notes:
-- `Asset type` and `Input images` are prompt scaffolding, not dedicated CLI flags.
-- `Scene/backdrop` refers to the visual setting. It is not the same as the fallback CLI `background` parameter, which controls output transparency behavior.
-- Fallback-only execution notes such as `Quality:`, `Input fidelity:`, masks, output format, and output paths belong in the CLI path only. Do not treat them as built-in `image_gen` tool arguments.
-
-Augmentation rules:
-- Keep it short.
-- Add only the details needed to improve the prompt materially.
-- For edits, explicitly list invariants (`change only X; keep Y unchanged`).
-- If any critical detail is missing and blocks success, ask a question; otherwise proceed.
-
-## Examples
-
-### Generation example (hero image)
-```text
-Use case: product-mockup
-Asset type: landing page hero
-Primary request: a minimal hero image of a ceramic coffee mug
-Style/medium: clean product photography
-Composition/framing: wide composition with usable negative space for page copy if needed
-Lighting/mood: soft studio lighting
-Constraints: no logos, no text, no watermark
-```
-
-### Edit example (invariants)
-```text
-Use case: precise-object-edit
-Asset type: product photo background replacement
-Primary request: replace only the background with a warm sunset gradient
-Constraints: change only the background; keep the product and its edges unchanged; no text; no watermark
-```
-
-## Prompting best practices
-- Structure prompt as scene/backdrop -> subject -> details -> constraints.
-- Include intended use (ad, UI mock, infographic) to set the mode and polish level.
-- Use camera/composition language for photorealism.
-- Only use SVG/vector stand-ins when the user explicitly asked for vector output or a non-image placeholder.
-- Quote exact text and specify typography + placement.
-- For tricky words, spell them letter-by-letter and require verbatim rendering.
-- For multi-image inputs, reference images by index and describe how they should be used.
-- For edits, repeat invariants every iteration to reduce drift.
-- Iterate with single-change follow-ups.
-- If the prompt is generic, add only the extra detail that will materially help.
-- If the prompt is already detailed, normalize it instead of expanding it.
-- For CLI fallback only, see `references/cli.md` and `references/image-api.md` for model, `quality`, `input_fidelity`, masks, output format, and output-path guidance.
-- For transparent images, use the built-in-first chroma-key workflow unless the request is complex enough to need true CLI transparency; ask before switching to CLI `gpt-image-1.5`.
-
-More principles shared by both modes: `references/prompting.md`.
-Copy/paste specs shared by both modes: `references/sample-prompts.md`.
-
-## Guidance by asset type
-Asset-type templates (website assets, game assets, wireframes, logo) are consolidated in `references/sample-prompts.md`.
-
-## gpt-image-2 guidance for CLI fallback
-
-The fallback CLI defaults to `gpt-image-2`.
-
-- Use `gpt-image-2` for new CLI/API workflows unless the request needs true model-native transparent output.
-- If a transparent request may need CLI fallback, ask before using `gpt-image-1.5` unless the user already explicitly requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback. Explain that the built-in chroma-key path is the default, but true transparency requires `gpt-image-1.5` because `gpt-image-2` does not support `background=transparent`.
-- `gpt-image-2` always uses high fidelity for image inputs; do not set `input_fidelity` with this model.
-- `gpt-image-2` supports `quality` values `low`, `medium`, `high`, and `auto`.
-- Use `quality low` for fast drafts, thumbnails, and quick iterations. Use `medium`, `high`, or `auto` for final assets, dense text, diagrams, identity-sensitive edits, or high-resolution outputs.
-- Square images are typically fastest to generate. Use `1024x1024` for fast square drafts.
-- If the user asks for 4K-style output, use `3840x2160` for landscape or `2160x3840` for portrait.
-- `gpt-image-2` size may be `auto` or `WIDTHxHEIGHT` if all constraints hold: max edge `<= 3840px`, both edges multiples of `16px`, long-to-short ratio `<= 3:1`, total pixels between `655,360` and `8,294,400`.
-
-Popular `gpt-image-2` sizes:
-- `1024x1024` square
-- `1536x1024` landscape
-- `1024x1536` portrait
-- `2048x2048` 2K square
-- `2048x1152` 2K landscape
-- `3840x2160` 4K landscape
-- `2160x3840` 4K portrait
-- `auto`
-
-## Fallback CLI mode only
-
-### Temp and output conventions
-These conventions apply only to the CLI fallback. They do not describe built-in `image_gen` output behavior.
-- Use `tmp/imagegen/` for intermediate files (for example JSONL batches); delete them when done.
-- Write final artifacts under `output/imagegen/`.
-- Use `--out` or `--out-dir` to control output paths; keep filenames stable and descriptive.
-
-### Dependencies
-Prefer `uv` for dependency management in this repo.
-
-Required Python package:
-```bash
-uv pip install openai
-```
-
-Required for local chroma-key removal and optional downscaling:
-```bash
-uv pip install pillow
-```
-
-Portability note:
-- If you are using the installed skill outside this repo, install dependencies into that environment with its package manager.
-- In uv-managed environments, `uv pip install ...` remains the preferred path.
-
-### Environment
-- `OPENAI_API_KEY` must be set for live API calls.
-- Do not ask the user for `OPENAI_API_KEY` when using the built-in `image_gen` tool.
-- Never ask the user to paste the full key in chat. Ask them to set it locally and confirm when ready.
-
-If the key is missing, give the user these steps:
-1. Create an API key in the OpenAI platform UI: https://platform.openai.com/api-keys
-2. Set `OPENAI_API_KEY` as an environment variable in their system.
-3. Offer to guide them through setting the environment variable for their OS/shell if needed.
-
-If installation is not possible in this environment, tell the user which dependency is missing and how to install it into their active environment.
-
-### Script-mode notes
-- CLI commands + examples: `references/cli.md`
-- API parameter quick reference: `references/image-api.md`
-- Network approvals / sandbox settings for CLI mode: `references/codex-network.md`
-
-## Reference map
-- `references/prompting.md`: shared prompting principles for both modes.
-- `references/sample-prompts.md`: shared copy/paste prompt recipes for both modes.
-- `references/cli.md`: fallback-only CLI usage via `scripts/image_gen.py`.
-- `references/image-api.md`: fallback-only API/CLI parameter reference.
-- `references/codex-network.md`: fallback-only network/sandbox troubleshooting for CLI mode.
-- `scripts/image_gen.py`: fallback-only CLI implementation. Do not load or use it unless the user explicitly chooses CLI mode or explicitly confirms a transparent request's true CLI transparency fallback.
-- `$CODEX_HOME/skills/.system/imagegen/scripts/remove_chroma_key.py`: local post-processing helper for built-in transparent-image requests.
diff --git a/skills/imagegen/agents/openai.yaml b/skills/imagegen/agents/openai.yaml
deleted file mode 100644
index 5e01d44..0000000
--- a/skills/imagegen/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "Image Gen"
-  short_description: "Generate or edit images for websites, games, and more"
-  icon_small: "./assets/imagegen-small.svg"
-  icon_large: "./assets/imagegen.png"
-  default_prompt: "Use $imagegen to make or edit an image for this project."
diff --git a/skills/imagegen/assets/imagegen-small.svg b/skills/imagegen/assets/imagegen-small.svg
deleted file mode 100644
index 20128b2..0000000
--- a/skills/imagegen/assets/imagegen-small.svg
+++ /dev/null
@@ -1,5 +0,0 @@
-<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" viewBox="0 0 16 16">
-  <path fill="currentColor" d="M7.51 6.827a1 1 0 1 1 .278 1.982 1 1 0 0 1-.278-1.982Z"/>
-  <path fill="currentColor" fill-rule="evenodd" d="M8.31 4.47c.368-.016.699.008 1.016.124l.186.075c.423.194.786.5 1.047.888l.067.107c.148.253.235.533.3.848.073.354.126.797.193 1.343l.277 2.25.088.745c.024.224.041.425.049.605.013.322-.004.615-.085.896l-.04.12a2.53 2.53 0 0 1-.802 1.115l-.16.118c-.281.189-.596.292-.956.366a9.46 9.46 0 0 1-.6.1l-.743.094-2.25.277c-.547.067-.99.121-1.35.136a2.765 2.765 0 0 1-.896-.085l-.12-.039a2.533 2.533 0 0 1-1.115-.802l-.118-.161c-.189-.28-.292-.596-.366-.956a9.42 9.42 0 0 1-.1-.599l-.094-.744-.276-2.25a17.884 17.884 0 0 1-.137-1.35c-.015-.367.009-.698.124-1.015l.076-.185c.193-.423.5-.787.887-1.048l.107-.067c.253-.148.534-.234.849-.3.354-.073.796-.126 1.343-.193l2.25-.277.744-.088c.224-.024.425-.041.606-.049Zm-2.905 5.978a1.47 1.47 0 0 0-.875.074c-.127.052-.267.146-.475.344-.212.204-.462.484-.822.889l-.314.351c.018.115.036.219.055.313.061.295.127.458.206.575l.07.094c.167.211.39.372.645.465l.109.032c.119.027.273.038.499.029.308-.013.7-.06 1.264-.13l2.25-.275.727-.093.198-.03-2.05-1.64a16.848 16.848 0 0 0-.96-.738c-.18-.121-.31-.19-.421-.23l-.106-.03Zm2.95-4.915c-.154.006-.33.021-.536.043l-.729.086-2.25.276c-.564.07-.956.118-1.257.18a1.937 1.937 0 0 0-.478.15l-.097.057a1.47 1.47 0 0 0-.515.608l-.044.107c-.048.133-.073.307-.06.608.012.307.06.7.129 1.264l.22 1.8.178-.197c.145-.159.278-.298.403-.418.255-.243.507-.437.809-.56l.181-.067a2.526 2.526 0 0 1 1.328-.06l.118.029c.27.079.517.215.772.387.287.194.619.46 1.03.789l2.52 2.016c.146-.148.26-.326.332-.524l.031-.109c.027-.119.039-.273.03-.499a8.311 8.311 0 0 0-.044-.536l-.086-.728-.276-2.25c-.07-.564-.118-.956-.18-1.258a1.935 1.935 0 0 0-.15-.477l-.057-.098a1.468 1.468 0 0 0-.608-.515l-.107-.043c-.133-.049-.306-.074-.607-.061Z" clip-rule="evenodd"/>
-  <path fill="currentColor" d="M7.783 1.272c.36.014.803.07 1.35.136l2.25.277.743.095c.224.03.423.062.6.099.36.074.675.177.955.366l.161.118c.364.29.642.675.802 1.115l.04.12c.081.28.098.574.085.896a9.42 9.42 0 0 1-.05.605l-.087.745-.277 2.25c-.067.547-.12.989-.193 1.343a2.765 2.765 0 0 1-.3.848l-.067.107a2.534 2.534 0 0 1-.415.474l-.086.064a.532.532 0 0 1-.622-.858l.13-.13c.04-.046.077-.094.111-.145l.057-.098c.055-.109.104-.256.15-.477.062-.302.11-.694.18-1.258l.276-2.25.086-.728c.022-.207.037-.382.043-.536.01-.226-.002-.38-.029-.5l-.032-.108a1.469 1.469 0 0 0-.464-.646l-.094-.069c-.118-.08-.28-.145-.575-.206a8.285 8.285 0 0 0-.53-.088l-.728-.092-2.25-.276c-.565-.07-.956-.117-1.264-.13a1.94 1.94 0 0 0-.5.029l-.108.032a1.469 1.469 0 0 0-.647.465l-.068.094c-.054.08-.102.18-.146.33l-.04.1a.533.533 0 0 1-.98-.403l.055-.166c.059-.162.133-.314.23-.457l.117-.16c.29-.365.675-.643 1.115-.803l.12-.04c.28-.08.574-.097.896-.084Z"/>
-</svg>
diff --git a/skills/imagegen/assets/imagegen.png b/skills/imagegen/assets/imagegen.png
deleted file mode 100644
index 94b54541a9affd39a7aa09d0efd5bc6b712b723b..0000000000000000000000000000000000000000
GIT binary patch
literal 0
HcmV?d00001

literal 1711
zcmV;g22lBlP)<h;3K|Lk000e1NJLTq003kF003kN1^@s6aN?Cz00009a7bBm000XU
z000XU0RWnu7ytkO0drDELIAGL9O(c600d`2O+f$vv5yP<VFdsH21H3jK~#7F?VV3-
z6Gs$>f8*GWodgmJ0xDHBC~1!*z7`}xiD+*{^u{6Wtr9m>;F?6e6%akq_R>NQ97`^h
zS_ISw!l_acdMv2|s@jkWFo}~maqQ{5Ar6jXJ8OGpcRf3wwDM+c*~)zT-u&HNh6Xr2
z$-B~6@6U&DoN@F6Tx_gMyw!zZkYd0r7n}J1r^VmNyNO5=4Zu(bgOk|-gzyRH_#DA0
ze5a&Dv5qs&Z`LEHCLtt(GYpH}0a%=n6p=Gpix@{jKAv3Z&a&_|v3nYpI$$><yk+#4
z1e@LQlRJH2BPwpgrltlFGC0oPON7U(eJWJ#&B5vHu#oW^tPBP4ZZLlPLs6#HK2<S7
zqzsM`Sd=49@{#*}k<oJRl@(%T=!f&%`TL33H>Jn72{}2rewsoH7VU@@*oo2>*cKtL
zTT?Bf&S2fJxIt<c4<8;+uvFo|mP$R#BEwdOt8^{0^&g85Y(|JpRo+pYy52+x%U^@V
z6E;RaBvObRn*!^G#VZD0JJ=Ay8T$+tPvINGQnC&?IhB10+Z*>9+2RUqgo>5nJ#ub|
zQq}-0z927LghkRij)2h@&){gs3Jyeb=#8#z9#4y@PugZO5lp1xm|ls&O&Ie1Y;Y<&
zDJqnH7*0nhk28A~<wpBXn9GLoXt@<*FFNJEe%LG%6*`CEoY}L0p}h-^MU+BO^V7>+
z7<=9c&7_PLLIN%we2x!9dQ!nmCW_&I_i2rm5DevDWF6nVJEu$r(Gy$4m3QXlck9AP
zAru+93XZ;0rxYWFoZJ6W>sd_Seeu8x=)gE3r*<#NO*egQ8QEe}jd4PT_P&B!&~Me-
za;t<<LMSqHrm9j3eH)b+CFD~LDP$+CkP1*_^t7(QZ751;C`J{=2ssj8g;yL^*w-;e
zNUsOcQQ$ySUA<+Dke*l;UeOa(_uIw}oir;}h|e%a$WpGZi@}sY!}F>zMu<BTNab0w
zLbfxr7KK+#i&;fg7$an2F%GY=LdrmSe0tg4MF|9@N|lQtjA~{5y3hu<xwFs?l^7-D
z&O(Q)l{@{G6|w`D=iY)_j6L72`~)yg2<3BHvZI@a>9~wY)fm}Rzy9AItra{)#n*Ft
zp#x)wPKN*4hndv~RP#6!#f883EA5>ZW2_J=urHpxtu%d61x_+_HXOVgZ*U1pUyntk
z&{EQR=i5oZ_4zJ5T+-jH*0PkegJp0u{3nitpQ5+rnfUw7Y~EbH6KNj9MD{&AT0ew2
zu6@1iCZ~3%@lofp<0)5aAWWoVxbvz*TZ$@0sgS;wrx=Pokgrae&K<&7=9qkS3pxKD
zT|-~ns+{fX2)!<Xbe`eaT3FOQQB1A0;+Y2nmP&*i486j|_|G+oC}m>(eSEue($$FZ
zBMl2V75M|_V)ta4Qo-2jF}VemhGKH4^?}?}Lf=PnuV)4kMCz`oE{PPST1J60(ckfX
z`wz;Zu9>J=2o=)R_FFPl>7=J+9#`9L1x`v$La6e-A_}RI%DWbVD8;dmf{b2KNNy4|
zDUO8nhUTRVlHvtHlCq-^sw=LvdncnnP^459LaiNYP5Gq|f*_@$5Ngt%i`|9aFkMPn
zAtXXqA43HuOW7i%(8r)u<#$Y#vMI#vK86ZRlp=+A)yGhQX;MO7_c2spk`%T$bD5iR
zcFpAW<ICl<az?UQ37M3CO^6iZR-H7v6eE`bHM10B*JU-U6r(TtY(^=@UxnLjQUY;V
zbTdf_%ysI`A|+5a4rm4`fxDA~-=zfd)*61664-m4_*F`vZ$9HgDXGBU4aiSY=-KRn
z7ee?&3g`JJR>%f^kirm}vO<dRfs~{bQi6w4QuJ_1E2IqGNMZ89_f|*++?K*Pze%rF
zNEKX^lHC3*TuWKpkis}d3;R}x1N2H^H;Nx}Z-qESj}$hW<1M4bN34(<P%eezd@{ji
ziw{{LHKIxi7xl)yM0mXPxD`?djY=UI_Y;wka_?CobyBaCYBC5bqycJ_k`m3^6V+r8
zR!D<5ks{_fk~tnu6gO`xVTCB5k`xj_QE|6Fa-y^~RSCxb`pWpHMY{!EpK@XOY-*9m
z$7yWJNko)lg)~M=6k!UCO(CCuBJz!B#^$Ej;gJ;T<bMJ3q~G?jZnFRY002ovPDHLk
FV1gqn4#EHc

diff --git a/skills/imagegen/references/cli.md b/skills/imagegen/references/cli.md
deleted file mode 100644
index f4a5a63..0000000
--- a/skills/imagegen/references/cli.md
+++ /dev/null
@@ -1,242 +0,0 @@
-# CLI reference (`scripts/image_gen.py`)
-
-This file is for the fallback CLI mode only. Read it when the user explicitly asks to use `scripts/image_gen.py` / CLI / API / model controls, or after the user explicitly confirms that a transparent-output request should use the `gpt-image-1.5` true-transparency fallback path.
-
-`generate-batch` is a CLI subcommand in this fallback path. It is not a top-level mode of the skill.
-The word `batch` in a user request is not CLI opt-in by itself.
-
-## What this CLI does
-- `generate`: generate a new image from a prompt
-- `edit`: edit one or more existing images
-- `generate-batch`: run many generation jobs from a JSONL file after the user explicitly chooses CLI/API/model controls
-
-Real API calls require **network access** + `OPENAI_API_KEY`. `--dry-run` does not.
-
-## Quick start (works from any repo)
-Set a stable path to the skill CLI (default `CODEX_HOME` is `~/.codex`):
-
-```
-export CODEX_HOME="${CODEX_HOME:-$HOME/.codex}"
-export IMAGE_GEN="$CODEX_HOME/skills/.system/imagegen/scripts/image_gen.py"
-```
-
-Install dependencies into the Python environment you will run the CLI from, using that environment's package manager. In uv-managed environments, `uv pip install ...` remains the preferred path.
-
-## Quick start
-
-Dry-run (no API call; no network required; does not require the `openai` package):
-
-```bash
-python "$IMAGE_GEN" generate \
-  --prompt "Test" \
-  --out output/imagegen/test.png \
-  --dry-run
-```
-
-Notes:
-- One-off dry-runs print the API payload and the computed output path(s).
-- Repo-local finals should live under `output/imagegen/`.
-
-Generate (requires `OPENAI_API_KEY` + network):
-
-```bash
-python "$IMAGE_GEN" generate \
-  --prompt "A cozy alpine cabin at dawn" \
-  --size 1024x1024 \
-  --out output/imagegen/alpine-cabin.png
-```
-
-Edit:
-
-```bash
-python "$IMAGE_GEN" edit \
-  --image input.png \
-  --prompt "Replace only the background with a warm sunset" \
-  --out output/imagegen/sunset-edit.png
-```
-
-## Guardrails
-- Use the bundled CLI directly (`python "$IMAGE_GEN" ...`) after activating the correct environment.
-- Do **not** create one-off runners (for example `gen_images.py`) unless the user explicitly asks for a custom wrapper.
-- **Never modify** `scripts/image_gen.py`. If something is missing, ask the user before doing anything else.
-- Do not silently downgrade from CLI `gpt-image-2` or built-in `image_gen` to CLI `gpt-image-1.5`; ask first unless the user already explicitly requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback.
-
-## Defaults
-- Model: `gpt-image-2`
-- Supported model family for this CLI: GPT Image models (`gpt-image-*`)
-- Size: `auto`
-- Quality: `medium`
-- Output format: `png`
-- Default one-off output path: `output/imagegen/output.png`
-- Background: unspecified unless `--background` is set
-
-## gpt-image-2 size and model guidance
-
-`gpt-image-2` is the default model for new CLI fallback work.
-
-- Use `--quality low` for fast drafts, thumbnails, and quick iterations.
-- Use `--quality medium`, `--quality high`, or `--quality auto` for final assets, dense text, diagrams, identity-sensitive edits, and high-resolution outputs.
-- Square images are typically fastest. Use `--size 1024x1024` for quick square drafts.
-- If the user asks for 4K-style output, use `--size 3840x2160` for landscape or `--size 2160x3840` for portrait.
-- Do not pass `--input-fidelity` with `gpt-image-2`; this model always uses high fidelity for image inputs.
-- Do not use `--background transparent` with `gpt-image-2`; the default transparent-image workflow uses built-in `image_gen` on a flat chroma-key background plus local removal. Use `gpt-image-1.5` only after the user explicitly confirms the true-transparent CLI fallback, unless they already requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback.
-
-Popular `gpt-image-2` sizes:
-- `1024x1024`
-- `1536x1024`
-- `1024x1536`
-- `2048x2048`
-- `2048x1152`
-- `3840x2160`
-- `2160x3840`
-- `auto`
-
-`gpt-image-2` size constraints:
-- max edge `<= 3840px`
-- both edges multiples of `16px`
-- long edge to short edge ratio `<= 3:1`
-- total pixels between `655,360` and `8,294,400`
-- outputs with more total pixels than `2560x1440` (3,686,400) are experimental
-
-Fast draft:
-
-```bash
-python "$IMAGE_GEN" generate \
-  --prompt "A product thumbnail of a matte ceramic mug on a stone surface" \
-  --quality low \
-  --size 1024x1024 \
-  --out output/imagegen/mug-draft.png
-```
-
-Final 2K landscape:
-
-```bash
-python "$IMAGE_GEN" generate \
-  --prompt "A polished landing-page hero image of a matte ceramic mug on a stone surface" \
-  --quality high \
-  --size 2048x1152 \
-  --out output/imagegen/mug-hero.png
-```
-
-4K landscape:
-
-```bash
-python "$IMAGE_GEN" generate \
-  --prompt "A detailed architectural visualization at golden hour" \
-  --size 3840x2160 \
-  --quality high \
-  --out output/imagegen/architecture-4k.png
-```
-
-True transparent fallback request:
-
-Ask for confirmation before using this command unless the user already explicitly requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback.
-
-```bash
-python "$IMAGE_GEN" generate \
-  --model gpt-image-1.5 \
-  --prompt "A clean product cutout on a transparent background" \
-  --background transparent \
-  --output-format png \
-  --out output/imagegen/product-cutout.png
-```
-
-When using this path, explain briefly that built-in `image_gen` plus chroma-key removal is the default transparent-image path, but this request needs true model-native transparency. `gpt-image-2` does not support `background=transparent`, so `gpt-image-1.5` is required for this confirmed fallback.
-
-## Quality, input fidelity, and masks (CLI fallback only)
-These are explicit CLI controls. They are not built-in `image_gen` tool arguments.
-
-- `--quality` works for `generate`, `edit`, and `generate-batch`: `low|medium|high|auto`
-- `--input-fidelity` is **edit-only** and validated as `low|high`; it is not supported for `gpt-image-2`
-- `--mask` is **edit-only**
-
-Example:
-
-```bash
-python "$IMAGE_GEN" edit \
-  --model gpt-image-1.5 \
-  --image input.png \
-  --prompt "Change only the background" \
-  --quality high \
-  --input-fidelity high \
-  --out output/imagegen/background-edit.png
-```
-
-Mask notes:
-- For multi-image edits, pass repeated `--image` flags. Their order is meaningful, so describe each image by index and role in the prompt.
-- The CLI accepts a single `--mask`.
-- Image and mask must be the same size and format and each under 50MB.
-- Masks must include an alpha channel.
-- If multiple input images are provided, the mask applies to the first image.
-- Masking is prompt-guided; do not promise exact pixel-perfect mask boundaries.
-- Use a PNG mask when possible; the script treats mask handling as best-effort and does not perform full preflight validation beyond file checks/warnings.
-- In the edit prompt, repeat invariants (`change only the background; keep the subject unchanged`) to reduce drift.
-
-## Output handling
-- Use `tmp/imagegen/` for temporary JSONL inputs or scratch files.
-- Use `output/imagegen/` for final outputs.
-- Reruns fail if a target file already exists unless you pass `--force`.
-- `--out-dir` changes one-off naming to `image_1.<ext>`, `image_2.<ext>`, and so on.
-- Downscaled copies use the default suffix `-web` unless you override it.
-
-## Common recipes
-
-Generate with augmentation fields:
-
-```bash
-python "$IMAGE_GEN" generate \
-  --prompt "A minimal hero image of a ceramic coffee mug" \
-  --use-case "product-mockup" \
-  --style "clean product photography" \
-  --composition "wide product shot with usable negative space for page copy" \
-  --constraints "no logos, no text" \
-  --out output/imagegen/mug-hero.png
-```
-
-Generate + also write a downscaled copy for fast web loading:
-
-```bash
-python "$IMAGE_GEN" generate \
-  --prompt "A cozy alpine cabin at dawn" \
-  --size 1024x1024 \
-  --downscale-max-dim 1024 \
-  --out output/imagegen/alpine-cabin.png
-```
-
-Generate multiple prompts concurrently (async batch):
-
-```bash
-mkdir -p tmp/imagegen output/imagegen/batch
-cat > tmp/imagegen/prompts.jsonl << 'EOF'
-{"prompt":"Cavernous hangar interior with a compact shuttle parked near the center","use_case":"stylized-concept","composition":"wide-angle, low-angle","lighting":"volumetric light rays through drifting fog","constraints":"no logos or trademarks; no watermark","size":"1536x1024"}
-{"prompt":"Gray wolf in profile in a snowy forest","use_case":"photorealistic-natural","composition":"eye-level","constraints":"no logos or trademarks; no watermark","size":"1024x1024"}
-EOF
-
-python "$IMAGE_GEN" generate-batch \
-  --input tmp/imagegen/prompts.jsonl \
-  --out-dir output/imagegen/batch \
-  --concurrency 5
-
-rm -f tmp/imagegen/prompts.jsonl
-```
-
-Notes:
-- `generate-batch` requires `--out-dir`.
-- Use `--concurrency` to control parallelism (default `5`).
-- Per-job overrides are supported in JSONL (for example `size`, `quality`, `background`, `output_format`, `output_compression`, `moderation`, `n`, `model`, `out`, and prompt-augmentation fields).
-- `--n` generates multiple variants for a single prompt; `generate-batch` is for many different prompts.
-- In batch mode, per-job `out` is treated as a filename under `--out-dir`.
-- For many requested deliverable assets, provide one prompt/job per distinct asset and use semantic filenames when possible.
-
-## CLI notes
-- Supported sizes depend on the model. `gpt-image-2` supports flexible constrained sizes; older GPT Image models support `1024x1024`, `1536x1024`, `1024x1536`, or `auto`.
-- True transparent CLI outputs require `output_format` to be `png` or `webp` and are not supported by `gpt-image-2`.
-- `--prompt-file`, `--output-compression`, `--moderation`, `--max-attempts`, `--fail-fast`, `--force`, and `--no-augment` are supported.
-- This CLI is intended for GPT Image models. Do not assume older non-GPT image-model behavior applies here.
-
-## See also
-- API parameter quick reference for fallback CLI mode: `references/image-api.md`
-- Prompt examples shared across both top-level modes: `references/sample-prompts.md`
-- Network/sandbox notes for fallback CLI mode: `references/codex-network.md`
-- Built-in-first transparent image workflow: `SKILL.md` and `$CODEX_HOME/skills/.system/imagegen/scripts/remove_chroma_key.py`
diff --git a/skills/imagegen/references/codex-network.md b/skills/imagegen/references/codex-network.md
deleted file mode 100644
index 5ce1fbc..0000000
--- a/skills/imagegen/references/codex-network.md
+++ /dev/null
@@ -1,33 +0,0 @@
-# Codex network approvals / sandbox notes
-
-This file is for the fallback CLI mode only. Read it when the user explicitly asks to use `scripts/image_gen.py` / CLI / API / model controls, or after the user explicitly confirms that a transparent-output request should use the `gpt-image-1.5` true-transparency fallback path.
-
-This guidance is intentionally isolated from `SKILL.md` because it can vary by environment and may become stale. Prefer the defaults in your environment when in doubt.
-
-## Why am I asked to approve image generation calls?
-The fallback CLI uses the OpenAI Image API, so it needs outbound network access. In many Codex setups, network access is disabled by default and/or the approval policy requires confirmation before networked commands run.
-
-## Important note about approvals vs network
-- `--ask-for-approval never` suppresses approval prompts.
-- It does **not** by itself enable network access.
-- In `workspace-write`, network access still depends on your Codex configuration (for example `[sandbox_workspace_write] network_access = true`).
-
-## How do I reduce repeated approval prompts?
-If you trust the repo and want fewer prompts, use a configuration or profile that both:
-- enables network for the sandbox mode you plan to use
-- sets an approval policy that matches your risk tolerance
-
-Example `~/.codex/config.toml` pattern:
-
-```toml
-approval_policy = "on-request"
-sandbox_mode = "workspace-write"
-
-[sandbox_workspace_write]
-network_access = true
-```
-
-If you want quieter automation after network is enabled, you can choose an approval policy that prompts less often (for example `never`), but do that intentionally and with care.
-
-## Safety note
-Enabling network and reducing approvals lowers friction, but increases risk if you run untrusted code or work in an untrusted repository.
diff --git a/skills/imagegen/references/image-api.md b/skills/imagegen/references/image-api.md
deleted file mode 100644
index db8567d..0000000
--- a/skills/imagegen/references/image-api.md
+++ /dev/null
@@ -1,90 +0,0 @@
-# Image API quick reference
-
-This file is for the fallback CLI mode only. Use it when the user explicitly asks to use `scripts/image_gen.py` / CLI / API / model controls, or after the user explicitly confirms that a transparent-output request should use the `gpt-image-1.5` true-transparency fallback path.
-
-These parameters describe the Image API and bundled CLI fallback surface. Do not assume they are normal arguments on the built-in `image_gen` tool.
-
-## Scope
-- This fallback CLI is intended for GPT Image models (`gpt-image-2`, `gpt-image-1.5`, `gpt-image-1`, and `gpt-image-1-mini`).
-- The built-in `image_gen` tool and the fallback CLI do not expose the same controls.
-
-## Model summary
-
-| Model | Quality | Input fidelity | Resolutions | Recommended use |
-| --- | --- | --- | --- | --- |
-| `gpt-image-2` | `low`, `medium`, `high`, `auto` | Always high fidelity for image inputs; do not set `input_fidelity` | `auto` or flexible sizes that satisfy the constraints below | Default for new CLI/API workflows: high-quality generation and editing, text-heavy images, photorealism, compositing, identity-sensitive edits, and workflows where fewer retries matter |
-| `gpt-image-1.5` | `low`, `medium`, `high`, `auto` | `low`, `high` | `1024x1024`, `1024x1536`, `1536x1024`, `auto` | True transparent-background fallback and backward-compatible workflows |
-| `gpt-image-1` | `low`, `medium`, `high`, `auto` | `low`, `high` | `1024x1024`, `1024x1536`, `1536x1024`, `auto` | Legacy compatibility |
-| `gpt-image-1-mini` | `low`, `medium`, `high`, `auto` | `low`, `high` | `1024x1024`, `1024x1536`, `1536x1024`, `auto` | Cost-sensitive draft batches and lower-stakes previews |
-
-## gpt-image-2 sizes
-
-`gpt-image-2` accepts `auto` or any `WIDTHxHEIGHT` size that satisfies all constraints:
-
-- Maximum edge length must be less than or equal to `3840px`.
-- Both edges must be multiples of `16px`.
-- Long edge to short edge ratio must not exceed `3:1`.
-- Total pixels must be at least `655,360` and no more than `8,294,400`.
-
-Popular sizes:
-
-| Label | Size | Notes |
-| --- | --- | --- |
-| Square | `1024x1024` | Typical fast default |
-| Landscape | `1536x1024` | Standard landscape |
-| Portrait | `1024x1536` | Standard portrait |
-| 2K square | `2048x2048` | Larger square output |
-| 2K landscape | `2048x1152` | Widescreen output |
-| 4K landscape | `3840x2160` | Widescreen 4K output |
-| 4K portrait | `2160x3840` | Vertical 4K output |
-| Auto | `auto` | Default size |
-
-Square images are typically fastest to generate. For 4K-style output, use `3840x2160` or `2160x3840`.
-
-## Endpoints
-- Generate: `POST /v1/images/generations` (`client.images.generate(...)`)
-- Edit: `POST /v1/images/edits` (`client.images.edit(...)`)
-
-## Core parameters for GPT Image models
-- `prompt`: text prompt
-- `model`: image model
-- `n`: number of images (1-10)
-- `size`: `auto` by default for `gpt-image-2`; flexible `WIDTHxHEIGHT` sizes are allowed only for `gpt-image-2`; older GPT Image models use `1024x1024`, `1536x1024`, `1024x1536`, or `auto`
-- `quality`: `low`, `medium`, `high`, or `auto`
-- `background`: output transparency behavior (`transparent`, `opaque`, or `auto`) for generated output; this is not the same thing as the prompt's visual scene/backdrop
-- `output_format`: `png` (default), `jpeg`, `webp`
-- `output_compression`: 0-100 (jpeg/webp only)
-- `moderation`: `auto` (default) or `low`
-
-## Edit-specific parameters
-- `image`: one or more input images. For GPT Image models, you can provide up to 16 images.
-- `mask`: optional mask image
-- `input_fidelity`: `low` or `high` only for models that support it; do not set this for `gpt-image-2`
-
-Model-specific note for `input_fidelity`:
-- `gpt-image-2` always uses high fidelity for image inputs and does not support setting `input_fidelity`.
-- `gpt-image-1` and `gpt-image-1-mini` preserve all input images, but the first image gets richer textures and finer details.
-- `gpt-image-1.5` preserves the first 5 input images with higher fidelity.
-
-## Transparent backgrounds
-
-`gpt-image-2` does not currently support the Image API `background=transparent` parameter. The skill's default transparent-image path is built-in `image_gen` with a flat chroma-key background, followed by local alpha extraction with `python "${CODEX_HOME:-$HOME/.codex}/skills/.system/imagegen/scripts/remove_chroma_key.py"`.
-
-Use CLI `gpt-image-1.5` with `background=transparent` and a transparent-capable output format such as `png` or `webp` only after the user explicitly confirms that fallback, unless they already requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback. If the user asks for true/native transparency, the subject is too complex for clean chroma-key removal, or local background removal fails validation, explain the tradeoff and ask before switching.
-
-## Output
-- `data[]` list with `b64_json` per image
-- The bundled `scripts/image_gen.py` CLI decodes `b64_json` and writes output files for you.
-
-## Limits and notes
-- Input images and masks must be under 50MB.
-- Use the edits endpoint when the user requests changes to an existing image.
-- Masking is prompt-guided; exact shapes are not guaranteed.
-- Large sizes and high quality increase latency and cost.
-- Use `quality=low` for fast drafts, thumbnails, and quick iterations. Use `medium` or `high` for final assets, dense text, diagrams, identity-sensitive edits, or high-resolution outputs.
-- High `input_fidelity` can materially increase input token usage on models that support it.
-- If a request fails because a specific option is unsupported by the selected GPT Image model, retry manually without that option only when the option is not required by the user. If true transparent CLI output is required, ask before switching to `gpt-image-1.5` instead of dropping `background=transparent`, unless the user already explicitly chose that fallback.
-
-## Important boundary
-- `quality`, `input_fidelity`, explicit masks, `background`, `output_format`, and related parameters are fallback-only execution controls.
-- Do not assume they are built-in `image_gen` tool arguments.
diff --git a/skills/imagegen/references/prompting.md b/skills/imagegen/references/prompting.md
deleted file mode 100644
index 9d2da42..0000000
--- a/skills/imagegen/references/prompting.md
+++ /dev/null
@@ -1,118 +0,0 @@
-# Prompting best practices
-
-These prompting principles are shared by both top-level modes of the skill:
-- built-in `image_gen` tool (default)
-- explicit `scripts/image_gen.py` CLI fallback
-
-This file is about prompt structure, specificity, and iteration. Fallback-only execution controls such as `quality`, `input_fidelity`, masks, output format, and output paths live in the fallback docs.
-
-## Contents
-- [Structure](#structure)
-- [Specificity policy](#specificity-policy)
-- [Allowed and disallowed augmentation](#allowed-and-disallowed-augmentation)
-- [Composition and layout](#composition-and-layout)
-- [Constraints and invariants](#constraints-and-invariants)
-- [Text in images](#text-in-images)
-- [Input images and references](#input-images-and-references)
-- [Iterate deliberately](#iterate-deliberately)
-- [Transparent images](#transparent-images)
-- [Fallback-only execution controls](#fallback-only-execution-controls)
-- [Use-case tips](#use-case-tips)
-- [Where to find copy/paste recipes](#where-to-find-copypaste-recipes)
-
-## Structure
-- Use a consistent order: scene/backdrop -> subject -> key details -> constraints -> output intent.
-- Include intended use (ad, UI mock, infographic) to set the level of polish.
-- For complex requests, use short labeled lines instead of one long paragraph.
-
-## Specificity policy
-- If the user prompt is already specific and detailed, normalize it into a clean spec without adding creative requirements.
-- If the prompt is generic, you may add tasteful detail when it materially improves the output.
-- Treat examples in `sample-prompts.md` as fully-authored recipes, not as the default amount of augmentation to add to every request.
-- For photorealism, include `photorealistic` directly when that is the goal, plus concrete real-world texture such as pores, wrinkles, fabric wear, material grain, or imperfect everyday detail.
-
-## Allowed and disallowed augmentation
-
-Allowed augmentation for generic prompts:
-- composition and framing cues
-- intended-use or polish-level hints
-- practical layout guidance
-- reasonable scene concreteness that supports the request
-
-Do not add:
-- extra characters, props, or objects that are not implied
-- brand palettes, slogans, or story beats that are not implied
-- arbitrary side-specific placement unless the surrounding layout supports it
-
-## Composition and layout
-- Specify framing and viewpoint (close-up, wide, top-down) and placement only when it materially helps.
-- Call out negative space if the asset clearly needs room for UI or copy.
-- Avoid making left/right layout decisions unless the user or surrounding layout supports them.
-- For people, describe body framing, scale, gaze, and object interactions when they matter (`full body visible`, `looking down at the book`, `hands naturally gripping the handlebars`).
-
-## Constraints and invariants
-- State what must not change (`keep background unchanged`).
-- For edits, say `change only X; keep Y unchanged` and repeat invariants on every iteration to reduce drift.
-
-## Text in images
-- Put literal text in quotes or ALL CAPS and specify typography (font style, size, color, placement).
-- Spell uncommon words letter-by-letter if accuracy matters.
-- For in-image copy, require verbatim rendering and no extra characters.
-- In CLI fallback mode, use `medium` or `high` quality for small text, dense infographics, data-heavy slides, multi-font layouts, legends, axes, and footnotes.
-
-## Input images and references
-- Do not assume that every provided image is an edit target.
-- Label each image by index and role (`Image 1: edit target`, `Image 2: style reference`).
-- If the user provides images for style, composition, or mood guidance and does not ask to modify them, treat the request as generation with references.
-- If the user asks to preserve an existing image while changing specific parts, treat the request as an edit.
-- For compositing, describe how the images interact (`place the subject from Image 2 into Image 1`).
-
-## Iterate deliberately
-- Start with a clean base prompt, then make small single-change edits.
-- Re-specify critical constraints when you iterate.
-- Prefer one targeted follow-up at a time over rewriting the whole prompt.
-
-## Transparent images
-- Use built-in `image_gen` first for transparent-image requests. If the subject is clearly too complex for chroma-key removal, explain the fallback and ask before switching to CLI.
-- Prompt for a perfectly flat solid chroma-key background, usually `#00ff00`; use `#ff00ff` when the subject is green, and avoid key colors that appear in the subject.
-- Explicitly prohibit shadows, gradients, floor planes, reflections, texture, and lighting variation in the background.
-- Ask for crisp edges, generous padding, and no use of the key color inside the subject.
-- After generation, remove the background locally with `python "${CODEX_HOME:-$HOME/.codex}/skills/.system/imagegen/scripts/remove_chroma_key.py" --input <source> --out <final.png> --auto-key border --soft-matte --transparent-threshold 12 --opaque-threshold 220 --despill` and validate the alpha result before shipping it.
-- Use soft matte and despill for antialiased edges; hard tolerance-only removal is mainly for flat pixel-art or exact-color fixtures.
-- Use CLI `gpt-image-1.5 --background transparent --output-format png` only after the user explicitly confirms the fallback, or when the user already explicitly requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback. Ask first for true/native transparency requests, failed chroma-key validation, or complex transparent subjects such as hair, fur, glass, smoke, liquids, translucent materials, reflective objects, or soft shadows.
-
-## Fallback-only execution controls
-- `quality`, `input_fidelity`, explicit masks, output format, and output paths are fallback-only execution controls.
-- Do not assume they are built-in `image_gen` tool arguments.
-- If the user explicitly chooses CLI fallback, see `references/cli.md` and `references/image-api.md` for those controls.
-- In CLI fallback mode, `gpt-image-2` is the default. It supports `quality=low|medium|high|auto`; use `low` for fast drafts and thumbnails, and move to `medium`, `high`, or `auto` for final assets.
-- `gpt-image-2` always uses high fidelity for image inputs, so do not set `input_fidelity` with that model.
-- If a transparent request needs true CLI transparency, ask before using `gpt-image-1.5` unless the user already explicitly chose it. Explain that built-in chroma-key removal is the default path, but `gpt-image-2` does not support `background=transparent`.
-- If the user asks for 4K-style output with `gpt-image-2`, use `3840x2160` for landscape or `2160x3840` for portrait.
-
-## Use-case tips
-Generate:
-- photorealistic-natural: Prompt as if a real photo is captured in the moment; use photography language (lens, lighting, framing); call for real texture; avoid over-stylized polish unless requested.
-- product-mockup: Describe the product/packaging and materials; ensure clean silhouette and label clarity; if in-image text is needed, require verbatim rendering and specify typography.
-- ui-mockup: Describe the target fidelity first (shippable mockup or low-fi wireframe), then focus on layout, hierarchy, and practical UI elements; avoid concept-art language.
-- infographic-diagram: Define the audience and layout flow; label parts explicitly; require verbatim text; prefer higher quality in CLI mode for dense labels.
-- logo-brand: Keep it simple and scalable; ask for a strong silhouette and balanced negative space; avoid decorative flourishes unless requested.
-- ads-marketing: Write like a creative brief; include brand positioning, audience, desired vibe, scene, and exact tagline if text must appear.
-- productivity-visual: Name the exact artifact (slide, chart, workflow diagram), define the canvas and hierarchy, provide real labels/data, and ask for readable typography and polished spacing.
-- scientific-educational: Define audience, lesson objective, required labels, scientific constraints, arrows, and scan-friendly whitespace.
-- illustration-story: Define panels or scene beats; keep each action concrete.
-- stylized-concept: Specify style cues, material finish, and rendering approach (3D, painterly, clay) without inventing new story elements.
-- historical-scene: State the location/date and required period accuracy; constrain clothing, props, and environment to match the era.
-
-Edit:
-- text-localization: Change only the text; preserve layout, typography, spacing, and hierarchy; no extra words or reflow unless needed.
-- identity-preserve: Lock identity (face, body, pose, hair, expression); change only the specified elements; match lighting and shadows.
-- precise-object-edit: Specify exactly what to remove/replace; preserve surrounding texture and lighting; keep everything else unchanged.
-- lighting-weather: Change only environmental conditions (light, shadows, atmosphere, precipitation); keep geometry, framing, and subject identity.
-- background-extraction: For simple opaque subjects, request a clean cutout on a perfectly flat chroma-key background; crisp silhouette; generous padding; no shadows; no halos; preserve label text exactly; no restyling. Ask before using true CLI transparency for complex subjects.
-- style-transfer: Specify style cues to preserve (palette, texture, brushwork) and what must change; add `no extra elements` to prevent drift.
-- compositing: Reference inputs by index; specify what moves where; match lighting, perspective, and scale; keep the base framing unchanged.
-- sketch-to-render: Preserve layout, proportions, and perspective; choose materials and lighting that support the supplied sketch without adding new elements.
-
-## Where to find copy/paste recipes
-For copy/paste prompt specs (examples only), see `references/sample-prompts.md`. This file focuses on principles, specificity, and iteration patterns.
diff --git a/skills/imagegen/references/sample-prompts.md b/skills/imagegen/references/sample-prompts.md
deleted file mode 100644
index d949295..0000000
--- a/skills/imagegen/references/sample-prompts.md
+++ /dev/null
@@ -1,433 +0,0 @@
-# Sample prompts (copy/paste)
-
-These prompt recipes are shared across both top-level modes of the skill:
-- built-in `image_gen` tool (default)
-- `scripts/image_gen.py` CLI fallback for explicit CLI/API/model requests or user-confirmed true-transparent-output fallback requests
-
-Use these as starting points. They are intentionally complete prompt recipes, not the default amount of augmentation to add to every user request.
-
-When adapting a user's prompt:
-- keep user-provided requirements
-- only add detail according to the specificity policy in `SKILL.md`
-- do not treat every example below as permission to invent extra story elements
-
-The labeled lines are prompt scaffolding, not a closed schema. `Asset type` and `Input images` are prompt-only scaffolding; the CLI does not expose them as dedicated flags.
-
-Execution details such as explicit CLI flags, `quality`, `input_fidelity`, masks, output formats, and local output paths depend on mode. Use the built-in tool by default, including simple transparent-image requests. For transparent images, prompt for a flat chroma-key background and remove it locally with `python "${CODEX_HOME:-$HOME/.codex}/skills/.system/imagegen/scripts/remove_chroma_key.py"`; only apply CLI-specific controls when the user explicitly opts into fallback mode or explicitly confirms that the transparent request should use true CLI transparency.
-
-CLI model notes:
-- `gpt-image-2` is the fallback CLI default for new workflows.
-- `gpt-image-2` supports `quality` values `low`, `medium`, `high`, and `auto`.
-- For 4K-style `gpt-image-2` output, use `3840x2160` or `2160x3840`.
-- If transparent output needs true CLI fallback, ask before using `gpt-image-1.5` unless the user already explicitly requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback. Explain that built-in chroma-key removal is the default path, but `gpt-image-2` does not support `background=transparent`.
-- Do not set `input_fidelity` with `gpt-image-2`; image inputs already use high fidelity.
-
-For prompting principles (structure, specificity, invariants, iteration), see `references/prompting.md`.
-
-## Generate
-
-### photorealistic-natural
-```
-Use case: photorealistic-natural
-Primary request: candid photo of an elderly sailor on a small fishing boat adjusting a net
-Scene/backdrop: coastal water with soft haze
-Subject: weathered skin with wrinkles and sun texture
-Style/medium: photorealistic candid photo
-Composition/framing: medium close-up, eye-level
-Lighting/mood: soft coastal daylight, shallow depth of field, subtle film grain
-Materials/textures: real skin texture, worn fabric, salt-worn wood
-Constraints: natural color balance; no heavy retouching; no glamorization; no watermark
-Avoid: studio polish; staged look
-```
-
-### product-mockup
-```
-Use case: product-mockup
-Primary request: premium product photo of a matte black shampoo bottle with a minimal label
-Scene/backdrop: clean studio gradient from light gray to white
-Subject: single bottle centered with subtle reflection
-Style/medium: premium product photography
-Composition/framing: centered, slight three-quarter angle, generous padding
-Lighting/mood: softbox lighting, clean highlights, controlled shadows
-Materials/textures: matte plastic, crisp label printing
-Constraints: no logos or trademarks; no watermark
-```
-
-### ui-mockup
-```
-Use case: ui-mockup
-Primary request: mobile app home screen for a local farmers market with vendors and daily specials
-Asset type: mobile app screen
-Style/medium: realistic product UI, not concept art
-Composition/framing: clean vertical mobile layout with clear hierarchy
-Constraints: practical layout, clear typography, no logos or trademarks, no watermark
-```
-
-### infographic-diagram
-```
-Use case: infographic-diagram
-Primary request: detailed infographic of an automatic coffee machine flow
-Scene/backdrop: clean, light neutral background
-Subject: bean hopper -> grinder -> brew group -> boiler -> water tank -> drip tray
-Style/medium: clean vector-like infographic with clear callouts and arrows
-Composition/framing: vertical poster layout, top-to-bottom flow
-Text (verbatim): "Bean Hopper", "Grinder", "Brew Group", "Boiler", "Water Tank", "Drip Tray"
-Constraints: clear labels, strong contrast, no logos or trademarks, no watermark
-```
-
-### scientific-educational
-```
-Use case: scientific-educational
-Primary request: biology diagram titled "Cellular Respiration at a Glance" for high school students
-Scene/backdrop: clean white classroom handout background
-Subject: glucose turns into energy inside a cell; include glycolysis, Krebs cycle, and electron transport chain
-Style/medium: flat scientific diagram with consistent icons, arrows, and readable labels
-Composition/framing: landscape slide-style layout with clear hierarchy and generous whitespace
-Text (verbatim): "Cellular Respiration at a Glance", "Glucose", "Pyruvate", "ATP", "NADH", "FADH2", "CO2", "O2", "H2O"
-Constraints: scientifically plausible; avoid tiny text; no extra decoration; no watermark
-```
-
-### logo-brand
-```
-Use case: logo-brand
-Primary request: original logo for "Field & Flour", a local bakery
-Style/medium: vector logo mark; flat colors; minimal
-Composition/framing: single centered logo on a plain background with generous padding
-Constraints: strong silhouette, balanced negative space; original design only; no gradients unless essential; no trademarks; no watermark
-```
-
-### illustration-story
-```
-Use case: illustration-story
-Primary request: 4-panel comic about a pet left alone at home
-Scene/backdrop: cozy living room across panels
-Subject: pet reacting to the owner leaving, then relaxing, then returning to a composed pose
-Style/medium: comic illustration with clear panels
-Composition/framing: 4 equal-sized vertical panels, readable actions per panel
-Constraints: no text; no logos or trademarks; no watermark
-```
-
-### stylized-concept
-```
-Use case: stylized-concept
-Primary request: cavernous hangar interior with tall support beams and drifting fog
-Scene/backdrop: industrial hangar interior, deep scale, light haze
-Subject: compact shuttle parked near the center
-Style/medium: cinematic concept art, industrial realism
-Composition/framing: wide-angle, low-angle
-Lighting/mood: volumetric light rays cutting through fog
-Constraints: no logos or trademarks; no watermark
-```
-
-### ads-marketing
-```
-Use case: ads-marketing
-Primary request: campaign image for a streetwear brand called Thread
-Subject: group of friends hanging out together in a stylish urban setting
-Style/medium: polished youth streetwear campaign photography
-Composition/framing: vertical ad layout with natural poses and integrated headline space
-Lighting/mood: contemporary, energetic, tasteful
-Text (verbatim): "Yours to Create."
-Constraints: render the tagline exactly once; clean legible typography; no extra text; no watermarks; no unrelated logos
-```
-
-### productivity-visual
-```
-Use case: productivity-visual
-Primary request: one pitch-deck slide titled "Market Opportunity"
-Asset type: fundraising slide image
-Style/medium: clean modern deck slide, white background, crisp sans-serif typography
-Subject: TAM/SAM/SOM concentric-circle diagram plus a small growth bar chart from 2021 to 2026
-Composition/framing: 16:9 landscape slide, clear data hierarchy, polished spacing
-Text (verbatim): "Market Opportunity", "TAM: $42B", "SAM: $8.7B", "SOM: $340M", "AGI Research, 2024", "Internal analysis"
-Constraints: readable labels, no clip art, no stock photography, no decorative clutter, no watermark
-```
-
-### historical-scene
-```
-Use case: historical-scene
-Primary request: outdoor crowd scene in Bethel, New York on August 16, 1969
-Scene/backdrop: open field with period-appropriate staging
-Subject: crowd in period-accurate clothing, authentic environment
-Style/medium: photorealistic photo
-Composition/framing: wide shot, eye-level
-Constraints: period-accurate details; no modern objects; no logos or trademarks; no watermark
-```
-
-## Asset type templates (taxonomy-aligned)
-
-### Website assets template
-```
-Use case: <photorealistic-natural|stylized-concept|product-mockup|infographic-diagram|ui-mockup>
-Asset type: <hero image / section illustration / blog header>
-Primary request: <short description>
-Scene/backdrop: <environment or abstract backdrop>
-Subject: <main subject>
-Style/medium: <photo/illustration/3D>
-Composition/framing: <wide/centered; note usable negative space only if needed>
-Lighting/mood: <soft/bright/neutral>
-Color palette: <brand colors or neutral>
-Constraints: <no text; no logos; no watermark; leave room for UI if needed>
-```
-
-### Website assets example: minimal hero background
-```
-Use case: stylized-concept
-Asset type: landing page hero background
-Primary request: minimal abstract background with a soft gradient and subtle texture
-Style/medium: matte illustration / soft-rendered abstract background
-Composition/framing: wide composition with usable negative space for page copy
-Lighting/mood: gentle studio glow
-Color palette: restrained neutral palette
-Constraints: no text; no logos; no watermark
-```
-
-### Website assets example: feature section illustration
-```
-Use case: stylized-concept
-Asset type: feature section illustration
-Primary request: simple abstract shapes suggesting connection and flow
-Scene/backdrop: subtle light-gray backdrop with faint texture
-Style/medium: flat illustration; soft shadows; restrained contrast
-Composition/framing: centered cluster; open margins for UI
-Color palette: muted neutral palette
-Constraints: no text; no logos; no watermark
-```
-
-### Website assets example: blog header image
-```
-Use case: photorealistic-natural
-Asset type: blog header image
-Primary request: overhead desk scene with notebook, pen, and coffee cup
-Scene/backdrop: warm wooden tabletop
-Style/medium: photorealistic photo
-Composition/framing: wide crop with clean room for page copy
-Lighting/mood: soft morning light
-Constraints: no text; no logos; no watermark
-```
-
-### Game assets template
-```
-Use case: stylized-concept
-Asset type: <game environment concept art / game character concept / game UI icon / tileable game texture>
-Primary request: <biome/scene/character/icon/material>
-Scene/backdrop: <location + set dressing> (if applicable)
-Subject: <main focal element(s)>
-Style/medium: <realistic/stylized>; <concept art / character render / UI icon / texture>
-Composition/framing: <wide/establishing/top-down>; <camera angle>; <focal point placement>
-Lighting/mood: <time of day>; <mood>; <volumetric/fog/etc>
-Constraints: no logos or trademarks; no watermark
-```
-
-### Game assets example: environment concept art
-```
-Use case: stylized-concept
-Asset type: game environment concept art
-Primary request: cavernous hangar interior with tall support beams and drifting fog
-Scene/backdrop: industrial hangar interior, deep scale, light haze
-Subject: compact shuttle parked near the center
-Style/medium: cinematic concept art, industrial realism
-Composition/framing: wide-angle, low-angle
-Lighting/mood: volumetric light rays cutting through fog
-Constraints: no logos or trademarks; no watermark
-```
-
-### Game assets example: character concept
-```
-Use case: stylized-concept
-Asset type: game character concept
-Primary request: desert scout character with layered travel gear
-Subject: long coat, satchel, practical travel clothing
-Style/medium: character render; stylized realism
-Composition/framing: neutral hero pose on a simple backdrop
-Constraints: no logos or trademarks; no watermark
-```
-
-### Game assets example: UI icon
-```
-Use case: stylized-concept
-Asset type: game UI icon
-Primary request: round shield icon with a subtle rune pattern
-Style/medium: painted game UI icon
-Composition/framing: centered icon; generous padding; clear silhouette
-Constraints: no text; no background scene elements; no logos or trademarks; no watermark
-```
-
-### Game assets example: tileable texture
-```
-Use case: stylized-concept
-Asset type: tileable game texture
-Primary request: worn sandstone blocks
-Style/medium: seamless tileable texture; PBR-ish look
-Scene/backdrop: neutral lighting reference only
-Constraints: seamless edges; no obvious focal elements; no text; no logos or trademarks; no watermark
-```
-
-### Wireframe template
-```
-Use case: ui-mockup
-Asset type: website wireframe
-Primary request: <page or flow to sketch>
-Style/medium: low-fi grayscale wireframe
-Composition/framing: <landscape or portrait to match expected device>
-Subject: <sections in order; grid/columns; key labels>
-Constraints: no color; no logos; no real photos; no watermark
-```
-
-### Wireframe example: homepage (desktop)
-```
-Use case: ui-mockup
-Asset type: website wireframe
-Primary request: SaaS homepage layout with clear hierarchy
-Style/medium: low-fi grayscale wireframe
-Subject: top nav; hero with headline and CTA; three feature cards; testimonial strip; pricing preview; footer
-Composition/framing: landscape desktop layout
-Constraints: label major blocks; no color; no logos; no real photos; no watermark
-```
-
-### Wireframe example: pricing page
-```
-Use case: ui-mockup
-Asset type: website wireframe
-Primary request: pricing page layout with comparison table
-Style/medium: low-fi grayscale wireframe
-Subject: header; plan toggle; 3 pricing cards; comparison table; FAQ accordion; footer
-Composition/framing: desktop or tablet layout
-Constraints: label key areas; no color; no logos; no real photos; no watermark
-```
-
-### Wireframe example: mobile onboarding flow
-```
-Use case: ui-mockup
-Asset type: mobile onboarding wireframe
-Primary request: three-screen mobile onboarding flow
-Style/medium: low-fi grayscale wireframe
-Subject: screen 1 headline and CTA; screen 2 feature bullets; screen 3 form fields and CTA
-Composition/framing: portrait mobile layout
-Constraints: label screens and blocks; no color; no logos; no real photos; no watermark
-```
-
-### Logo template
-```
-Use case: logo-brand
-Asset type: logo concept
-Primary request: <brand idea or symbol concept>
-Style/medium: vector logo mark; flat colors; minimal
-Composition/framing: centered mark; clear silhouette; generous margin
-Color palette: <1-2 colors; high contrast>
-Text (verbatim): "<exact name>" (only if needed)
-Constraints: no gradients; no mockups; no 3D; no watermark
-```
-
-### Logo example: abstract symbol mark
-```
-Use case: logo-brand
-Asset type: logo concept
-Primary request: geometric leaf symbol suggesting sustainability and growth
-Style/medium: vector logo mark; flat colors; minimal
-Composition/framing: centered mark; clear silhouette
-Color palette: deep green and off-white
-Constraints: no text unless requested; no gradients; no mockups; no 3D; no watermark
-```
-
-### Logo example: monogram mark
-```
-Use case: logo-brand
-Asset type: logo concept
-Primary request: interlocking monogram of the letters "AV"
-Style/medium: vector logo mark; flat colors; minimal
-Composition/framing: centered mark; balanced spacing
-Color palette: black on white
-Constraints: no gradients; no mockups; no 3D; no watermark
-```
-
-### Logo example: wordmark
-```
-Use case: logo-brand
-Asset type: logo concept
-Primary request: clean wordmark for a modern studio
-Style/medium: vector wordmark; flat colors; minimal
-Text (verbatim): "Studio North"
-Composition/framing: centered text; even letter spacing
-Constraints: no gradients; no mockups; no 3D; no watermark
-```
-
-## Edit
-
-### text-localization
-```
-Use case: text-localization
-Input images: Image 1: original infographic
-Primary request: replace "Bean Hopper", "Grinder", "Brew Group", "Boiler", "Water Tank", and "Drip Tray" with "Tolva", "Molino", "Grupo de infusión", "Caldera", "Depósito de agua", and "Bandeja de goteo"
-Constraints: change only the text; preserve layout, typography, spacing, and hierarchy; no extra words; do not alter logos or imagery
-```
-
-### identity-preserve
-```
-Use case: identity-preserve
-Input images: Image 1: person photo; Image 2..N: clothing references
-Primary request: replace only the clothing with the provided garments
-Constraints: preserve face, body shape, pose, hair, expression, and identity; match lighting and shadows; keep the background unchanged; no accessories or text
-```
-
-### precise-object-edit
-```
-Use case: precise-object-edit
-Input images: Image 1: room photo
-Primary request: replace only the white chairs with wooden chairs
-Constraints: preserve camera angle, room lighting, floor shadows, and surrounding objects; keep all other aspects unchanged
-```
-
-### lighting-weather
-```
-Use case: lighting-weather
-Input images: Image 1: original photo
-Primary request: make it look like a winter evening with gentle snowfall
-Constraints: preserve subject identity, geometry, camera angle, and composition; change only lighting, atmosphere, and weather
-```
-
-### background-extraction
-```
-Use case: background-extraction
-Input images: Image 1: product photo
-Primary request: isolate the product on a clean transparent background
-Scene/backdrop: perfectly flat solid #00ff00 chroma-key background for local background removal
-Constraints: background must be one uniform color with no shadows, gradients, texture, reflections, floor plane, or lighting variation; crisp silhouette; generous padding; no halos or fringing; preserve label text exactly; no restyling; do not use #00ff00 anywhere in the subject
-```
-
-Post-process note: after built-in generation, run `python "${CODEX_HOME:-$HOME/.codex}/skills/.system/imagegen/scripts/remove_chroma_key.py" --input <source> --out <final.png> --auto-key border --soft-matte --transparent-threshold 12 --opaque-threshold 220 --despill`. Ask before using CLI `gpt-image-1.5 --background transparent --output-format png` for true/native transparency, failed chroma-key validation, or complex subjects such as hair, fur, glass, smoke, liquids, translucent materials, reflections, or soft shadows, unless the user already explicitly requested `gpt-image-1.5`, `scripts/image_gen.py`, or CLI fallback.
-
-### style-transfer
-```
-Use case: style-transfer
-Input images: Image 1: style reference
-Primary request: apply Image 1's visual style to a man riding a motorcycle on a plain white backdrop
-Constraints: preserve palette, texture, and brushwork; no extra elements
-```
-
-### compositing
-```
-Use case: compositing
-Input images: Image 1: base scene; Image 2: subject to insert
-Primary request: place the subject from Image 2 next to the person in Image 1
-Constraints: match lighting, perspective, and scale; keep the base framing unchanged; no extra elements
-```
-
-### character consistency workflow
-```
-Use case: identity-preserve
-Input images: Image 1: previous character anchor illustration
-Primary request: continue the story with the same character in a new scene and action
-Scene/backdrop: snowy forest after a winter storm
-Subject: same young forest hero gently helping a frightened squirrel out of a fallen tree
-Style/medium: same children's book watercolor illustration style as Image 1
-Constraints: do not redesign the character; preserve facial features, proportions, outfit, color palette, and personality; no text; no watermark
-```
-
-### sketch-to-render
-```
-Use case: sketch-to-render
-Input images: Image 1: drawing
-Primary request: turn the drawing into a photorealistic image
-Constraints: preserve layout, proportions, and perspective; choose realistic materials and lighting; do not add new elements or text
-```
diff --git a/skills/imagegen/scripts/image_gen.py b/skills/imagegen/scripts/image_gen.py
deleted file mode 100644
index 9e0ea67..0000000
--- a/skills/imagegen/scripts/image_gen.py
+++ /dev/null
@@ -1,995 +0,0 @@
-#!/usr/bin/env python3
-"""Fallback CLI for explicit image generation or editing with GPT Image models.
-
-Used only when the user explicitly opts into CLI fallback mode, or when explicit
-transparent output requires the `gpt-image-1.5` fallback path.
-
-Defaults to gpt-image-2 and a structured prompt augmentation workflow.
-"""
-
-from __future__ import annotations
-
-import argparse
-import asyncio
-import base64
-import json
-import os
-from pathlib import Path
-import re
-import sys
-import time
-from typing import Any, Dict, Iterable, List, Optional, Tuple
-
-from io import BytesIO
-
-DEFAULT_MODEL = "gpt-image-2"
-DEFAULT_SIZE = "auto"
-DEFAULT_QUALITY = "medium"
-DEFAULT_OUTPUT_FORMAT = "png"
-DEFAULT_CONCURRENCY = 5
-DEFAULT_DOWNSCALE_SUFFIX = "-web"
-DEFAULT_OUTPUT_PATH = "output/imagegen/output.png"
-GPT_IMAGE_MODEL_PREFIX = "gpt-image-"
-
-ALLOWED_LEGACY_SIZES = {"1024x1024", "1536x1024", "1024x1536", "auto"}
-ALLOWED_QUALITIES = {"low", "medium", "high", "auto"}
-ALLOWED_BACKGROUNDS = {"transparent", "opaque", "auto", None}
-ALLOWED_INPUT_FIDELITIES = {"low", "high", None}
-
-GPT_IMAGE_2_MODEL = "gpt-image-2"
-GPT_IMAGE_2_MIN_PIXELS = 655_360
-GPT_IMAGE_2_MAX_PIXELS = 8_294_400
-GPT_IMAGE_2_MAX_EDGE = 3840
-GPT_IMAGE_2_MAX_RATIO = 3.0
-
-MAX_IMAGE_BYTES = 50 * 1024 * 1024
-MAX_BATCH_JOBS = 500
-
-
-def _die(message: str, code: int = 1) -> None:
-    print(f"Error: {message}", file=sys.stderr)
-    raise SystemExit(code)
-
-
-def _warn(message: str) -> None:
-    print(f"Warning: {message}", file=sys.stderr)
-
-
-def _dependency_hint(package: str, *, upgrade: bool = False) -> str:
-    command = f"uv pip install {'-U ' if upgrade else ''}{package}"
-    return (
-        "Activate the repo-selected environment first, then install it with "
-        f"`{command}`. If this repo uses a local virtualenv, start with "
-        "`source .venv/bin/activate`; otherwise use this repo's configured shared fallback "
-        "environment. If your project declares dependencies, prefer that project's normal "
-        "`uv sync` flow."
-    )
-
-
-def _ensure_api_key(dry_run: bool) -> None:
-    if os.getenv("OPENAI_API_KEY"):
-        print("OPENAI_API_KEY is set.", file=sys.stderr)
-        return
-    if dry_run:
-        _warn("OPENAI_API_KEY is not set; dry-run only.")
-        return
-    _die("OPENAI_API_KEY is not set. Export it before running.")
-
-
-def _read_prompt(prompt: Optional[str], prompt_file: Optional[str]) -> str:
-    if prompt and prompt_file:
-        _die("Use --prompt or --prompt-file, not both.")
-    if prompt_file:
-        path = Path(prompt_file)
-        if not path.exists():
-            _die(f"Prompt file not found: {path}")
-        return path.read_text(encoding="utf-8").strip()
-    if prompt:
-        return prompt.strip()
-    _die("Missing prompt. Use --prompt or --prompt-file.")
-    return ""  # unreachable
-
-
-def _check_image_paths(paths: Iterable[str]) -> List[Path]:
-    resolved: List[Path] = []
-    for raw in paths:
-        path = Path(raw)
-        if not path.exists():
-            _die(f"Image file not found: {path}")
-        if path.stat().st_size > MAX_IMAGE_BYTES:
-            _warn(f"Image exceeds 50MB limit: {path}")
-        resolved.append(path)
-    return resolved
-
-
-def _normalize_output_format(fmt: Optional[str]) -> str:
-    if not fmt:
-        return DEFAULT_OUTPUT_FORMAT
-    fmt = fmt.lower()
-    if fmt not in {"png", "jpeg", "jpg", "webp"}:
-        _die("output-format must be png, jpeg, jpg, or webp.")
-    return "jpeg" if fmt == "jpg" else fmt
-
-
-def _parse_size(size: str) -> Optional[Tuple[int, int]]:
-    match = re.fullmatch(r"([1-9][0-9]*)x([1-9][0-9]*)", size)
-    if not match:
-        return None
-    return int(match.group(1)), int(match.group(2))
-
-
-def _validate_gpt_image_2_size(size: str) -> None:
-    if size == "auto":
-        return
-
-    parsed = _parse_size(size)
-    if parsed is None:
-        _die("size must be auto or WIDTHxHEIGHT, for example 1024x1024.")
-
-    width, height = parsed
-    max_edge = max(width, height)
-    min_edge = min(width, height)
-    total_pixels = width * height
-
-    if max_edge > GPT_IMAGE_2_MAX_EDGE:
-        _die("gpt-image-2 size maximum edge length must be less than or equal to 3840px.")
-    if width % 16 != 0 or height % 16 != 0:
-        _die("gpt-image-2 size width and height must be multiples of 16px.")
-    if max_edge / min_edge > GPT_IMAGE_2_MAX_RATIO:
-        _die("gpt-image-2 size long edge to short edge ratio must not exceed 3:1.")
-    if total_pixels < GPT_IMAGE_2_MIN_PIXELS or total_pixels > GPT_IMAGE_2_MAX_PIXELS:
-        _die(
-            "gpt-image-2 size total pixels must be at least 655,360 and no more than 8,294,400."
-        )
-
-
-def _validate_size(size: str, model: str) -> None:
-    if model == GPT_IMAGE_2_MODEL:
-        _validate_gpt_image_2_size(size)
-        return
-
-    if size not in ALLOWED_LEGACY_SIZES:
-        _die(
-            "size must be one of 1024x1024, 1536x1024, 1024x1536, or auto for this GPT Image model."
-        )
-
-
-def _validate_quality(quality: str) -> None:
-    if quality not in ALLOWED_QUALITIES:
-        _die("quality must be one of low, medium, high, or auto.")
-
-
-def _validate_background(background: Optional[str]) -> None:
-    if background not in ALLOWED_BACKGROUNDS:
-        _die("background must be one of transparent, opaque, or auto.")
-
-
-def _validate_input_fidelity(input_fidelity: Optional[str]) -> None:
-    if input_fidelity not in ALLOWED_INPUT_FIDELITIES:
-        _die("input-fidelity must be one of low or high.")
-
-
-def _validate_model(model: str) -> None:
-    if not model.startswith(GPT_IMAGE_MODEL_PREFIX):
-        _die(
-            "model must be a GPT Image model (for example gpt-image-1.5, gpt-image-1, or gpt-image-1-mini)."
-        )
-
-
-def _validate_transparency(background: Optional[str], output_format: str) -> None:
-    if background == "transparent" and output_format not in {"png", "webp"}:
-        _die("transparent background requires output-format png or webp.")
-
-
-def _validate_model_specific_options(
-    *,
-    model: str,
-    background: Optional[str],
-    input_fidelity: Optional[str] = None,
-) -> None:
-    if model != GPT_IMAGE_2_MODEL:
-        return
-    if background == "transparent":
-        _die(
-            "transparent backgrounds are not supported in gpt-image-2, the latest model. "
-            "Use --model gpt-image-1.5 --background transparent --output-format png instead."
-        )
-    if input_fidelity is not None:
-        _die(
-            "input_fidelity is not supported in gpt-image-2 because image inputs always use high fidelity for this model."
-        )
-
-
-def _validate_generate_payload(payload: Dict[str, Any]) -> None:
-    model = str(payload.get("model", DEFAULT_MODEL))
-    _validate_model(model)
-    n = int(payload.get("n", 1))
-    if n < 1 or n > 10:
-        _die("n must be between 1 and 10")
-    size = str(payload.get("size", DEFAULT_SIZE))
-    quality = str(payload.get("quality", DEFAULT_QUALITY))
-    background = payload.get("background")
-    _validate_size(size, model)
-    _validate_quality(quality)
-    _validate_background(background)
-    _validate_model_specific_options(model=model, background=background)
-    oc = payload.get("output_compression")
-    if oc is not None and not (0 <= int(oc) <= 100):
-        _die("output_compression must be between 0 and 100")
-
-
-def _build_output_paths(
-    out: str,
-    output_format: str,
-    count: int,
-    out_dir: Optional[str],
-) -> List[Path]:
-    ext = "." + output_format
-
-    if out_dir:
-        out_base = Path(out_dir)
-        out_base.mkdir(parents=True, exist_ok=True)
-        return [out_base / f"image_{i}{ext}" for i in range(1, count + 1)]
-
-    out_path = Path(out)
-    if out_path.exists() and out_path.is_dir():
-        out_path.mkdir(parents=True, exist_ok=True)
-        return [out_path / f"image_{i}{ext}" for i in range(1, count + 1)]
-
-    if out_path.suffix == "":
-        out_path = out_path.with_suffix(ext)
-    elif output_format and out_path.suffix.lstrip(".").lower() != output_format:
-        _warn(
-            f"Output extension {out_path.suffix} does not match output-format {output_format}."
-        )
-
-    if count == 1:
-        return [out_path]
-
-    return [
-        out_path.with_name(f"{out_path.stem}-{i}{out_path.suffix}")
-        for i in range(1, count + 1)
-    ]
-
-
-def _augment_prompt(args: argparse.Namespace, prompt: str) -> str:
-    fields = _fields_from_args(args)
-    return _augment_prompt_fields(args.augment, prompt, fields)
-
-
-def _augment_prompt_fields(augment: bool, prompt: str, fields: Dict[str, Optional[str]]) -> str:
-    if not augment:
-        return prompt
-
-    sections: List[str] = []
-    if fields.get("use_case"):
-        sections.append(f"Use case: {fields['use_case']}")
-    sections.append(f"Primary request: {prompt}")
-    if fields.get("scene"):
-        sections.append(f"Scene/background: {fields['scene']}")
-    if fields.get("subject"):
-        sections.append(f"Subject: {fields['subject']}")
-    if fields.get("style"):
-        sections.append(f"Style/medium: {fields['style']}")
-    if fields.get("composition"):
-        sections.append(f"Composition/framing: {fields['composition']}")
-    if fields.get("lighting"):
-        sections.append(f"Lighting/mood: {fields['lighting']}")
-    if fields.get("palette"):
-        sections.append(f"Color palette: {fields['palette']}")
-    if fields.get("materials"):
-        sections.append(f"Materials/textures: {fields['materials']}")
-    if fields.get("text"):
-        sections.append(f"Text (verbatim): \"{fields['text']}\"")
-    if fields.get("constraints"):
-        sections.append(f"Constraints: {fields['constraints']}")
-    if fields.get("negative"):
-        sections.append(f"Avoid: {fields['negative']}")
-
-    return "\n".join(sections)
-
-
-def _fields_from_args(args: argparse.Namespace) -> Dict[str, Optional[str]]:
-    return {
-        "use_case": getattr(args, "use_case", None),
-        "scene": getattr(args, "scene", None),
-        "subject": getattr(args, "subject", None),
-        "style": getattr(args, "style", None),
-        "composition": getattr(args, "composition", None),
-        "lighting": getattr(args, "lighting", None),
-        "palette": getattr(args, "palette", None),
-        "materials": getattr(args, "materials", None),
-        "text": getattr(args, "text", None),
-        "constraints": getattr(args, "constraints", None),
-        "negative": getattr(args, "negative", None),
-    }
-
-
-def _print_request(payload: dict) -> None:
-    print(json.dumps(payload, indent=2, sort_keys=True))
-
-
-def _decode_and_write(images: List[str], outputs: List[Path], force: bool) -> None:
-    for idx, image_b64 in enumerate(images):
-        if idx >= len(outputs):
-            break
-        out_path = outputs[idx]
-        if out_path.exists() and not force:
-            _die(f"Output already exists: {out_path} (use --force to overwrite)")
-        out_path.parent.mkdir(parents=True, exist_ok=True)
-        out_path.write_bytes(base64.b64decode(image_b64))
-        print(f"Wrote {out_path}")
-
-
-def _derive_downscale_path(path: Path, suffix: str) -> Path:
-    if suffix and not suffix.startswith("-") and not suffix.startswith("_"):
-        suffix = "-" + suffix
-    return path.with_name(f"{path.stem}{suffix}{path.suffix}")
-
-
-def _downscale_image_bytes(image_bytes: bytes, *, max_dim: int, output_format: str) -> bytes:
-    try:
-        from PIL import Image
-    except Exception:
-        _die(f"Downscaling requires Pillow. {_dependency_hint('pillow')}")
-
-    if max_dim < 1:
-        _die("--downscale-max-dim must be >= 1")
-
-    with Image.open(BytesIO(image_bytes)) as img:
-        img.load()
-        w, h = img.size
-        scale = min(1.0, float(max_dim) / float(max(w, h)))
-        target = (max(1, int(round(w * scale))), max(1, int(round(h * scale))))
-
-        resized = img if target == (w, h) else img.resize(target, Image.Resampling.LANCZOS)
-
-        fmt = output_format.lower()
-        if fmt == "jpg":
-            fmt = "jpeg"
-
-        if fmt == "jpeg":
-            if resized.mode in ("RGBA", "LA") or ("transparency" in getattr(resized, "info", {})):
-                bg = Image.new("RGB", resized.size, (255, 255, 255))
-                bg.paste(resized.convert("RGBA"), mask=resized.convert("RGBA").split()[-1])
-                resized = bg
-            else:
-                resized = resized.convert("RGB")
-
-        out = BytesIO()
-        resized.save(out, format=fmt.upper())
-        return out.getvalue()
-
-
-def _decode_write_and_downscale(
-    images: List[str],
-    outputs: List[Path],
-    *,
-    force: bool,
-    downscale_max_dim: Optional[int],
-    downscale_suffix: str,
-    output_format: str,
-) -> None:
-    for idx, image_b64 in enumerate(images):
-        if idx >= len(outputs):
-            break
-        out_path = outputs[idx]
-        if out_path.exists() and not force:
-            _die(f"Output already exists: {out_path} (use --force to overwrite)")
-        out_path.parent.mkdir(parents=True, exist_ok=True)
-
-        raw = base64.b64decode(image_b64)
-        out_path.write_bytes(raw)
-        print(f"Wrote {out_path}")
-
-        if downscale_max_dim is None:
-            continue
-
-        derived = _derive_downscale_path(out_path, downscale_suffix)
-        if derived.exists() and not force:
-            _die(f"Output already exists: {derived} (use --force to overwrite)")
-        derived.parent.mkdir(parents=True, exist_ok=True)
-        resized = _downscale_image_bytes(raw, max_dim=downscale_max_dim, output_format=output_format)
-        derived.write_bytes(resized)
-        print(f"Wrote {derived}")
-
-
-def _create_client():
-    try:
-        from openai import OpenAI
-    except ImportError:
-        _die(f"openai SDK not installed in the active environment. {_dependency_hint('openai')}")
-    return OpenAI()
-
-
-def _create_async_client():
-    try:
-        from openai import AsyncOpenAI
-    except ImportError:
-        try:
-            import openai as _openai  # noqa: F401
-        except ImportError:
-            _die(
-                f"openai SDK not installed in the active environment. {_dependency_hint('openai')}"
-            )
-        _die(
-            "AsyncOpenAI not available in this openai SDK version. "
-            f"{_dependency_hint('openai', upgrade=True)}"
-        )
-    return AsyncOpenAI()
-
-
-def _slugify(value: str) -> str:
-    value = value.strip().lower()
-    value = re.sub(r"[^a-z0-9]+", "-", value)
-    value = re.sub(r"-{2,}", "-", value).strip("-")
-    return value[:60] if value else "job"
-
-
-def _normalize_job(job: Any, idx: int) -> Dict[str, Any]:
-    if isinstance(job, str):
-        prompt = job.strip()
-        if not prompt:
-            _die(f"Empty prompt at job {idx}")
-        return {"prompt": prompt}
-    if isinstance(job, dict):
-        if "prompt" not in job or not str(job["prompt"]).strip():
-            _die(f"Missing prompt for job {idx}")
-        return job
-    _die(f"Invalid job at index {idx}: expected string or object.")
-    return {}  # unreachable
-
-
-def _read_jobs_jsonl(path: str) -> List[Dict[str, Any]]:
-    p = Path(path)
-    if not p.exists():
-        _die(f"Input file not found: {p}")
-    jobs: List[Dict[str, Any]] = []
-    for line_no, raw in enumerate(p.read_text(encoding="utf-8").splitlines(), start=1):
-        line = raw.strip()
-        if not line or line.startswith("#"):
-            continue
-        try:
-            item: Any
-            if line.startswith("{"):
-                item = json.loads(line)
-            else:
-                item = line
-            jobs.append(_normalize_job(item, idx=line_no))
-        except json.JSONDecodeError as exc:
-            _die(f"Invalid JSON on line {line_no}: {exc}")
-    if not jobs:
-        _die("No jobs found in input file.")
-    if len(jobs) > MAX_BATCH_JOBS:
-        _die(f"Too many jobs ({len(jobs)}). Max is {MAX_BATCH_JOBS}.")
-    return jobs
-
-
-def _merge_non_null(dst: Dict[str, Any], src: Dict[str, Any]) -> Dict[str, Any]:
-    merged = dict(dst)
-    for k, v in src.items():
-        if v is not None:
-            merged[k] = v
-    return merged
-
-
-def _job_output_paths(
-    *,
-    out_dir: Path,
-    output_format: str,
-    idx: int,
-    prompt: str,
-    n: int,
-    explicit_out: Optional[str],
-) -> List[Path]:
-    out_dir.mkdir(parents=True, exist_ok=True)
-    ext = "." + output_format
-
-    if explicit_out:
-        base = Path(explicit_out)
-        if base.suffix == "":
-            base = base.with_suffix(ext)
-        elif base.suffix.lstrip(".").lower() != output_format:
-            _warn(
-                f"Job {idx}: output extension {base.suffix} does not match output-format {output_format}."
-            )
-        base = out_dir / base.name
-    else:
-        slug = _slugify(prompt[:80])
-        base = out_dir / f"{idx:03d}-{slug}{ext}"
-
-    if n == 1:
-        return [base]
-    return [
-        base.with_name(f"{base.stem}-{i}{base.suffix}")
-        for i in range(1, n + 1)
-    ]
-
-
-def _extract_retry_after_seconds(exc: Exception) -> Optional[float]:
-    # Best-effort: openai SDK errors vary by version. Prefer a conservative fallback.
-    for attr in ("retry_after", "retry_after_seconds"):
-        val = getattr(exc, attr, None)
-        if isinstance(val, (int, float)) and val >= 0:
-            return float(val)
-    msg = str(exc)
-    m = re.search(r"retry[- ]after[:= ]+([0-9]+(?:\\.[0-9]+)?)", msg, re.IGNORECASE)
-    if m:
-        try:
-            return float(m.group(1))
-        except Exception:
-            return None
-    return None
-
-
-def _is_rate_limit_error(exc: Exception) -> bool:
-    name = exc.__class__.__name__.lower()
-    if "ratelimit" in name or "rate_limit" in name:
-        return True
-    msg = str(exc).lower()
-    return "429" in msg or "rate limit" in msg or "too many requests" in msg
-
-
-def _is_transient_error(exc: Exception) -> bool:
-    if _is_rate_limit_error(exc):
-        return True
-    name = exc.__class__.__name__.lower()
-    if "timeout" in name or "timedout" in name or "tempor" in name:
-        return True
-    msg = str(exc).lower()
-    return "timeout" in msg or "timed out" in msg or "connection reset" in msg
-
-
-async def _generate_one_with_retries(
-    client: Any,
-    payload: Dict[str, Any],
-    *,
-    attempts: int,
-    job_label: str,
-) -> Any:
-    last_exc: Optional[Exception] = None
-    for attempt in range(1, attempts + 1):
-        try:
-            return await client.images.generate(**payload)
-        except Exception as exc:
-            last_exc = exc
-            if not _is_transient_error(exc):
-                raise
-            if attempt == attempts:
-                raise
-            sleep_s = _extract_retry_after_seconds(exc)
-            if sleep_s is None:
-                sleep_s = min(60.0, 2.0**attempt)
-            print(
-                f"{job_label} attempt {attempt}/{attempts} failed ({exc.__class__.__name__}); retrying in {sleep_s:.1f}s",
-                file=sys.stderr,
-            )
-            await asyncio.sleep(sleep_s)
-    raise last_exc or RuntimeError("unknown error")
-
-
-async def _run_generate_batch(args: argparse.Namespace) -> int:
-    jobs = _read_jobs_jsonl(args.input)
-    out_dir = Path(args.out_dir)
-
-    base_fields = _fields_from_args(args)
-    base_payload = {
-        "model": args.model,
-        "n": args.n,
-        "size": args.size,
-        "quality": args.quality,
-        "background": args.background,
-        "output_format": args.output_format,
-        "output_compression": args.output_compression,
-        "moderation": args.moderation,
-    }
-
-    if args.dry_run:
-        for i, job in enumerate(jobs, start=1):
-            prompt = str(job["prompt"]).strip()
-            fields = _merge_non_null(base_fields, job.get("fields", {}))
-            # Allow flat job keys as well (use_case, scene, etc.)
-            fields = _merge_non_null(fields, {k: job.get(k) for k in base_fields.keys()})
-            augmented = _augment_prompt_fields(args.augment, prompt, fields)
-
-            job_payload = dict(base_payload)
-            job_payload["prompt"] = augmented
-            job_payload = _merge_non_null(job_payload, {k: job.get(k) for k in base_payload.keys()})
-            job_payload = {k: v for k, v in job_payload.items() if v is not None}
-
-            _validate_generate_payload(job_payload)
-            effective_output_format = _normalize_output_format(job_payload.get("output_format"))
-            _validate_transparency(job_payload.get("background"), effective_output_format)
-            job_payload["output_format"] = effective_output_format
-
-            n = int(job_payload.get("n", 1))
-            outputs = _job_output_paths(
-                out_dir=out_dir,
-                output_format=effective_output_format,
-                idx=i,
-                prompt=prompt,
-                n=n,
-                explicit_out=job.get("out"),
-            )
-            downscaled = None
-            if args.downscale_max_dim is not None:
-                downscaled = [
-                    str(_derive_downscale_path(p, args.downscale_suffix)) for p in outputs
-                ]
-            _print_request(
-                {
-                    "endpoint": "/v1/images/generations",
-                    "job": i,
-                    "outputs": [str(p) for p in outputs],
-                    "outputs_downscaled": downscaled,
-                    **job_payload,
-                }
-            )
-        return 0
-
-    client = _create_async_client()
-    sem = asyncio.Semaphore(args.concurrency)
-
-    any_failed = False
-
-    async def run_job(i: int, job: Dict[str, Any]) -> Tuple[int, Optional[str]]:
-        nonlocal any_failed
-        prompt = str(job["prompt"]).strip()
-        job_label = f"[job {i}/{len(jobs)}]"
-
-        fields = _merge_non_null(base_fields, job.get("fields", {}))
-        fields = _merge_non_null(fields, {k: job.get(k) for k in base_fields.keys()})
-        augmented = _augment_prompt_fields(args.augment, prompt, fields)
-
-        payload = dict(base_payload)
-        payload["prompt"] = augmented
-        payload = _merge_non_null(payload, {k: job.get(k) for k in base_payload.keys()})
-        payload = {k: v for k, v in payload.items() if v is not None}
-
-        n = int(payload.get("n", 1))
-        _validate_generate_payload(payload)
-        effective_output_format = _normalize_output_format(payload.get("output_format"))
-        _validate_transparency(payload.get("background"), effective_output_format)
-        payload["output_format"] = effective_output_format
-        outputs = _job_output_paths(
-            out_dir=out_dir,
-            output_format=effective_output_format,
-            idx=i,
-            prompt=prompt,
-            n=n,
-            explicit_out=job.get("out"),
-        )
-        try:
-            async with sem:
-                print(f"{job_label} starting", file=sys.stderr)
-                started = time.time()
-                result = await _generate_one_with_retries(
-                    client,
-                    payload,
-                    attempts=args.max_attempts,
-                    job_label=job_label,
-                )
-                elapsed = time.time() - started
-                print(f"{job_label} completed in {elapsed:.1f}s", file=sys.stderr)
-            images = [item.b64_json for item in result.data]
-            _decode_write_and_downscale(
-                images,
-                outputs,
-                force=args.force,
-                downscale_max_dim=args.downscale_max_dim,
-                downscale_suffix=args.downscale_suffix,
-                output_format=effective_output_format,
-            )
-            return i, None
-        except Exception as exc:
-            any_failed = True
-            print(f"{job_label} failed: {exc}", file=sys.stderr)
-            if args.fail_fast:
-                raise
-            return i, str(exc)
-
-    tasks = [asyncio.create_task(run_job(i, job)) for i, job in enumerate(jobs, start=1)]
-
-    try:
-        await asyncio.gather(*tasks)
-    except Exception:
-        for t in tasks:
-            if not t.done():
-                t.cancel()
-        raise
-
-    return 1 if any_failed else 0
-
-
-def _generate_batch(args: argparse.Namespace) -> None:
-    exit_code = asyncio.run(_run_generate_batch(args))
-    if exit_code:
-        raise SystemExit(exit_code)
-
-
-def _generate(args: argparse.Namespace) -> None:
-    prompt = _read_prompt(args.prompt, args.prompt_file)
-    prompt = _augment_prompt(args, prompt)
-
-    payload = {
-        "model": args.model,
-        "prompt": prompt,
-        "n": args.n,
-        "size": args.size,
-        "quality": args.quality,
-        "background": args.background,
-        "output_format": args.output_format,
-        "output_compression": args.output_compression,
-        "moderation": args.moderation,
-    }
-    payload = {k: v for k, v in payload.items() if v is not None}
-
-    output_format = _normalize_output_format(args.output_format)
-    _validate_transparency(args.background, output_format)
-    payload["output_format"] = output_format
-    output_paths = _build_output_paths(args.out, output_format, args.n, args.out_dir)
-    downscaled = None
-    if args.downscale_max_dim is not None:
-        downscaled = [str(_derive_downscale_path(p, args.downscale_suffix)) for p in output_paths]
-
-    if args.dry_run:
-        _print_request(
-            {
-                "endpoint": "/v1/images/generations",
-                "outputs": [str(p) for p in output_paths],
-                "outputs_downscaled": downscaled,
-                **payload,
-            }
-        )
-        return
-
-    print(
-        "Calling Image API (generation). This can take up to a couple of minutes.",
-        file=sys.stderr,
-    )
-    started = time.time()
-    client = _create_client()
-    result = client.images.generate(**payload)
-    elapsed = time.time() - started
-    print(f"Generation completed in {elapsed:.1f}s.", file=sys.stderr)
-
-    images = [item.b64_json for item in result.data]
-    _decode_write_and_downscale(
-        images,
-        output_paths,
-        force=args.force,
-        downscale_max_dim=args.downscale_max_dim,
-        downscale_suffix=args.downscale_suffix,
-        output_format=output_format,
-    )
-
-
-def _edit(args: argparse.Namespace) -> None:
-    prompt = _read_prompt(args.prompt, args.prompt_file)
-    prompt = _augment_prompt(args, prompt)
-
-    image_paths = _check_image_paths(args.image)
-    mask_path = Path(args.mask) if args.mask else None
-    if mask_path:
-        if not mask_path.exists():
-            _die(f"Mask file not found: {mask_path}")
-        if mask_path.suffix.lower() != ".png":
-            _warn(f"Mask should be a PNG with an alpha channel: {mask_path}")
-        if mask_path.stat().st_size > MAX_IMAGE_BYTES:
-            _warn(f"Mask exceeds 50MB limit: {mask_path}")
-
-    payload = {
-        "model": args.model,
-        "prompt": prompt,
-        "n": args.n,
-        "size": args.size,
-        "quality": args.quality,
-        "background": args.background,
-        "output_format": args.output_format,
-        "output_compression": args.output_compression,
-        "input_fidelity": args.input_fidelity,
-        "moderation": args.moderation,
-    }
-    payload = {k: v for k, v in payload.items() if v is not None}
-
-    output_format = _normalize_output_format(args.output_format)
-    _validate_transparency(args.background, output_format)
-    payload["output_format"] = output_format
-    _validate_input_fidelity(args.input_fidelity)
-    output_paths = _build_output_paths(args.out, output_format, args.n, args.out_dir)
-    downscaled = None
-    if args.downscale_max_dim is not None:
-        downscaled = [str(_derive_downscale_path(p, args.downscale_suffix)) for p in output_paths]
-
-    if args.dry_run:
-        payload_preview = dict(payload)
-        payload_preview["image"] = [str(p) for p in image_paths]
-        if mask_path:
-            payload_preview["mask"] = str(mask_path)
-        _print_request(
-            {
-                "endpoint": "/v1/images/edits",
-                "outputs": [str(p) for p in output_paths],
-                "outputs_downscaled": downscaled,
-                **payload_preview,
-            }
-        )
-        return
-
-    print(
-        f"Calling Image API (edit) with {len(image_paths)} image(s).",
-        file=sys.stderr,
-    )
-    started = time.time()
-    client = _create_client()
-
-    with _open_files(image_paths) as image_files, _open_mask(mask_path) as mask_file:
-        request = dict(payload)
-        request["image"] = image_files if len(image_files) > 1 else image_files[0]
-        if mask_file is not None:
-            request["mask"] = mask_file
-        result = client.images.edit(**request)
-
-    elapsed = time.time() - started
-    print(f"Edit completed in {elapsed:.1f}s.", file=sys.stderr)
-    images = [item.b64_json for item in result.data]
-    _decode_write_and_downscale(
-        images,
-        output_paths,
-        force=args.force,
-        downscale_max_dim=args.downscale_max_dim,
-        downscale_suffix=args.downscale_suffix,
-        output_format=output_format,
-    )
-
-
-def _open_files(paths: List[Path]):
-    return _FileBundle(paths)
-
-
-def _open_mask(mask_path: Optional[Path]):
-    if mask_path is None:
-        return _NullContext()
-    return _SingleFile(mask_path)
-
-
-class _NullContext:
-    def __enter__(self):
-        return None
-
-    def __exit__(self, exc_type, exc, tb):
-        return False
-
-
-class _SingleFile:
-    def __init__(self, path: Path):
-        self._path = path
-        self._handle = None
-
-    def __enter__(self):
-        self._handle = self._path.open("rb")
-        return self._handle
-
-    def __exit__(self, exc_type, exc, tb):
-        if self._handle:
-            try:
-                self._handle.close()
-            except Exception:
-                pass
-        return False
-
-
-class _FileBundle:
-    def __init__(self, paths: List[Path]):
-        self._paths = paths
-        self._handles: List[object] = []
-
-    def __enter__(self):
-        self._handles = [p.open("rb") for p in self._paths]
-        return self._handles
-
-    def __exit__(self, exc_type, exc, tb):
-        for handle in self._handles:
-            try:
-                handle.close()
-            except Exception:
-                pass
-        return False
-
-
-def _add_shared_args(parser: argparse.ArgumentParser) -> None:
-    parser.add_argument("--model", default=DEFAULT_MODEL)
-    parser.add_argument("--prompt")
-    parser.add_argument("--prompt-file")
-    parser.add_argument("--n", type=int, default=1)
-    parser.add_argument("--size", default=DEFAULT_SIZE)
-    parser.add_argument("--quality", default=DEFAULT_QUALITY)
-    parser.add_argument("--background")
-    parser.add_argument("--output-format")
-    parser.add_argument("--output-compression", type=int)
-    parser.add_argument("--moderation")
-    parser.add_argument("--out", default=DEFAULT_OUTPUT_PATH)
-    parser.add_argument("--out-dir")
-    parser.add_argument("--force", action="store_true")
-    parser.add_argument("--dry-run", action="store_true")
-    parser.add_argument("--augment", dest="augment", action="store_true")
-    parser.add_argument("--no-augment", dest="augment", action="store_false")
-    parser.set_defaults(augment=True)
-
-    # Prompt augmentation hints
-    parser.add_argument("--use-case")
-    parser.add_argument("--scene")
-    parser.add_argument("--subject")
-    parser.add_argument("--style")
-    parser.add_argument("--composition")
-    parser.add_argument("--lighting")
-    parser.add_argument("--palette")
-    parser.add_argument("--materials")
-    parser.add_argument("--text")
-    parser.add_argument("--constraints")
-    parser.add_argument("--negative")
-
-    # Post-processing (optional): generate an additional downscaled copy for fast web loading.
-    parser.add_argument("--downscale-max-dim", type=int)
-    parser.add_argument("--downscale-suffix", default=DEFAULT_DOWNSCALE_SUFFIX)
-
-
-def main() -> int:
-    parser = argparse.ArgumentParser(
-        description="Fallback CLI for explicit image generation or editing via GPT Image models"
-    )
-    subparsers = parser.add_subparsers(dest="command", required=True)
-
-    gen_parser = subparsers.add_parser("generate", help="Create a new image")
-    _add_shared_args(gen_parser)
-    gen_parser.set_defaults(func=_generate)
-
-    batch_parser = subparsers.add_parser(
-        "generate-batch",
-        help="Generate multiple prompts concurrently (JSONL input)",
-    )
-    _add_shared_args(batch_parser)
-    batch_parser.add_argument("--input", required=True, help="Path to JSONL file (one job per line)")
-    batch_parser.add_argument("--concurrency", type=int, default=DEFAULT_CONCURRENCY)
-    batch_parser.add_argument("--max-attempts", type=int, default=3)
-    batch_parser.add_argument("--fail-fast", action="store_true")
-    batch_parser.set_defaults(func=_generate_batch)
-
-    edit_parser = subparsers.add_parser("edit", help="Edit an existing image")
-    _add_shared_args(edit_parser)
-    edit_parser.add_argument("--image", action="append", required=True)
-    edit_parser.add_argument("--mask")
-    edit_parser.add_argument("--input-fidelity")
-    edit_parser.set_defaults(func=_edit)
-
-    args = parser.parse_args()
-    if args.n < 1 or args.n > 10:
-        _die("--n must be between 1 and 10")
-    if getattr(args, "concurrency", 1) < 1 or getattr(args, "concurrency", 1) > 25:
-        _die("--concurrency must be between 1 and 25")
-    if getattr(args, "max_attempts", 3) < 1 or getattr(args, "max_attempts", 3) > 10:
-        _die("--max-attempts must be between 1 and 10")
-    if args.output_compression is not None and not (0 <= args.output_compression <= 100):
-        _die("--output-compression must be between 0 and 100")
-    if args.command == "generate-batch" and not args.out_dir:
-        _die("generate-batch requires --out-dir")
-    if getattr(args, "downscale_max_dim", None) is not None and args.downscale_max_dim < 1:
-        _die("--downscale-max-dim must be >= 1")
-
-    _validate_model(args.model)
-    _validate_size(args.size, args.model)
-    _validate_quality(args.quality)
-    _validate_background(args.background)
-    _validate_model_specific_options(
-        model=args.model,
-        background=args.background,
-        input_fidelity=getattr(args, "input_fidelity", None),
-    )
-    _ensure_api_key(args.dry_run)
-
-    args.func(args)
-    return 0
-
-
-if __name__ == "__main__":
-    raise SystemExit(main())
diff --git a/skills/imagegen/scripts/remove_chroma_key.py b/skills/imagegen/scripts/remove_chroma_key.py
deleted file mode 100644
index 5053987..0000000
--- a/skills/imagegen/scripts/remove_chroma_key.py
+++ /dev/null
@@ -1,440 +0,0 @@
-#!/usr/bin/env python3
-"""Remove a solid chroma-key background from an image.
-
-This helper supports the imagegen skill's built-in-first transparent workflow:
-generate an image on a flat key color, then convert that key color to alpha.
-"""
-
-from __future__ import annotations
-
-import argparse
-from io import BytesIO
-from pathlib import Path
-import re
-from statistics import median
-import sys
-from typing import Tuple
-
-
-Color = Tuple[int, int, int]
-KEY_DOMINANCE_THRESHOLD = 16.0
-ALPHA_NOISE_FLOOR = 8
-
-
-def _die(message: str, code: int = 1) -> None:
-    print(f"Error: {message}", file=sys.stderr)
-    raise SystemExit(code)
-
-
-def _dependency_hint(package: str) -> str:
-    return (
-        "Activate the repo-selected environment first, then install it with "
-        f"`uv pip install {package}`. If this repo uses a local virtualenv, start with "
-        "`source .venv/bin/activate`; otherwise use this repo's configured shared fallback "
-        "environment."
-    )
-
-
-def _load_pillow():
-    try:
-        from PIL import Image, ImageFilter
-    except ImportError:
-        _die(f"Pillow is required for chroma-key removal. {_dependency_hint('pillow')}")
-    return Image, ImageFilter
-
-
-def _parse_key_color(raw: str) -> Color:
-    value = raw.strip()
-    match = re.fullmatch(r"#?([0-9a-fA-F]{6})", value)
-    if not match:
-        _die("key color must be a hex RGB value like #00ff00.")
-    hex_value = match.group(1)
-    return (
-        int(hex_value[0:2], 16),
-        int(hex_value[2:4], 16),
-        int(hex_value[4:6], 16),
-    )
-
-
-def _validate_args(args: argparse.Namespace) -> None:
-    if args.tolerance < 0 or args.tolerance > 255:
-        _die("--tolerance must be between 0 and 255.")
-    if args.transparent_threshold < 0 or args.transparent_threshold > 255:
-        _die("--transparent-threshold must be between 0 and 255.")
-    if args.opaque_threshold < 0 or args.opaque_threshold > 255:
-        _die("--opaque-threshold must be between 0 and 255.")
-    if args.soft_matte and args.transparent_threshold >= args.opaque_threshold:
-        _die("--transparent-threshold must be lower than --opaque-threshold.")
-    if args.edge_feather < 0 or args.edge_feather > 64:
-        _die("--edge-feather must be between 0 and 64.")
-    if args.edge_contract < 0 or args.edge_contract > 16:
-        _die("--edge-contract must be between 0 and 16.")
-
-    src = Path(args.input)
-    if not src.exists():
-        _die(f"Input image not found: {src}")
-
-    out = Path(args.out)
-    if out.exists() and not args.force:
-        _die(f"Output already exists: {out} (use --force to overwrite)")
-
-    if out.suffix.lower() not in {".png", ".webp"}:
-        _die("--out must end in .png or .webp so the alpha channel is preserved.")
-
-
-def _channel_distance(a: Color, b: Color) -> int:
-    return max(abs(a[0] - b[0]), abs(a[1] - b[1]), abs(a[2] - b[2]))
-
-
-def _clamp_channel(value: float) -> int:
-    return max(0, min(255, int(round(value))))
-
-
-def _smoothstep(value: float) -> float:
-    value = max(0.0, min(1.0, value))
-    return value * value * (3.0 - 2.0 * value)
-
-
-def _soft_alpha(distance: int, transparent_threshold: float, opaque_threshold: float) -> int:
-    if distance <= transparent_threshold:
-        return 0
-    if distance >= opaque_threshold:
-        return 255
-    ratio = (float(distance) - transparent_threshold) / (
-        opaque_threshold - transparent_threshold
-    )
-    return _clamp_channel(255.0 * _smoothstep(ratio))
-
-
-def _dominance_alpha(rgb: Color, key: Color) -> int:
-    spill_channels = _spill_channels(key)
-    if not spill_channels:
-        return 255
-
-    channels = [float(value) for value in rgb]
-    non_spill = [idx for idx in range(3) if idx not in spill_channels]
-    key_strength = (
-        min(channels[idx] for idx in spill_channels)
-        if len(spill_channels) > 1
-        else channels[spill_channels[0]]
-    )
-    non_key_strength = max((channels[idx] for idx in non_spill), default=0.0)
-    dominance = key_strength - non_key_strength
-    if dominance <= 0:
-        return 255
-
-    denominator = max(1.0, float(max(key)) - non_key_strength)
-    alpha = 1.0 - min(1.0, dominance / denominator)
-    return _clamp_channel(alpha * 255.0)
-
-
-def _spill_channels(key: Color) -> list[int]:
-    key_max = max(key)
-    if key_max < 128:
-        return []
-    return [idx for idx, value in enumerate(key) if value >= key_max - 16 and value >= 128]
-
-
-def _key_channel_dominance(rgb: Color, key: Color) -> float:
-    spill_channels = _spill_channels(key)
-    if not spill_channels:
-        return 0.0
-
-    channels = [float(value) for value in rgb]
-    non_spill = [idx for idx in range(3) if idx not in spill_channels]
-    key_strength = (
-        min(channels[idx] for idx in spill_channels)
-        if len(spill_channels) > 1
-        else channels[spill_channels[0]]
-    )
-    non_key_strength = max((channels[idx] for idx in non_spill), default=0.0)
-    return key_strength - non_key_strength
-
-
-def _looks_key_colored(rgb: Color, key: Color, distance: int) -> bool:
-    if distance <= 32:
-        return True
-
-    spill_channels = _spill_channels(key)
-    if not spill_channels:
-        return True
-
-    return _key_channel_dominance(rgb, key) >= KEY_DOMINANCE_THRESHOLD
-
-
-def _cleanup_spill(rgb: Color, key: Color, alpha: int = 255) -> Color:
-    if alpha >= 252:
-        return rgb
-
-    spill_channels = _spill_channels(key)
-    if not spill_channels:
-        return rgb
-
-    channels = [float(value) for value in rgb]
-    non_spill = [idx for idx in range(3) if idx not in spill_channels]
-    if non_spill:
-        anchor = max(channels[idx] for idx in non_spill)
-        cap = max(0.0, anchor - 1.0)
-        for idx in spill_channels:
-            if channels[idx] > cap:
-                channels[idx] = cap
-
-    return (
-        _clamp_channel(channels[0]),
-        _clamp_channel(channels[1]),
-        _clamp_channel(channels[2]),
-    )
-
-
-def _apply_alpha_to_image(
-    image,
-    *,
-    key: Color,
-    tolerance: int,
-    spill_cleanup: bool,
-    soft_matte: bool,
-    transparent_threshold: float,
-    opaque_threshold: float,
-) -> int:
-    pixels = image.load()
-    width, height = image.size
-    transparent = 0
-
-    for y in range(height):
-        for x in range(width):
-            red, green, blue, alpha = pixels[x, y]
-            rgb = (red, green, blue)
-            distance = _channel_distance(rgb, key)
-            key_like = _looks_key_colored(rgb, key, distance)
-            output_alpha = (
-                min(
-                    _soft_alpha(distance, transparent_threshold, opaque_threshold),
-                    _dominance_alpha(rgb, key),
-                )
-                if soft_matte and key_like
-                else (0 if distance <= tolerance else 255)
-            )
-            output_alpha = int(round(output_alpha * (alpha / 255.0)))
-            if 0 < output_alpha <= ALPHA_NOISE_FLOOR:
-                output_alpha = 0
-
-            if output_alpha == 0:
-                pixels[x, y] = (0, 0, 0, 0)
-                transparent += 1
-                continue
-
-            if spill_cleanup and key_like:
-                red, green, blue = _cleanup_spill(rgb, key, output_alpha)
-            pixels[x, y] = (red, green, blue, output_alpha)
-
-    return transparent
-
-
-def _contract_alpha(image, pixels: int):
-    if pixels == 0:
-        return image
-
-    _, ImageFilter = _load_pillow()
-    alpha = image.getchannel("A")
-    for _ in range(pixels):
-        alpha = alpha.filter(ImageFilter.MinFilter(3))
-    image.putalpha(alpha)
-    return image
-
-
-def _apply_edge_feather(image, radius: float):
-    if radius == 0:
-        return image
-
-    _, ImageFilter = _load_pillow()
-    alpha = image.getchannel("A")
-    alpha = alpha.filter(ImageFilter.GaussianBlur(radius=radius))
-    image.putalpha(alpha)
-    return image
-
-
-def _encode_image(image, output_format: str) -> bytes:
-    out = BytesIO()
-    image.save(out, format=output_format.upper())
-    return out.getvalue()
-
-
-def _alpha_counts(image) -> tuple[int, int, int]:
-    pixels = image.load()
-    width, height = image.size
-    total = 0
-    transparent = 0
-    partial = 0
-
-    for y in range(height):
-        for x in range(width):
-            alpha = pixels[x, y][3]
-            total += 1
-            if alpha == 0:
-                transparent += 1
-            elif alpha < 255:
-                partial += 1
-
-    return total, transparent, partial
-
-
-def _sample_border_key(image, mode: str) -> Color:
-    width, height = image.size
-    pixels = image.load()
-    samples: list[Color] = []
-
-    if mode == "corners":
-        patch = max(1, min(width, height, 12))
-        boxes = [
-            (0, 0, patch, patch),
-            (width - patch, 0, width, patch),
-            (0, height - patch, patch, height),
-            (width - patch, height - patch, width, height),
-        ]
-        for left, top, right, bottom in boxes:
-            for y in range(top, bottom):
-                for x in range(left, right):
-                    red, green, blue = pixels[x, y][:3]
-                    samples.append((red, green, blue))
-    else:
-        band = max(1, min(width, height, 6))
-        step = max(1, min(width, height) // 256)
-        for x in range(0, width, step):
-            for y in range(band):
-                red, green, blue = pixels[x, y][:3]
-                samples.append((red, green, blue))
-                red, green, blue = pixels[x, height - 1 - y][:3]
-                samples.append((red, green, blue))
-        for y in range(0, height, step):
-            for x in range(band):
-                red, green, blue = pixels[x, y][:3]
-                samples.append((red, green, blue))
-                red, green, blue = pixels[width - 1 - x, y][:3]
-                samples.append((red, green, blue))
-
-    if not samples:
-        _die("Could not sample background key color from image border.")
-
-    return (
-        int(round(median(sample[0] for sample in samples))),
-        int(round(median(sample[1] for sample in samples))),
-        int(round(median(sample[2] for sample in samples))),
-    )
-
-
-def _remove_chroma_key(args: argparse.Namespace) -> None:
-    Image, _ = _load_pillow()
-    src = Path(args.input)
-    out = Path(args.out)
-
-    with Image.open(src) as image:
-        rgba = image.convert("RGBA")
-    key = (
-        _sample_border_key(rgba, args.auto_key)
-        if args.auto_key != "none"
-        else _parse_key_color(args.key_color)
-    )
-
-    transparent = _apply_alpha_to_image(
-        rgba,
-        key=key,
-        tolerance=args.tolerance,
-        spill_cleanup=args.spill_cleanup,
-        soft_matte=args.soft_matte,
-        transparent_threshold=args.transparent_threshold,
-        opaque_threshold=args.opaque_threshold,
-    )
-    rgba = _contract_alpha(rgba, args.edge_contract)
-    rgba = _apply_edge_feather(rgba, args.edge_feather)
-
-    total, transparent_after, partial_after = _alpha_counts(rgba)
-
-    out.parent.mkdir(parents=True, exist_ok=True)
-    output_format = "PNG" if out.suffix.lower() == ".png" else "WEBP"
-    out.write_bytes(_encode_image(rgba, output_format))
-
-    print(f"Wrote {out}")
-    print(f"Key color: #{key[0]:02x}{key[1]:02x}{key[2]:02x}")
-    print(f"Transparent pixels: {transparent_after}/{total}")
-    print(f"Partially transparent pixels: {partial_after}/{total}")
-    if transparent == 0:
-        print("Warning: no pixels matched the key color before feathering.", file=sys.stderr)
-
-
-def _build_parser() -> argparse.ArgumentParser:
-    parser = argparse.ArgumentParser(
-        description="Remove a solid chroma-key background and write an image with alpha."
-    )
-    parser.add_argument("--input", required=True, help="Input image path.")
-    parser.add_argument("--out", required=True, help="Output .png or .webp path.")
-    parser.add_argument(
-        "--key-color",
-        default="#00ff00",
-        help="Hex RGB key color to remove, for example #00ff00.",
-    )
-    parser.add_argument(
-        "--tolerance",
-        type=int,
-        default=12,
-        help="Hard-key per-channel tolerance for matching the key color, 0-255.",
-    )
-    parser.add_argument(
-        "--auto-key",
-        choices=["none", "corners", "border"],
-        default="none",
-        help="Sample the key color from image corners or border instead of --key-color.",
-    )
-    parser.add_argument(
-        "--soft-matte",
-        action="store_true",
-        help="Use a smooth alpha ramp between transparent and opaque thresholds.",
-    )
-    parser.add_argument(
-        "--transparent-threshold",
-        type=float,
-        default=12.0,
-        help="Soft-matte distance at or below which pixels become fully transparent.",
-    )
-    parser.add_argument(
-        "--opaque-threshold",
-        type=float,
-        default=96.0,
-        help="Soft-matte distance at or above which pixels become fully opaque.",
-    )
-    parser.add_argument(
-        "--edge-feather",
-        type=float,
-        default=0.0,
-        help="Optional alpha blur radius for softened edges, 0-64.",
-    )
-    parser.add_argument(
-        "--edge-contract",
-        type=int,
-        default=0,
-        help="Shrink the visible alpha matte by this many pixels before feathering.",
-    )
-    parser.add_argument(
-        "--spill-cleanup",
-        dest="spill_cleanup",
-        action="store_true",
-        help="Reduce obvious key-color spill on opaque pixels.",
-    )
-    parser.add_argument(
-        "--despill",
-        dest="spill_cleanup",
-        action="store_true",
-        help="Alias for --spill-cleanup; decontaminate key-color edge spill.",
-    )
-    parser.add_argument("--force", action="store_true", help="Overwrite an existing output file.")
-    return parser
-
-
-def main() -> None:
-    parser = _build_parser()
-    args = parser.parse_args()
-    _validate_args(args)
-    _remove_chroma_key(args)
-
-
-if __name__ == "__main__":
-    main()
diff --git a/skills/openai-docs/LICENSE.txt b/skills/openai-docs/LICENSE.txt
deleted file mode 100644
index 13e25df..0000000
--- a/skills/openai-docs/LICENSE.txt
+++ /dev/null
@@ -1,201 +0,0 @@
-Apache License
-Version 2.0, January 2004
-http://www.apache.org/licenses/
-
-TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-1. Definitions.
-
-   "License" shall mean the terms and conditions for use, reproduction,
-   and distribution as defined by Sections 1 through 9 of this document.
-
-   "Licensor" shall mean the copyright owner or entity authorized by
-   the copyright owner that is granting the License.
-
-   "Legal Entity" shall mean the union of the acting entity and all
-   other entities that control, are controlled by, or are under common
-   control with that entity. For the purposes of this definition,
-   "control" means (i) the power, direct or indirect, to cause the
-   direction or management of such entity, whether by contract or
-   otherwise, or (ii) ownership of fifty percent (50%) or more of the
-   outstanding shares, or (iii) beneficial ownership of such entity.
-
-   "You" (or "Your") shall mean an individual or Legal Entity
-   exercising permissions granted by this License.
-
-   "Source" form shall mean the preferred form for making modifications,
-   including but not limited to software source code, documentation
-   source, and configuration files.
-
-   "Object" form shall mean any form resulting from mechanical
-   transformation or translation of a Source form, including but
-   not limited to compiled object code, generated documentation,
-   and conversions to other media types.
-
-   "Work" shall mean the work of authorship, whether in Source or
-   Object form, made available under the License, as indicated by a
-   copyright notice that is included in or attached to the work
-   (an example is provided in the Appendix below).
-
-   "Derivative Works" shall mean any work, whether in Source or Object
-   form, that is based on (or derived from) the Work and for which the
-   editorial revisions, annotations, elaborations, or other modifications
-   represent, as a whole, an original work of authorship. For the purposes
-   of this License, Derivative Works shall not include works that remain
-   separable from, or merely link (or bind by name) to the interfaces of,
-   the Work and Derivative Works thereof.
-
-   "Contribution" shall mean any work of authorship, including
-   the original version of the Work and any modifications or additions
-   to that Work or Derivative Works thereof, that is intentionally
-   submitted to Licensor for inclusion in the Work by the copyright owner
-   or by an individual or Legal Entity authorized to submit on behalf of
-   the copyright owner. For the purposes of this definition, "submitted"
-   means any form of electronic, verbal, or written communication sent
-   to the Licensor or its representatives, including but not limited to
-   communication on electronic mailing lists, source code control systems,
-   and issue tracking systems that are managed by, or on behalf of, the
-   Licensor for the purpose of discussing and improving the Work, but
-   excluding communication that is conspicuously marked or otherwise
-   designated in writing by the copyright owner as "Not a Contribution."
-
-   "Contributor" shall mean Licensor and any individual or Legal Entity
-   on behalf of whom a Contribution has been received by Licensor and
-   subsequently incorporated within the Work.
-
-2. Grant of Copyright License. Subject to the terms and conditions of
-   this License, each Contributor hereby grants to You a perpetual,
-   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-   copyright license to reproduce, prepare Derivative Works of,
-   publicly display, publicly perform, sublicense, and distribute the
-   Work and such Derivative Works in Source or Object form.
-
-3. Grant of Patent License. Subject to the terms and conditions of
-   this License, each Contributor hereby grants to You a perpetual,
-   worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-   (except as stated in this section) patent license to make, have made,
-   use, offer to sell, sell, import, and otherwise transfer the Work,
-   where such license applies only to those patent claims licensable
-   by such Contributor that are necessarily infringed by their
-   Contribution(s) alone or by combination of their Contribution(s)
-   with the Work to which such Contribution(s) was submitted. If You
-   institute patent litigation against any entity (including a
-   cross-claim or counterclaim in a lawsuit) alleging that the Work
-   or a Contribution incorporated within the Work constitutes direct
-   or contributory patent infringement, then any patent licenses
-   granted to You under this License for that Work shall terminate
-   as of the date such litigation is filed.
-
-4. Redistribution. You may reproduce and distribute copies of the
-   Work or Derivative Works thereof in any medium, with or without
-   modifications, and in Source or Object form, provided that You
-   meet the following conditions:
-
-   (a) You must give any other recipients of the Work or
-       Derivative Works a copy of this License; and
-
-   (b) You must cause any modified files to carry prominent notices
-       stating that You changed the files; and
-
-   (c) You must retain, in the Source form of any Derivative Works
-       that You distribute, all copyright, patent, trademark, and
-       attribution notices from the Source form of the Work,
-       excluding those notices that do not pertain to any part of
-       the Derivative Works; and
-
-   (d) If the Work includes a "NOTICE" text file as part of its
-       distribution, then any Derivative Works that You distribute must
-       include a readable copy of the attribution notices contained
-       within such NOTICE file, excluding those notices that do not
-       pertain to any part of the Derivative Works, in at least one
-       of the following places: within a NOTICE text file distributed
-       as part of the Derivative Works; within the Source form or
-       documentation, if provided along with the Derivative Works; or,
-       within a display generated by the Derivative Works, if and
-       wherever such third-party notices normally appear. The contents
-       of the NOTICE file are for informational purposes only and
-       do not modify the License. You may add Your own attribution
-       notices within Derivative Works that You distribute, alongside
-       or as an addendum to the NOTICE text from the Work, provided
-       that such additional attribution notices cannot be construed
-       as modifying the License.
-
-   You may add Your own copyright statement to Your modifications and
-   may provide additional or different license terms and conditions
-   for use, reproduction, or distribution of Your modifications, or
-   for any such Derivative Works as a whole, provided Your use,
-   reproduction, and distribution of the Work otherwise complies with
-   the conditions stated in this License.
-
-5. Submission of Contributions. Unless You explicitly state otherwise,
-   any Contribution intentionally submitted for inclusion in the Work
-   by You to the Licensor shall be under the terms and conditions of
-   this License, without any additional terms or conditions.
-   Notwithstanding the above, nothing herein shall supersede or modify
-   the terms of any separate license agreement you may have executed
-   with Licensor regarding such Contributions.
-
-6. Trademarks. This License does not grant permission to use the trade
-   names, trademarks, service marks, or product names of the Licensor,
-   except as required for reasonable and customary use in describing the
-   origin of the Work and reproducing the content of the NOTICE file.
-
-7. Disclaimer of Warranty. Unless required by applicable law or
-   agreed to in writing, Licensor provides the Work (and each
-   Contributor provides its Contributions) on an "AS IS" BASIS,
-   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-   implied, including, without limitation, any warranties or conditions
-   of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-   PARTICULAR PURPOSE. You are solely responsible for determining the
-   appropriateness of using or redistributing the Work and assume any
-   risks associated with Your exercise of permissions under this License.
-
-8. Limitation of Liability. In no event and under no legal theory,
-   whether in tort (including negligence), contract, or otherwise,
-   unless required by applicable law (such as deliberate and grossly
-   negligent acts) or agreed to in writing, shall any Contributor be
-   liable to You for damages, including any direct, indirect, special,
-   incidental, or consequential damages of any character arising as a
-   result of this License or out of the use or inability to use the
-   Work (including but not limited to damages for loss of goodwill,
-   work stoppage, computer failure or malfunction, or any and all
-   other commercial damages or losses), even if such Contributor
-   has been advised of the possibility of such damages.
-
-9. Accepting Warranty or Additional Liability. While redistributing
-   the Work or Derivative Works thereof, You may choose to offer,
-   and charge a fee for, acceptance of support, warranty, indemnity,
-   or other liability obligations and/or rights consistent with this
-   License. However, in accepting such obligations, You may act only
-   on Your own behalf and on Your sole responsibility, not on behalf of
-   any other Contributor, and only if You agree to indemnify,
-   defend, and hold each Contributor harmless for any liability
-   incurred by, or claims asserted against, such Contributor by reason
-   of your accepting any such warranty or additional liability.
-
-END OF TERMS AND CONDITIONS
-
-APPENDIX: How to apply the Apache License to your work.
-
-   To apply the Apache License to your work, attach the following
-   boilerplate notice, with the fields enclosed by brackets "[]"
-   replaced with your own identifying information. (Don\'t include
-   the brackets!)  The text should be enclosed in the appropriate
-   comment syntax for the file format. We also recommend that a
-   file or class name and description of purpose be included on the
-   same "printed page" as the copyright notice for easier
-   identification within third-party archives.
-
-Copyright [yyyy] [name of copyright owner]
-
-Licensed under the Apache License, Version 2.0 (the "License");
-you may not use this file except in compliance with the License.
-You may obtain a copy of the License at
-
-    http://www.apache.org/licenses/LICENSE-2.0
-
-Unless required by applicable law or agreed to in writing, software
-distributed under the License is distributed on an "AS IS" BASIS,
-WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-See the License for the specific language governing permissions and
-limitations under the License.
diff --git a/skills/openai-docs/SKILL.md b/skills/openai-docs/SKILL.md
deleted file mode 100644
index 30526bd..0000000
--- a/skills/openai-docs/SKILL.md
+++ /dev/null
@@ -1,167 +0,0 @@
----
-name: "openai-docs"
-description: "Use when the user asks how to build with OpenAI products or APIs, asks about Codex itself or choosing Codex surfaces, needs up-to-date official documentation with citations, help choosing the latest model for a use case, or model upgrade and prompt-upgrade guidance; use OpenAI docs MCP tools for non-Codex docs questions, use the Codex manual helper first for broad Codex self-knowledge, and restrict fallback browsing to official OpenAI domains."
----
-
-
-# OpenAI Docs
-
-Provide authoritative, current guidance from OpenAI developer docs using the developers.openai.com MCP server. "Docs MCP" means `mcp__openaiDeveloperDocs__search_openai_docs` and `mcp__openaiDeveloperDocs__fetch_openai_doc`; for API reference, schema, parameter, or required-field questions, also use `mcp__openaiDeveloperDocs__get_openapi_spec` when available. Official-domain web search is fallback after those tools are unavailable or unhelpful. Broad Codex questions use the manual helper before Docs MCP. This skill also owns model selection, API model migration, and prompt-upgrade guidance.
-
-## API Key Setup
-
-For requests to build, run, configure, debug, or implement an API-backed app, script, CLI, generator, or tool, use `openai-platform-api-key` first when available. After that credential gate is resolved, return here for current docs as needed.
-
-Use this skill directly for docs-only questions, citations, model/API guidance, conceptual explanations, and examples that do not require building or running an API-backed artifact.
-
-## Workflow Configuration
-
-### Source Priority
-
-- For Codex self-knowledge, use the Codex source route below; it owns when to use the manual helper, Docs MCP, or bounded uncertainty.
-- For non-Codex OpenAI docs questions, use `mcp__openaiDeveloperDocs__search_openai_docs` to find the most relevant doc pages.
-- For non-Codex OpenAI docs questions, fetch the relevant page with `mcp__openaiDeveloperDocs__fetch_openai_doc` before answering. If search is noisy, run a narrower Docs MCP search; when any plausible official OpenAI docs URL is known or found, try fetching that URL through Docs MCP before relying on web-search content.
-- For API reference, schema, parameter, or required-field questions, use `mcp__openaiDeveloperDocs__get_openapi_spec` when available to verify the API shape alongside the relevant guide or reference page.
-- Use `mcp__openaiDeveloperDocs__list_openai_docs` only when you need to browse or discover non-Codex pages without a clear query.
-- For model-selection, "latest model", or default-model questions, fetch `https://developers.openai.com/api/docs/guides/latest-model.md` first. If that is unavailable, load `references/latest-model.md`.
-- For model upgrades or prompt upgrades, run `node scripts/resolve-latest-model-info.js` only when the target is latest/current/default or otherwise unspecified; otherwise preserve the explicitly requested target.
-- Preserve explicit target requests: if the user names a target model like "migrate to GPT-5.4", keep that requested target even if `latest-model.md` names a newer model. Mention newer guidance only as optional.
-- If current remote guidance is needed, fetch both the returned migration and prompting guide URLs directly. If direct fetch fails, use MCP/search fallback; if that also fails, use bundled fallback references and disclose the fallback.
-
-## OpenAI product snapshots
-
-1. Apps SDK: Build ChatGPT apps by providing a web component UI and an MCP server that exposes your app's tools to ChatGPT.
-2. Responses API: A unified endpoint designed for stateful, multimodal, tool-using interactions in agentic workflows.
-3. Chat Completions API: Generate a model response from a list of messages comprising a conversation.
-4. Codex: OpenAI's coding agent for software development that can write, understand, review, and debug code.
-5. gpt-oss: Open-weight OpenAI reasoning models (gpt-oss-120b and gpt-oss-20b) released under the Apache 2.0 license.
-6. Realtime API: Build low-latency, multimodal experiences including natural speech-to-speech conversations.
-7. Agents SDK: A toolkit for building agentic apps where a model can use tools and context, hand off to other agents, stream partial results, and keep a full trace.
-
-## Codex self-knowledge
-
-Use this path for questions about Codex itself: configuring, extending, operating, troubleshooting, local state, product surfaces, or where Codex behavior should live. A codebase merely mentioning a plugin, skill, hook, MCP server, browser, or automation is not enough. For generic software tasks, answer the software task directly; if asked whether Codex self-knowledge applies, answer that meta question briefly and continue the requested artifact.
-
-### Source Route
-
-The Codex manual is the first source for broad Codex synthesis. Treat the manual and Docs MCP as different lanes, not interchangeable official-doc sources. For published-user Codex product answers, the source route is complete: the manual, Docs MCP when this route calls for it, official OpenAI web fallback, and callable capabilities surfaced in the current session when the question is about that capability. Knowledge bases outside developers.openai.com are outside this route for public product answers.
-
-For broad Codex behavior, setup, customization, skills, plugins, MCP, hooks, `AGENTS.md`, automations, surfaces, local state, or system-map questions:
-
-1. Reuse a same-thread manual and outline path when it is still fresh.
-2. Otherwise run the skill-local helper first in normal writable sessions. Skip it without trying only when the session is explicitly read-only, shell execution is unavailable, or visible policy shows no allowed temp cache.
-3. By default, the helper chooses the first usable temp cache dir in this order: `$TMPDIR/openai-docs-cache`, `%TEMP%\openai-docs-cache`, `%TMP%\openai-docs-cache`, `/private/tmp/openai-docs-cache`, then `/tmp/openai-docs-cache`. Workspace-only write access is not enough for this temp cache.
-4. Run the helper directly unless you need to override the cache dir. The helper falls back to `curl` when native `fetch` is unavailable or when proxy env vars are present, so no shell-specific proxy prefix is required. Resolve `<skill-dir>` to this skill's actual directory; in copied local eval workdirs this is usually `.codex/skills/openai-docs`:
-
-```bash
-node <skill-dir>/scripts/fetch-codex-manual.mjs
-```
-
-If you need to override the cache dir, pass `--cache-dir <cache-dir>`. On Windows, the helper checks `%TEMP%` and `%TMP%` automatically; in PowerShell, `$env:TEMP\\openai-docs-cache` is a typical explicit override.
-
-Treat helper availability as established by explicit read-only/no-shell policy or an actual command result. A guessed sandbox or guessed helper failure is not enough to switch to Docs MCP or web lookup; after an actual helper command failure, continue to the narrowest official next source below.
-
-The helper verifies freshness, writes `codex-manual.md`, and emits `codex-manual.outline.md`. The outline maps source pages and headings to line ranges; use it to choose the relevant manual section, then read or search targeted manual sections for Codex product facts. Use the skill directory to locate and run the helper; after the helper succeeds, use the returned manual and outline paths as the search scope for Codex product facts and term coverage checks.
-
-Reuse the same-thread manual and outline paths for follow-up Codex questions. Refresh first when the manual was fetched more than about a day ago, the path is unusable, the path came from another thread or uncertain provenance, or likely-current information is missing and staleness is plausible.
-
-For questions about whether the manual is current enough to rely on now, run the helper when temp caching is allowed and base the answer on its returned status, manual path, and outline path.
-
-If the manual resolves a Codex claim, answer from it and stop expanding sources for that claim; continue the user's broader task if the docs lookup was only one dependency. Manual source pages and known anchors are enough citation support for manual-covered material.
-
-If the helper is skipped because the session is read-only, has no shell execution, or has no allowed temp cache, the next source is Docs MCP: call `mcp__openaiDeveloperDocs__search_openai_docs`, then `mcp__openaiDeveloperDocs__fetch_openai_doc` for a relevant hit before any web fallback.
-
-If a user names a Codex term or mode that a fresh manual does not use, search the manual for obvious adjacent concepts, then answer that the exact term is not documented and use the closest documented terminology. If the prompt asks how that term maps to Codex behavior, resolve the mapping from adjacent manual sections. If the exact term remains material or likely current after that manual pass, use one narrow Docs MCP search/fetch before bounded uncertainty; otherwise, the source lookup for that terminology or mapping claim is complete.
-
-Use the narrowest official next source only when the manual is unavailable, the helper fails, temp caching is not allowed, another material claim is missing or likely stale, or the user explicitly needs a page-specific citation. Prefer one specific Docs MCP search and, if it returns a clearly relevant page, one fetch; for unresolved Codex capability names, acronyms, scheduling terms, or exact error text, this Docs MCP step is the next source before web search. After the manual plus any permitted Docs MCP gap-fill, resolve remaining gaps as bounded uncertainty. Use official-domain web fallback only after that Docs MCP path is unavailable or unhelpful. If the claim is still not established, stop with bounded uncertainty. If official docs/manual conflict with a callable capability already surfaced in the current session, state the conflict and prefer verified current-session behavior for that environment.
-
-For undocumented or private-looking model slugs, product mode labels, entitlement labels, account access paths, or rollout names, answer from current public docs and bounded uncertainty. Those labels are not a reason to leave the public source route.
-
-For support-style diagnostics, prefer a layer-by-layer answer from the manual over provider-specific web lookups: installed/enabled plugin, bundled app or connector authorization, MCP setup, workspace/admin policy, restart or new-thread expectations, then support or feedback if still unresolved.
-
-If the source route still does not establish a claim, return bounded uncertainty or route to support, an admin, or product feedback instead of widening the investigation.
-
-For unresolved product terminology, answer from the manual plus the allowed official next source. If those sources do not establish the term, answer with bounded uncertainty from those sources.
-
-### Surface Map
-
-When Codex nouns or durable-instruction surfaces overlap, recommend the smallest surface that matches the scope:
-
-- Prompt or thread context -> one-off task constraints.
-- `AGENTS.md` -> durable repo conventions, commands, verification steps, and review expectations; closer nested files apply under their subtree.
-- Project `.codex/config.toml` -> trusted-repo Codex settings such as sandbox, MCP, hooks, model, or reasoning defaults.
-- Global config or global guidance -> personal defaults across repos.
-- Skill -> reusable task workflow with references or scripts.
-- Plugin -> installable bundle with skills plus commands, tools, MCP config, hooks, assets, apps, or marketplace metadata.
-- MCP server or app connector -> live external data/actions or authorized private app/workspace data. Use connectors for private Google Docs, Calendar, Slack, GitHub, Notion, and similar data instead of web search or model memory.
-- Automation -> scheduled checks, reminders, monitors, or follow-up work; use a thread heartbeat when continuity in an existing thread matters.
-- Hook -> lifecycle enforcement around tool calls, commands, or file edits.
-
-Split mixed-scope requests instead of forcing one answer. Example: "always do X, but only for this PR" defaults to prompt/thread context for the current run; use `AGENTS.md` or project config only if it should persist, hooks only for mechanical enforcement, and automations only for scheduled or follow-up work.
-
-Use this quick product map when needed: CLI is terminal-first local repo work; IDE extension is editor-attached coding; Codex app is desktop planning, review, and interactive work; cloud/web is hosted parallel/offloaded work; Browser Use/in-app browser is Codex-controlled web testing; Chrome extension uses the user's Chrome profile; Computer Use controls desktop apps and OS UI. Keep `config.toml` defaults, `requirements.toml` constraints, and managed/admin policy separate.
-
-### Boundaries And Output
-
-- API key auth does not imply ChatGPT, cloud task, or connector access. For plugin/app/auth failures, check bundle availability, plugin installed/enabled state, connector/app authorization, MCP setup, restart/refresh expectations, workspace policy, and per-surface availability before answering.
-- Sandbox or network denials need scoped escalation with a clear justification. Destructive commands, writes outside the workspace, or broad access changes require explicit approval.
-- Memory can provide user preference or context, but explicit prompt instructions win and memory is not a source for current external facts.
-- For affirmative surface-selection answers, use this shape: recommendation, why, what to avoid, and the manual/source evidence used.
-- When page-specific Codex citations are actually needed, these anchors often fit: `concepts/customization#agents-guidance` for `AGENTS.md`, `concepts/customization#skills` for skills, `plugins/build#plugin-structure` for plugins, `concepts/customization#mcp` for MCP, `config-advanced#hooks` for hooks, `app/automations#thread-automations` for thread automations, and `config-reference#configtoml` for config.
-
-## If MCP server is missing
-
-If MCP tools fail or no OpenAI docs resources are available:
-
-1. Run the install command yourself: `codex mcp add openaiDeveloperDocs --url https://developers.openai.com/mcp`
-2. If it fails due to permissions/sandboxing, immediately retry the same command with escalated permissions and include a 1-sentence justification for approval.
-3. Ask the user to run the install command only if the escalated attempt fails.
-4. Ask the user to restart Codex.
-5. Re-run the doc search/fetch after restart.
-
-## Workflow
-
-1. Clarify whether the request is general docs lookup, model selection, a model-string upgrade, prompt-upgrade guidance, or broader API/provider migration.
-2. For Codex self-knowledge requests, follow the Codex self-knowledge source procedure above.
-3. For model-selection or upgrade requests, prefer current remote docs over bundled references when the user asks for latest/current/default guidance.
-   - Fetch `https://developers.openai.com/api/docs/guides/latest-model.md`.
-   - Find the latest model ID and explicit migration or prompt-guidance links.
-   - Prefer explicit links from the latest-model page over derived URLs.
-   - For explicit named-model requests, preserve the requested model target. Mention newer remote guidance only as optional.
-   - For dynamic latest/current/default upgrades, run `node scripts/resolve-latest-model-info.js`, then fetch both returned guide URLs directly when possible.
-   - If direct guide fetch fails, use the developer-docs MCP tools or official OpenAI-domain search to find the same guide content.
-   - If remote docs are unavailable, use bundled fallback references and say that fallback guidance was used.
-4. For model upgrades, keep changes narrow: update active OpenAI API model defaults and directly related prompts only when safe.
-5. Leave historical docs, examples, eval baselines, fixtures, provider comparisons, provider registries, pricing tables, alias defaults, low-cost fallback paths, and ambiguous older model usage unchanged unless the user explicitly asks to upgrade them.
-6. Keep SDK, tooling, IDE, plugin, shell, auth, and provider-environment migrations out of a model-and-prompt upgrade unless the user explicitly asks for them.
-7. If an upgrade needs API-surface changes, schema rewiring, tool-handler changes, or implementation work beyond a literal model-string replacement and prompt edits, report it as blocked or confirmation-needed.
-8. For general docs lookup, search docs with a precise query, fetch the best page and exact section needed, and answer with concise citations.
-
-## Reference map
-
-Read only what you need:
-
-- `https://developers.openai.com/api/docs/guides/latest-model.md` -> current model-selection and "best/latest/current model" questions.
-- `scripts/fetch-codex-manual.mjs` -> current Codex manual fetch, verification, local temp cache, and outline generation.
-- `https://developers.openai.com/codex/codex-manual.md` -> current Codex self-knowledge synthesis, including setup, customization, skills, plugins, MCP, hooks, `AGENTS.md`, automations, and surface behavior; normally access it through the helper path and targeted file reads when temp caching is available.
-- `references/latest-model.md` -> bundled fallback for model-selection and "best/latest/current model" questions.
-- `references/upgrade-guide.md` -> bundled fallback for model upgrade and upgrade-planning requests.
-- `references/prompting-guide.md` -> bundled fallback for prompt rewrites and prompt-behavior upgrades.
-
-## Quality rules
-
-- Treat OpenAI docs as the source of truth; avoid speculation.
-- For Codex self-knowledge, follow the source route above instead of relying on remembered behavior.
-- Keep migration changes narrow and behavior-preserving.
-- Prefer prompt-only upgrades when possible.
-- Avoid inventing pricing, availability, parameters, API changes, or breaking changes.
-- Keep quotes short and within policy limits; prefer paraphrase with citations.
-- If multiple pages differ, call out the difference and cite both.
-- If official docs and verified callable current-session behavior disagree, state the conflict before making broad claims or edits.
-- If docs do not cover the user’s need, say so and offer next steps.
-
-## Tooling notes
-
-- Use MCP doc tools before web search for OpenAI-related markdown docs. The Codex manual flow is the exception: follow the Codex self-knowledge source procedure for broad Codex synthesis.
-- If the MCP server is installed but returns no meaningful results, then use web search as a fallback.
-- When falling back to web search, restrict to official OpenAI domains (developers.openai.com, platform.openai.com) and cite sources.
diff --git a/skills/openai-docs/agents/openai.yaml b/skills/openai-docs/agents/openai.yaml
deleted file mode 100644
index 8bbf03c..0000000
--- a/skills/openai-docs/agents/openai.yaml
+++ /dev/null
@@ -1,14 +0,0 @@
-interface:
-  display_name: "OpenAI Docs"
-  short_description: "Reference OpenAI docs, Codex self-knowledge, and model migration guidance"
-  icon_small: "./assets/openai-small.svg"
-  icon_large: "./assets/openai.png"
-  default_prompt: "Use OpenAI Docs for official docs lookup, questions about Codex itself or Codex surfaces, model selection, model migration, and prompt-upgrade work."
-
-dependencies:
-  tools:
-    - type: "mcp"
-      value: "openaiDeveloperDocs"
-      description: "OpenAI Developer Docs MCP server"
-      transport: "streamable_http"
-      url: "https://developers.openai.com/mcp"
diff --git a/skills/openai-docs/assets/openai-small.svg b/skills/openai-docs/assets/openai-small.svg
deleted file mode 100644
index 1d075dc..0000000
--- a/skills/openai-docs/assets/openai-small.svg
+++ /dev/null
@@ -1,3 +0,0 @@
-<svg xmlns="http://www.w3.org/2000/svg" width="14" height="14" fill="currentColor" viewBox="0 0 14 14">
-  <path d="M10.931 3.34a.112.112 0 0 0-.069-.104l-.038-.007c-1.537.05-2.45.318-3.714 1.002v6.683c.48-.248.936-.44 1.414-.58.695-.203 1.417-.292 2.303-.305l.038-.008a.113.113 0 0 0 .066-.104V3.341ZM2.363 9.919c0 .064.051.11.105.111l.33.008c1.162.046 2.042.243 2.975.662-.403-.585-1.008-1.075-1.654-1.292a.991.991 0 0 1-.674-.941v-5.14a6.36 6.36 0 0 0-.59-.076l-.37-.02a.115.115 0 0 0-.122.111v6.577Zm9.455-.001a.998.998 0 0 1-.877.992l-.101.007c-.832.012-1.47.095-2.066.27-.599.174-1.176.448-1.883.863a.444.444 0 0 1-.449 0c-1.299-.763-2.229-1.07-3.689-1.125l-.299-.008a.997.997 0 0 1-.977-.998V3.342c0-.573.478-1.017 1.038-.999l.417.023c.188.015.35.037.513.062v-.754c0-.708.749-1.244 1.429-.903.984.492 1.836 1.449 2.15 2.505 1.216-.617 2.222-.884 3.771-.934l.105.003a.998.998 0 0 1 .918.996v6.576ZM4.332 8.466c0 .049.03.087.07.1l.24.091a4.319 4.319 0 0 1 1.581 1.176V3.721c-.164-.803-.799-1.617-1.584-2.07l-.162-.088c-.025-.012-.054-.013-.088.009a.12.12 0 0 0-.057.102v6.792Z"/>
-</svg>
diff --git a/skills/openai-docs/assets/openai.png b/skills/openai-docs/assets/openai.png
deleted file mode 100644
index e9b9eb80cd90ccdfc7e276b07f4046aa9c9d1887..0000000000000000000000000000000000000000
GIT binary patch
literal 0
HcmV?d00001

literal 1429
zcmbW1X)qfI7>2WsZI&%Dh?dljBaOCEMMKw7ZA6J9aYbCMqq=TtRa|RzO_Vl5(Tby3
z>WGvo5$jf6$Dnm3k*y$7_qxxBm9_eJr$2Uf=6%0+=J|ep?|hH#F_x#Ll%)Uwz-hD<
z%JC%qJ{u@@GLIjMi30$Vo@mrf=a?63lOMvlevr3YeHmW9u)%SZM{6T>Dj>OG-NM(s
zxeg66h^R2ccnS@hB9Zx5zfp_$#T*uKL&buLGL{${$dr@`q~IC?DdR&0Yq0d<K8P63
zoq-ia(lt|gi+>z!?aXm2s}%cPO10FrRE?G-k0{=7K$_&kI=~e$pjYgzE8vVY;O<xd
zh7-$JISb@wBgjW#OZ1&1O&;m2U9KfMN=UULqKFQf`-x@tWG&~CiRI{9?_3=;#l~lR
zK#z)MO6IJRX|$k#ma65P3XlGZ>>46Hm7aP^&cE!{sKcdEAVNXg4w0>eo^HyTDRAUX
z1q<1l*$z0vv6jqHvTYK7N`0u5;6yAk8Hu1q<Wy{rILx>vr9>?%KFBwx(h6KK`f%%#
zP9L?T7T}-#%27<caJiY)8CM_rxL@n9YJDZNu(J9ejFfg_<ecNPs>~gRX#U;>m%`xu
zRx(>rAYhNw6pH4Us6k_8+@3ALmhG5zSAFOj7mD2H0~sQ=I4$p^(D+2UDcut(d(Zp!
z$J7P4kw8<WXpL^om{teTpzUG?*SB;E6jJ+JHsPQr$qRnXhSVG{9g$TC8FX`Rpn&7+
z49+fmGzlrEzf8G|kl-q=EvOW>gyQccMw&gi*xV|;t$}UYUBXtS6J`v8J*FsDliZ(~
z<@+Da;4XO8{*25XsWoe!b=2mY`PSnj0Z7~UQ*|-j*hV&a!&>HP&o)P@{myW|*myuJ
zPL74L-`HWji(Yv(m?iF4r#zM!p1!g6I7dIXic~LBBSC+v<&e%2x^h<IJiw&mW8Z#0
z{_2-+{>38vZ+K%YzU=I56m0T>JWomcJPn6TrJifjM(Wx@?~P{4<?FFY@=pSTUd~o}
zZK;*aN^s}j1WEV4qnQKwZ1F*R%O8oLP)$oaCzXCD=G9&pHSm0{G{lAl`D<rbJ!ccF
z85QDL+)<5fuOZ(l(?EyaR!ECYYzqjdxCOQ|wYt!U3M5cglY$y?<CzeXXL_6rDorOB
zaCnI6Jd%^$mGOf;e;0TE^1W_)bg_09Rn>%}rrY5}h#pwawmf9bv&aQiDux**Y3-i1
zqTMnW8G{DfFvi;3E(l}R$dnUJ(<_$+W=og_k=xR0MMrfK2)TPiox{1oBNwcL>8#m#
z2$uC?K_J`ikEKh0r?2|0pJAYIrydWjz4!V9$3;~TX9@!$D);A=7}tjnb%dew^(*jT
z!cczU%3j<f{C>Ofc-pF{Xw&l)zxDY>N0@3`IgX*{{x>pcJ4^R^O&K$8J*lYk{{3ft
z3HXDsfQ`mNPS^OYH*TNCxEWY;hF<R+^scY<FnNH(oQP8l2?g@@NIEiwbCYYbI|48j
z8ozE+o#IU-lr!8uz1JY-%2OJSVuk1og^-S*(3~~~GPq`>@zMxCh3axXGT}NR5^Abn
zdCpco+Y1il&A)g0(10*jT094hy+6Dx>_H|(eSZ_d9(a-0S=ek~_H;O<t9ybI)3JKg
zbOx4(h)2Y)5Ec$=Bnn#aUqfE~t^>Zvn>M@rc@Zsm>2rYBSEw^m9;T>t);vhumBCh|
zt36@MO*|h0+t^`bH+9yn%$0(3`IN-}RNc3{YL?YaM@F{M$-4!hEikCpNbjV70IV&k
AfB*mh

diff --git a/skills/openai-docs/references/latest-model.md b/skills/openai-docs/references/latest-model.md
deleted file mode 100644
index a1ffbfb..0000000
--- a/skills/openai-docs/references/latest-model.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# Latest model guide
-
-This file is a curated helper. Every recommendation here must be verified against current OpenAI docs before it is repeated to a user.
-
-## Current model map
-
-| Model ID | Use for |
-| --- | --- |
-| `gpt-5.5` | Latest/default text and reasoning model for most new apps, including coding and tool-heavy workflows |
-| `gpt-5.5-pro` | Maximum reasoning or quality when latency and cost matter less |
-| `gpt-5.4` | Previous default text and reasoning model; use for existing GPT-5.4 integrations |
-| `gpt-5.4-mini` | Lower-cost testing and lighter production workflows |
-| `gpt-5.4-nano` | High-throughput simple tasks and classification |
-| `gpt-5.5` | Explicit no-reasoning text path via `reasoning.effort: none` |
-| `gpt-4.1-mini` | Cheaper no-reasoning text |
-| `gpt-4.1-nano` | Fastest and cheapest no-reasoning text |
-| `gpt-5.3-codex` | Agentic coding, code editing, and tool-heavy coding workflows |
-| `gpt-5.1-codex-mini` | Cheaper coding workflows |
-| `gpt-image-2` | Best image generation and edit quality |
-| `gpt-image-1.5` | Less expensive image generation and edit quality |
-| `gpt-image-1-mini` | Cost-optimized image generation |
-| `gpt-4o-mini-tts` | Text-to-speech |
-| `gpt-4o-mini-transcribe` | Speech-to-text, fast and cost-efficient |
-| `gpt-realtime-1.5` | Realtime voice and multimodal sessions |
-| `gpt-realtime-mini` | Cheaper realtime sessions |
-| `gpt-audio` | Chat Completions audio input and output |
-| `gpt-audio-mini` | Cheaper Chat Completions audio workflows |
-| `sora-2` | Faster iteration and draft video generation |
-| `sora-2-pro` | Higher-quality production video |
-| `omni-moderation-latest` | Text and image moderation |
-| `text-embedding-3-large` | Higher-quality retrieval embeddings; default in this skill because no best-specific row exists |
-| `text-embedding-3-small` | Lower-cost embeddings |
-
-## Maintenance notes
-
-- This file will drift unless it is periodically re-verified against current OpenAI docs.
-- If this file conflicts with current docs, the docs win.
diff --git a/skills/openai-docs/references/prompting-guide.md b/skills/openai-docs/references/prompting-guide.md
deleted file mode 100644
index 0d9273c..0000000
--- a/skills/openai-docs/references/prompting-guide.md
+++ /dev/null
@@ -1,244 +0,0 @@
-GPT-5.5 works best when prompts define the outcome and leave room for the model to choose an efficient solution path. Compared with earlier models, you can often use shorter, more outcome-oriented prompts: describe what good looks like, what constraints matter, what evidence is available, and what the final answer should contain.
-
-Avoid carrying over every instruction from an older prompt stack. Legacy prompts often over-specify the process because earlier models needed more help staying on track. With GPT-5.5, that can add noise, narrow the model's search space, or lead to overly mechanical answers.
-
-For more detail on GPT-5.5 behavior changes, start with the [Using GPT-5.5 guide](/api/docs/guides/latest-model). This guide focuses on prompt changes that follow from those behavior changes.
-
-The patterns here are starting points. Adapt them to your product surface, tools, evals, and user experience goals.
-
-## Personality and behavior
-
-GPT-5.5's default style is efficient, direct, and task-oriented. This is useful for production systems: responses stay focused, behavior is easier to steer, and the model avoids unnecessary conversational padding.
-
-For customer-facing assistants, support workflows, coaching experiences, and other conversational products, define both personality and collaboration style.
-
-- **Personality** controls how the assistant sounds: tone, warmth, directness, formality, humor, empathy, and level of polish.
-- **Collaboration style** controls how the assistant works: when it asks questions, when it makes assumptions, how proactive it should be, how much context it gives, when it checks work, and how it handles uncertainty or risk.
-
-Keep both short. Personality instructions should shape the user experience. Collaboration instructions should shape task behavior. Neither should replace clear goals, success criteria, tool rules, or stopping conditions.
-
-Example personality block for a steady task-focused assistant:
-
-```text
-# Personality
-You are a capable collaborator: approachable, steady, and direct. Assume the user is competent and acting in good faith, and respond with patience, respect, and practical helpfulness.
-
-Prefer making progress over stopping for clarification when the request is already clear enough to attempt. Use context and reasonable assumptions to move forward. Ask for clarification only when the missing information would materially change the answer or create meaningful risk, and keep any question narrow.
-
-Stay concise without becoming curt. Give enough context for the user to understand and trust the answer, then stop. Use examples, comparisons, or simple analogies when they make the point easier to grasp. When correcting the user or disagreeing, be candid but constructive. When an error is pointed out, acknowledge it plainly and focus on fixing it.
-
-Match the user's tone within professional bounds. Avoid emojis and profanity by default, unless the user explicitly asks for that style or has clearly established it as appropriate for the conversation.
-```
-
-Example personality block for an expressive collaborative assistant:
-
-```text
-# Personality
-Adopt a vivid conversational presence: intelligent, curious, playful when appropriate, and attentive to the user's thinking. Ask good questions when the problem is blurry, then become decisive once there is enough context.
-
-Be warm, collaborative, and polished. Conversation should feel easy and alive, but not chatty for its own sake. Offer a real point of view rather than merely mirroring the user, while staying responsive to their goals and constraints.
-
-Be thoughtful and grounded when the task calls for synthesis or advice. State a clear recommendation when you have enough context, explain important tradeoffs, and name uncertainty without becoming evasive.
-```
-
-For more expressive products, add warmth, curiosity, humor, or point of view explicitly, but keep the block short. Use personality to shape the experience, not to compensate for unclear goals or missing task instructions.
-
-## Improve time to first visible token with a preamble
-
-In streaming applications, users notice how long it takes before the first visible response appears. GPT-5.5 may spend time reasoning, planning, or preparing tool calls before emitting visible text.
-
-For longer or tool-heavy tasks, prompt the model to start with a short preamble: a brief visible update that acknowledges the request and states the first step. This can improve perceived responsiveness without changing the underlying task.
-
-Use this pattern when the task may take more than one step, require tool calls, or involve a long-running agent workflow.
-
-```text
-Before any tool calls for a multi-step task, send a short user-visible update that acknowledges the request and states the first step. Keep it to one or two sentences.
-```
-
-For coding agents that expose separate message phases, you can be more explicit:
-
-```text
-You must always start with an intermediary update before any content in the analysis channel if the task will require calling tools. The user update should acknowledge the request and explain your first step.
-```
-
-## Outcome-first prompts and stopping conditions
-
-GPT-5.5 is strongest when the prompt defines the target outcome, success criteria, constraints, and available context, then lets the model choose the path.
-
-For many tasks, describe the destination rather than every step. This gives the model room to choose the right search, tool, or reasoning strategy for the task.
-
-Prefer this:
-
-```text
-Resolve the customer's issue end to end.
-
-Success means:
-- the eligibility decision is made from the available policy and account data
-- any allowed action is completed before responding
-- the final answer includes completed_actions, customer_message, and blockers
-- if evidence is missing, ask for the smallest missing field
-```
-
-**Avoid unnecessary absolute rules.** Older prompts often use strict instructions like `ALWAYS`, `NEVER`, `must`, and `only` to control model behavior. Use those words for true invariants, such as safety rules, required output fields, or actions that should never happen. For judgment calls, such as when to search, ask for clarification, use a tool, or keep iterating, prefer decision rules instead.
-
-Avoid this style of instruction unless every step is truly required:
-
-```text
-First inspect A, then inspect B, then compare every field, then think through
-all possible exceptions, then decide which tool to call, then call the tool,
-then explain the entire process to the user.
-```
-
-Add explicit stopping conditions:
-
-```text
-Resolve the user query in the fewest useful tool loops, but do not let loop minimization outrank correctness, accessible fallback evidence, calculations, or required citation tags for factual claims.
-
-After each result, ask: "Can I answer the user's core request now with useful evidence and citations for the factual claims?" If yes, answer.
-```
-
-Define missing-evidence behavior:
-
-```text
-Use the minimum evidence sufficient to answer correctly, cite it precisely, then stop.
-```
-
-## Formatting
-
-GPT-5.5 is highly steerable on output format and structure. Use that control when it improves comprehension or product fit.
-
-Set `text.verbosity`, describe the expected output shape, and reserve heavier structure for cases where it improves comprehension or your product UI needs a stable artifact. The API default for `text.verbosity` is `medium`; use `low` when you prefer shorter, more concise responses.
-
-Plain conversational formatting:
-
-```text
-Let formatting serve comprehension. Use plain paragraphs as the default format for normal conversation, explanations, reports, documentation, and technical writeups. Keep the presentation clean and readable without making the structure feel heavier than the content.
-
-Use headers, bold text, bullets, and numbered lists sparingly. Reach for them when the user requests them, when the answer needs clear comparison or ranking, or when the information would be harder to scan as prose. Otherwise, favor short paragraphs and natural transitions.
-
-Respect formatting preferences from the user. If they ask for a terse answer, minimal formatting, no bullets, no headers, or a specific structure, follow that preference unless there is a strong reason not to.
-```
-
-Add explicit audience and length guidance:
-
-```text
-Write for a senior business audience. Keep the answer under 400 words. Use short paragraphs and only include bullets when they improve scannability. Prioritize the conclusion first, then the reasoning, then caveats.
-```
-
-For editing, rewriting, summaries, or customer-facing messages, tell the model what to preserve before asking it to improve style. This pattern is useful when you want polish without expansion.
-
-```text
-Preserve the requested artifact, length, structure, and genre first. Quietly improve clarity, flow, and correctness. Do not add new claims, extra sections, or a more promotional tone unless explicitly requested.
-```
-
-## Grounding, citations, and retrieval budgets
-
-For grounded answers, citation behavior should be part of the prompt. Define what needs support, what counts as enough evidence, and how the model should behave when evidence is missing. Absence of evidence shouldn't automatically become a factual "no." For more details and examples, see the [citation formatting guide](/api/docs/guides/citation-formatting).
-
-### Add an explicit retrieval budget
-
-Retrieval budgets are stopping rules for search. They tell the model when enough evidence is enough.
-
-```text
-For ordinary Q&A, start with one broad search using short, discriminative keywords. If the top results contain enough citable support for the core request, answer from those results instead of searching again.
-
-Make another retrieval call only when:
-- The top results do not answer the core question.
-- A required fact, parameter, owner, date, ID, or source is missing.
-- The user asked for exhaustive coverage, a comparison, or a comprehensive list.
-- A specific document, URL, email, meeting, record, or code artifact must be read.
-- The answer would otherwise contain an important unsupported factual claim.
-
-Do not search again to improve phrasing, add examples, cite nonessential details, or support wording that can safely be made more generic.
-```
-
-## Creative drafting guardrails
-
-For drafting tasks, tell the model which claims must come from sources and which parts may be creatively written. This is especially important for slides, launch copy, customer summaries, talk tracks, leadership blurbs, and narrative framing.
-
-```text
-For creative or generative requests such as slides, leadership blurbs, outbound copy, summaries for sharing, talk tracks, or narrative framing, distinguish source-backed facts from creative wording.
-
-- Use retrieved or provided facts for concrete product, customer, metric, roadmap, date, capability, and competitive claims, and cite those claims.
-- Do not invent specific names, first-party data claims, metrics, roadmap status, customer outcomes, or product capabilities to make the draft sound stronger.
-- If there is little or no citable support, write a useful generic draft with placeholders or clearly labeled assumptions rather than unsupported specifics.
-```
-
-## Frontend engineering and visual taste
-
-For frontend work, refer to the [example instructions](/api/docs/guides/frontend-prompt) for practical ways to steer UI quality. They cover product and user context, design-system alignment, first-screen usability, familiar controls, expected states, responsive behavior, and common generated-UI defaults to avoid, such as generic heroes, nested cards, decorative gradients, visible instructional text, and broken layouts.
-
-## Prompt the model to check its work
-
-Give GPT-5.5 access to tools that let it check outputs when validation is possible.
-
-For coding agents, ask for concrete validation commands:
-
-```text
-After making changes, run the most relevant validation available:
-- targeted unit tests for changed behavior
-- type checks or lint checks when applicable
-- build checks for affected packages
-- a minimal smoke test when full validation is too expensive
-
-If validation cannot be run, explain why and describe the next best check.
-```
-
-For visual artifacts, ask for inspection after rendering:
-
-```text
-Render the artifact before finalizing. Inspect the rendered output for layout, clipping, spacing, missing content, and visual consistency. Revise until the rendered output matches the requirements.
-```
-
-For engineering and planning tasks, make implementation plans traceable:
-
-```text
-For implementation plans, include:
-- requirements and where each is addressed
-- named resources, files, APIs, or systems involved
-- state transitions or data flow where relevant
-- validation commands or checks
-- failure behavior
-- privacy and security considerations
-- open questions that materially affect implementation
-```
-
-## Phase parameter
-
-Starting with GPT-5.4, long-running or tool-heavy Responses workflows can use assistant-item `phase` values to distinguish intermediate updates from final answers. GPT-5.5 uses the same pattern.
-
-If you use `previous_response_id`, the API preserves prior assistant state automatically. If your application manually replays assistant output items into the next request, preserve each original `phase` value and pass it back unchanged. This matters most when a response includes preambles, repeated tool calls, or a final answer after intermediate assistant updates.
-
-```text
-If manually replaying assistant items:
-- Preserve assistant `phase` values exactly.
-- Use `phase: "commentary"` for intermediate user-visible updates.
-- Use `phase: "final_answer"` for the completed answer.
-- Do not add `phase` to user messages.
-```
-
-## Suggested prompt structure
-
-Use this structure as a starting point for complex prompts. Keep each section short. Add detail only where it changes behavior.
-
-```text
-Role: [1-2 sentences defining the model's function, context, and job]
-
-# Personality
-[tone, demeanor, and collaboration style]
-
-# Goal
-[user-visible outcome]
-
-# Success criteria
-[what must be true before the final answer]
-
-# Constraints
-[policy, safety, business, evidence, and side-effect limits]
-
-# Output
-[sections, length, and tone]
-
-# Stop rules
-[when to retry, fallback, abstain, ask, or stop]
-```
diff --git a/skills/openai-docs/references/upgrade-guide.md b/skills/openai-docs/references/upgrade-guide.md
deleted file mode 100644
index b29f137..0000000
--- a/skills/openai-docs/references/upgrade-guide.md
+++ /dev/null
@@ -1,181 +0,0 @@
-# Upgrading to GPT-5.5
-
-Use this guide when the user explicitly asks to upgrade an existing integration to GPT-5.5. Pair it with current OpenAI docs lookups. The default target string is `gpt-5.5`.
-
-## Freshness check
-
-Before applying this bundled guide for a latest/current/default model upgrade, run `node scripts/resolve-latest-model-info.js` from the OpenAI Docs skill directory.
-
-- If the command returns `modelSlug: "gpt-5p5"`, continue with this bundled guide and use `references/prompting-guide.md` when prompt updates are needed.
-- If the command returns a different `modelSlug`, fetch both the returned `migrationGuideUrl` and `promptingGuideUrl` and use them as the current source of truth instead of the bundled references.
-- If the command fails, metadata is missing, or either remote guide cannot be fetched, continue with bundled fallback references and say the remote freshness check was unavailable.
-- If the user explicitly named a target model, preserve that target and use current docs only to check compatibility or caveats.
-
-## Upgrade posture
-
-Upgrade with the narrowest safe change set:
-
-- replace the model string first
-- update only the prompts that are directly tied to that model usage
-- do not automatically upgrade older or ambiguous model usages that may be intentionally pinned, such as historical docs, examples, tests, eval baselines, comparison code, or low-cost fallback/routing paths. Unless the user explicitly asks to upgrade all model usage, leave those sites unchanged and list them as confirmation-needed
-- prefer prompt-only upgrades when possible
-- if the upgrade would require API-surface changes, parameter rewrites, tool rewiring, provider migration, or broader code edits, mark it as blocked instead of stretching the scope
-
-## Upgrade workflow
-
-1. Inventory current model usage.
-   - Search for model strings, client calls, and prompt-bearing files.
-   - Include inline prompts, prompt templates, YAML or JSON configs, Markdown docs, and saved prompts when they are clearly tied to a model usage site.
-2. Pair each model usage with its prompt surface.
-   - Prefer the closest prompt surface first: inline system or developer text, then adjacent prompt files, then shared templates.
-   - If you cannot confidently tie a prompt to the model usage, say so instead of guessing.
-3. Classify the source model family.
-   - Common buckets: GPT-5.4, GPT-5.3-Codex or GPT-5.2-Codex, earlier GPT-5.x, GPT-4o or GPT-4.1, reasoning models such as o1 or o3 or o4-mini, third-party model, or mixed and unclear.
-4. Decide the upgrade class.
-   - `model string only`
-   - `model string + light prompt rewrite`
-   - `blocked without code changes`
-5. Run the compatibility gate.
-   - Check whether the current integration can accept `gpt-5.5` without API-surface changes or implementation changes.
-   - Check whether structured outputs, tool schemas, function names, and downstream parsers can remain unchanged.
-   - For long-running Responses or tool-heavy agents, check whether `phase` is already preserved or round-tripped when the host replays assistant items or uses preambles.
-   - If compatibility depends on code changes, return `blocked`.
-   - If compatibility is unclear, return `unknown` rather than improvising.
-6. Apply the upgrade when it is in scope.
-   - Default replacement string: `gpt-5.5`.
-   - Keep the intervention small and behavior-preserving.
-   - Start from the current reasoning effort when it is visible unless there is a measured reason to change it.
-   - For in-scope changes, update the model string and directly related prompts.
-   - For blocked or unknown changes, do not edit; report the blocker or uncertainty.
-7. Summarize the result.
-   - `Current model usage`
-   - `Model-string updates`
-   - `Reasoning-effort handling`
-   - `Prompt updates`
-   - `Structured output and formatting assessment`
-   - `Tool-use assessment` when the flow uses tools, retrieval, or terminal actions
-   - `Phase assessment` when the flow is long-running, replayed, or tool-heavy
-   - `Compatibility check`
-   - `Validation performed`
-
-Output rule:
-
-- For each usage site, state the starting reasoning-effort recommendation.
-- If the repo exposes the current reasoning setting, recommend preserving it first unless current OpenAI docs say otherwise.
-- If the repo does not expose the current setting, recommend not adding one unless current OpenAI docs require it.
-
-## Upgrade outcomes
-
-### `model string only`
-
-Choose this when:
-
-- the source model is GPT-5.4
-- the existing prompts are already short, explicit, and task-bounded
-- the workflow does not rely on strict output formats, tool-call behavior, batch completeness, or long-horizon execution that should be validated after the upgrade
-- there are no obvious compatibility blockers
-
-Default action:
-
-- replace the model string with `gpt-5.5`
-- preserve the current reasoning effort
-- keep prompts unchanged
-- validate behavior with existing tests, realistic spot checks, or an existing eval suite when one is already available
-
-### `model string + light prompt rewrite`
-
-Choose this when:
-
-- the task needs stronger completeness, citation discipline, verification, or dependency handling
-- the upgraded model becomes too verbose, too dense, or hard to scan unless formatting is constrained
-- the workflow has strict output shape requirements and lacks an explicit format contract, schema, or parser validation
-- the workflow is research-heavy and needs stronger handling of sparse or empty retrieval results
-- the workflow is coding-oriented, terminal-based, tool-heavy, or multi-agent, but the existing API surface and tool definitions can remain unchanged
-
-Default action:
-
-- replace the model string with `gpt-5.5`
-- preserve the current reasoning effort for the first pass
-- make only the smallest prompt edits needed for the observed workflow risk
-- read the [GPT-5.5 prompting guide](/api/docs/guides/prompt-guidance?model=gpt-5.5) to choose the smallest prompt changes that recover or improve behavior
-- avoid broad prompt cleanup unrelated to the upgrade
-- for research workflows, add citation rules, retrieval budgets, missing-evidence behavior, and validation guidance from the prompting guide
-- for dependency-aware or tool-heavy workflows, add prerequisite checks, missing-context handling, explicit tool budgets, stop conditions, and validation guidance
-- for coding or terminal workflows, add repo-specific constraints, acceptance criteria, and concrete validation commands
-- for multi-agent support or triage workflows, add task ownership, handoff, completeness, and stopping criteria
-- for long-running Responses agents with preambles or multiple assistant messages, explicitly review whether `phase` is already handled; if adding or preserving `phase` would require code edits, mark the path as `blocked`
-- do not classify a coding or tool-using Responses workflow as `blocked` just because the visible snippet is minimal; prefer `model string + light prompt rewrite` unless the repo clearly shows that a safe GPT-5.5 path would require host-side code changes
-
-### `blocked`
-
-Choose this when:
-
-- the upgrade appears to require API-surface changes
-- the upgrade appears to require parameter rewrites or reasoning-setting changes that are not exposed outside implementation code
-- the upgrade would require changing tool definitions, tool handler wiring, or schema contracts
-- the user is asking for a tooling, IDE, plugin, shell, or environment migration rather than a model and prompt migration
-- the integration depends on provider-specific APIs that do not map to the current OpenAI API surface without implementation work
-- you cannot confidently identify the prompt surface tied to the model usage
-
-Default action:
-
-- do not improvise a broader upgrade
-- report the blocker and explain that the fix is out of scope for this guide
-- if useful, describe the smallest follow-up implementation task that would unblock the migration
-
-## Compatibility checklist
-
-Before applying or recommending a model-and-prompt-only upgrade, check:
-
-1. Can the current host accept the `gpt-5.5` model string without changing client code or API surface?
-2. Are the related prompts identifiable and editable?
-3. Does the host depend on behavior that likely needs API-surface changes, parameter rewrites, provider migration, or tool rewiring?
-4. Would the likely fix be prompt-only, or would it need implementation changes?
-5. Is the prompt surface close enough to the model usage that you can make a targeted change instead of a broad cleanup?
-6. Do strict structured outputs, schemas, or downstream parsers still have an explicit contract?
-7. For long-running Responses or tool-heavy agents, is `phase` already preserved if the host relies on preambles, replayed assistant items, or multiple assistant messages?
-8. Are latency, token, or price assumptions validated by tests, realistic spot checks, or an existing eval suite rather than inferred from general model positioning?
-
-If item 1 is no, items 3 through 4 point to implementation work, or item 7 is no and the fix needs code changes, return `blocked`.
-
-If item 2 is no, return `unknown` unless the user can point to the prompt location.
-
-Important:
-
-- Existing use of tools, agents, or multiple usage sites is not by itself a blocker.
-- If the current host can keep the same API surface and the same tool definitions, prefer `model string + light prompt rewrite` over `blocked`.
-- Reserve `blocked` for cases that truly require implementation changes, not cases that only need stronger prompt steering.
-- Do not claim token savings without task-level validation.
-
-## Scope boundaries
-
-This guide may:
-
-- update or recommend updated model strings
-- update or recommend updated prompts
-- inspect code and prompt files to understand where those changes belong
-- inspect whether existing Responses flows already preserve `phase`
-- flag compatibility blockers
-- propose validation with existing tests, realistic spot checks, or existing eval suites
-
-This guide may not:
-
-- move Chat Completions code to Responses
-- move Responses code to another API surface
-- migrate SDKs, APIs, IDE configuration, shell hooks, plugins, or provider-specific tooling
-- rewrite parameter shapes
-- change tool definitions or tool-call handling
-- change structured-output wiring
-- add or retrofit `phase` handling in implementation code
-- edit business logic, orchestration logic, SDK usage, IDE configuration, shell hooks, or plugin integration behavior except for model-string replacements and directly related prompt edits
-
-If a safe GPT-5.5 upgrade requires any of those changes, mark the path as blocked and out of scope.
-
-## Validation plan
-
-- Validate each upgraded usage site with existing tests, realistic spot checks, or an existing eval suite when one is already available.
-- Compare against the current GPT-5.4 baseline when available.
-- Check task success, retry count, tool-call count, total tokens, latency, output shape, and user-visible quality.
-- For specialized workflows, validate the contract that matters most instead of judging only general output quality.
-- If prompt edits were added, confirm each block is doing real work instead of adding noise.
-- If the workflow has downstream impact, add a lightweight verification pass before finalization.
diff --git a/skills/openai-docs/scripts/fetch-codex-manual.mjs b/skills/openai-docs/scripts/fetch-codex-manual.mjs
deleted file mode 100644
index b260552..0000000
--- a/skills/openai-docs/scripts/fetch-codex-manual.mjs
+++ /dev/null
@@ -1,598 +0,0 @@
-#!/usr/bin/env node
-import {
-  access,
-  mkdir,
-  readFile,
-  rename,
-  rm,
-  stat,
-  writeFile,
-} from "node:fs/promises";
-import { constants as fsConstants } from "node:fs";
-import { execFile } from "node:child_process";
-import { createHash } from "node:crypto";
-import path from "node:path";
-import process from "node:process";
-import { pathToFileURL } from "node:url";
-import { inspect, promisify } from "node:util";
-
-const DEFAULT_MANUAL_URL = "https://developers.openai.com/codex/codex-manual.md";
-const DEFAULT_CACHE_DIR_NAME = "openai-docs-cache";
-const CACHE_FILE_NAME = "codex-manual.md";
-const OUTLINE_FILE_NAME = "codex-manual.outline.md";
-const HASH_HEADER = "x-content-sha256";
-const USER_AGENT = "codex-openai-docs";
-const execFileAsync = promisify(execFile);
-
-class ManualFetchError extends Error {
-  constructor(message, options) {
-    super(message, options);
-    this.name = "ManualFetchError";
-  }
-}
-
-const sha256 = (value) => createHash("sha256").update(value).digest("hex");
-
-const withTimeout = async (promiseFactory, timeoutMs) => {
-  const controller = new AbortController();
-  const timeout = setTimeout(() => controller.abort(), timeoutMs);
-  try {
-    return await promiseFactory(controller.signal);
-  } finally {
-    clearTimeout(timeout);
-  }
-};
-
-const proxyConfigured = () =>
-  process.env.HTTP_PROXY ||
-  process.env.HTTPS_PROXY ||
-  process.env.http_proxy ||
-  process.env.https_proxy;
-
-const responseHeaders = (headers) => ({
-  get(name) {
-    return headers.get(name.toLowerCase()) ?? null;
-  },
-});
-
-const makeResponse = ({ body, headers, status }) => ({
-  headers: responseHeaders(headers),
-  ok: status >= 200 && status < 300,
-  status,
-  async text() {
-    return body;
-  },
-});
-
-const parseCurlHeaders = (rawHeaders) => {
-  const normalized = rawHeaders.replace(/\r\n/g, "\n").trim();
-  const blocks = normalized.split(/\n\n+/).filter(Boolean);
-  const headerBlock = [...blocks]
-    .reverse()
-    .find((block) => block.startsWith("HTTP/"));
-
-  if (!headerBlock) {
-    throw new ManualFetchError("curl did not return HTTP response headers.");
-  }
-
-  const [statusLine, ...lines] = headerBlock.split("\n");
-  const statusMatch = /^HTTP\/\S+\s+(\d{3})/.exec(statusLine);
-  if (!statusMatch) {
-    throw new ManualFetchError(
-      `Could not parse HTTP status from curl response: ${statusLine}`
-    );
-  }
-
-  const headers = new Map();
-  lines.forEach((line) => {
-    const separator = line.indexOf(":");
-    if (separator === -1) return;
-    const name = line.slice(0, separator).trim().toLowerCase();
-    const value = line.slice(separator + 1).trim();
-    headers.set(name, value);
-  });
-
-  return {
-    headers,
-    status: Number(statusMatch[1]),
-  };
-};
-
-const tempFilePath = (cacheDir, suffix) =>
-  path.join(
-    cacheDir,
-    `.fetch-codex-manual-${process.pid}-${Date.now()}-${Math.random()
-      .toString(16)
-      .slice(2)}${suffix}`
-  );
-
-const requestManualWithCurl = async (url, { cacheDir, method, timeoutMs }) => {
-  const headerPath = tempFilePath(cacheDir, ".headers");
-  const bodyPath = tempFilePath(cacheDir, ".body");
-  const curlNames =
-    process.platform === "win32" ? ["curl.exe", "curl"] : ["curl"];
-  const args = [
-    "--silent",
-    "--show-error",
-    "--location",
-    "--dump-header",
-    headerPath,
-    "--output",
-    bodyPath,
-    "--user-agent",
-    USER_AGENT,
-    "--max-time",
-    String(Math.max(1, Math.ceil(timeoutMs / 1000))),
-  ];
-
-  if (method === "HEAD") {
-    args.push("--head");
-  } else {
-    args.push("--request", method);
-  }
-  args.push(url);
-
-  let lastError;
-  for (const curlName of curlNames) {
-    try {
-      await execFileAsync(curlName, args, { windowsHide: true });
-      const [rawHeaders, body] = await Promise.all([
-        readFile(headerPath, "utf8"),
-        readFile(bodyPath, "utf8"),
-      ]);
-      const { headers, status } = parseCurlHeaders(rawHeaders);
-      return makeResponse({ body, headers, status });
-    } catch (error) {
-      lastError = error;
-      if (error?.code !== "ENOENT") break;
-    } finally {
-      await Promise.all([
-        rm(headerPath, { force: true }),
-        rm(bodyPath, { force: true }),
-      ]);
-    }
-  }
-
-  if (lastError?.code === "ENOENT") {
-    throw new ManualFetchError("curl is unavailable in this environment.", {
-      cause: lastError,
-    });
-  }
-  throw new ManualFetchError(`${method} ${url} could not be fetched.`, {
-    cause: lastError,
-  });
-};
-
-const requestManualWithFetch = async (url, { method, timeoutMs }) => {
-  if (typeof fetch !== "function") {
-    throw new ManualFetchError(
-      "Native fetch is unavailable in this Node runtime."
-    );
-  }
-
-  return withTimeout(
-    (signal) =>
-      fetch(url, {
-        method,
-        headers: { "User-Agent": USER_AGENT },
-        signal,
-      }),
-    timeoutMs
-  );
-};
-
-const requestManual = async (url, { cacheDir, method, timeoutMs }) => {
-  const preferCurl = Boolean(proxyConfigured()) || typeof fetch !== "function";
-  const transports = preferCurl
-    ? [
-        () => requestManualWithCurl(url, { cacheDir, method, timeoutMs }),
-        () => requestManualWithFetch(url, { method, timeoutMs }),
-      ]
-    : [
-        () => requestManualWithFetch(url, { method, timeoutMs }),
-        () => requestManualWithCurl(url, { cacheDir, method, timeoutMs }),
-      ];
-
-  let lastError;
-  for (const transport of transports) {
-    try {
-      const response = await transport();
-      if (!response.ok) {
-        throw new ManualFetchError(
-          `${method} ${url} failed with HTTP ${response.status}.`
-        );
-      }
-      return response;
-    } catch (error) {
-      lastError = error;
-    }
-  }
-
-  throw new ManualFetchError(`${method} ${url} could not be fetched.`, {
-    cause: lastError,
-  });
-};
-
-const readHeaderSha = (response) => {
-  const value = response.headers.get(HASH_HEADER);
-  if (!value || !/^[a-f0-9]{64}$/i.test(value)) {
-    throw new ManualFetchError(`Manual response is missing ${HASH_HEADER}.`);
-  }
-  return value.toLowerCase();
-};
-
-const nearestExistingParent = async (target) => {
-  let current = target;
-  while (true) {
-    try {
-      const info = await stat(current);
-      return info.isDirectory() ? current : null;
-    } catch (error) {
-      if (error?.code !== "ENOENT") return null;
-    }
-
-    const parent = path.dirname(current);
-    if (parent === current) return null;
-    current = parent;
-  }
-};
-
-const usableCacheDir = async (cacheDir) => {
-  if (!cacheDir) return null;
-  const resolved = path.resolve(cacheDir);
-
-  try {
-    const info = await stat(resolved);
-    if (!info.isDirectory()) return null;
-  } catch (error) {
-    if (error?.code !== "ENOENT") return null;
-  }
-
-  const parent = await nearestExistingParent(resolved);
-  if (!parent) return null;
-
-  try {
-    await access(parent, fsConstants.W_OK | fsConstants.X_OK);
-  } catch {
-    return null;
-  }
-
-  return resolved;
-};
-
-const defaultCacheDirCandidates = () => {
-  const candidates = [];
-  const seen = new Set();
-  const pushCandidate = (candidate) => {
-    if (!candidate || seen.has(candidate)) return;
-    seen.add(candidate);
-    candidates.push(candidate);
-  };
-
-  [process.env.TMPDIR, process.env.TEMP, process.env.TMP].forEach((baseDir) => {
-    if (baseDir) {
-      pushCandidate(path.join(baseDir, DEFAULT_CACHE_DIR_NAME));
-    }
-  });
-
-  if (process.platform !== "win32") {
-    pushCandidate(`/private/tmp/${DEFAULT_CACHE_DIR_NAME}`);
-    pushCandidate(`/tmp/${DEFAULT_CACHE_DIR_NAME}`);
-  }
-
-  return candidates;
-};
-
-const resolveCacheDir = async (cacheDir) => {
-  if (cacheDir) {
-    return usableCacheDir(cacheDir);
-  }
-
-  for (const candidate of defaultCacheDirCandidates()) {
-    const usable = await usableCacheDir(candidate);
-    if (usable) return usable;
-  }
-
-  return null;
-};
-
-const cacheFilePath = (cacheDir) => path.join(cacheDir, CACHE_FILE_NAME);
-
-const outlineFilePath = (cacheDir) => path.join(cacheDir, OUTLINE_FILE_NAME);
-
-const manualLines = (manual) => {
-  const lines = manual.replace(/\r\n/g, "\n").split("\n");
-  if (lines[lines.length - 1] === "") lines.pop();
-  return lines;
-};
-
-const sectionTitle = (rawTitle) =>
-  rawTitle.replace(/\s+#+\s*$/, "").replace(/\s+/g, " ").trim();
-
-const buildOutline = (manual) => {
-  const lines = manualLines(manual);
-  const headings = [];
-  let inFence = false;
-
-  lines.forEach((line, index) => {
-    if (/^\s*(```|~~~)/.test(line)) {
-      inFence = !inFence;
-      return;
-    }
-    if (inFence) return;
-
-    const match = /^(#{1,6})\s+(.+?)\s*$/.exec(line);
-    if (!match) return;
-
-    const level = match[1].length;
-    if (level < 2 || level > 3) return;
-
-    headings.push({
-      level,
-      title: sectionTitle(match[2]),
-      startLine: index + 1,
-      endLine: lines.length,
-    });
-  });
-
-  for (let index = 0; index < headings.length; index += 1) {
-    const heading = headings[index];
-    const nextPeer = headings
-      .slice(index + 1)
-      .find((candidate) => candidate.level <= heading.level);
-    if (nextPeer) {
-      heading.endLine = nextPeer.startLine - 1;
-    }
-  }
-
-  if (headings.length === 0) {
-    return {
-      headingCount: 0,
-      lineCount: lines.length,
-      text: "No markdown headings found.",
-    };
-  }
-
-  const minLevel = Math.min(...headings.map((heading) => heading.level));
-  return {
-    headingCount: headings.length,
-    lineCount: lines.length,
-    text: headings
-      .map((heading) => {
-        const indent = "  ".repeat(heading.level - minLevel);
-        return `${indent}- ${heading.title} (lines ${heading.startLine}-${heading.endLine})`;
-      })
-      .join("\n"),
-  };
-};
-
-const outlineMarkdown = (outline) => `# Codex Manual Outline\n\n${outline.text}\n`;
-
-const manualStatusLine = (status) =>
-  status.cacheStatus === "hit"
-    ? "Manual status: local manual was already current."
-    : "Manual status: local manual was updated.";
-
-const formatResult = ({ status, outlineText }) =>
-  [
-    `Manual path: ${status.manualPath}`,
-    `Outline path: ${status.outlinePath}`,
-    manualStatusLine(status),
-    "",
-    outlineText,
-  ].join("\n");
-
-const readCachedManual = async (cacheDir, expectedSha256) => {
-  try {
-    const manual = await readFile(cacheFilePath(cacheDir), "utf8");
-    return sha256(manual) === expectedSha256 ? manual : null;
-  } catch {
-    return null;
-  }
-};
-
-const writeCachedManual = async (cacheDir, manual) => {
-  await mkdir(cacheDir, { recursive: true });
-  const tmpPath = tempFilePath(cacheDir, `.${CACHE_FILE_NAME}.tmp`);
-  await writeFile(tmpPath, manual, "utf8");
-  await rename(tmpPath, cacheFilePath(cacheDir));
-};
-
-const writeOutline = async (cacheDir, outlineText) => {
-  await mkdir(cacheDir, { recursive: true });
-  const tmpPath = tempFilePath(cacheDir, `.${OUTLINE_FILE_NAME}.tmp`);
-  await writeFile(tmpPath, outlineText, "utf8");
-  await rename(tmpPath, outlineFilePath(cacheDir));
-};
-
-const fetchCodexManual = async ({
-  manualUrl = DEFAULT_MANUAL_URL,
-  cacheDir,
-  timeoutMs = 30000,
-} = {}) => {
-  const resolvedCacheDir = await resolveCacheDir(cacheDir);
-  if (!resolvedCacheDir) {
-    throw new ManualFetchError(
-      "Manual cache directory is unavailable; pass --cache-dir to override or use OpenAI Docs MCP fallback."
-    );
-  }
-  await mkdir(resolvedCacheDir, { recursive: true });
-
-  const headResponse = await requestManual(manualUrl, {
-    cacheDir: resolvedCacheDir,
-    method: "HEAD",
-    timeoutMs,
-  });
-  const expectedSha256 = readHeaderSha(headResponse);
-  const manualPath = cacheFilePath(resolvedCacheDir);
-  const outlinePath = outlineFilePath(resolvedCacheDir);
-  const checkedAt = new Date().toISOString();
-
-  const cachedManual = await readCachedManual(resolvedCacheDir, expectedSha256);
-  if (cachedManual !== null) {
-    const outline = buildOutline(cachedManual);
-    const outlineText = outlineMarkdown(outline);
-    await writeOutline(resolvedCacheDir, outlineText);
-
-    return {
-      outlineText,
-      status: {
-        manualUrl,
-        headerSha256: expectedSha256,
-        fetchedManualSha256: expectedSha256,
-        manualHashMatches: true,
-        cacheStatus: "hit",
-        cacheDir: resolvedCacheDir,
-        manualPath,
-        outlinePath,
-        checkedAt,
-        lineCount: outline.lineCount,
-        headingCount: outline.headingCount,
-      },
-    };
-  }
-
-  const getResponse = await requestManual(manualUrl, {
-    cacheDir: resolvedCacheDir,
-    method: "GET",
-    timeoutMs,
-  });
-  const getHeaderSha256 = readHeaderSha(getResponse);
-  if (getHeaderSha256 !== expectedSha256) {
-    throw new ManualFetchError(
-      `${HASH_HEADER} changed between HEAD and GET for ${manualUrl}.`
-    );
-  }
-
-  const manualText = await getResponse.text();
-  const actualSha256 = sha256(manualText);
-  const manualHashMatches = actualSha256 === expectedSha256;
-  if (!manualHashMatches) {
-    throw new ManualFetchError(
-      `${HASH_HEADER} did not match the fetched manual body for ${manualUrl}.`
-    );
-  }
-
-  await writeCachedManual(resolvedCacheDir, manualText);
-  const outline = buildOutline(manualText);
-  const outlineText = outlineMarkdown(outline);
-  await writeOutline(resolvedCacheDir, outlineText);
-
-  return {
-    outlineText,
-    status: {
-      manualUrl,
-      headerSha256: expectedSha256,
-      fetchedManualSha256: actualSha256,
-      manualHashMatches,
-      cacheStatus: "updated",
-      cacheDir: resolvedCacheDir,
-      manualPath,
-      outlinePath,
-      checkedAt,
-      lineCount: outline.lineCount,
-      headingCount: outline.headingCount,
-    },
-  };
-};
-
-const parseArgs = (argv) => {
-  const args = {
-    manualUrl: DEFAULT_MANUAL_URL,
-    cacheDir: undefined,
-    timeoutMs: 30000,
-    statusJson: false,
-  };
-
-  for (let index = 0; index < argv.length; index += 1) {
-    const arg = argv[index];
-    if (arg === "--manual-url") {
-      args.manualUrl = argv[++index];
-    } else if (arg === "--cache-dir") {
-      args.cacheDir = argv[++index];
-    } else if (arg === "--timeout-ms") {
-      args.timeoutMs = Number(argv[++index]);
-    } else if (arg === "--status-json") {
-      args.statusJson = true;
-    } else {
-      throw new ManualFetchError(`Unknown argument: ${arg}`);
-    }
-  }
-
-  if (!args.manualUrl) {
-    throw new ManualFetchError("--manual-url cannot be empty.");
-  }
-  if (!Number.isFinite(args.timeoutMs) || args.timeoutMs <= 0) {
-    throw new ManualFetchError("--timeout-ms must be a positive number.");
-  }
-
-  return args;
-};
-
-const main = async () => {
-  const args = parseArgs(process.argv.slice(2));
-  const { outlineText, status } = await fetchCodexManual(args);
-
-  process.stdout.write(formatResult({ status, outlineText }));
-
-  if (args.statusJson) {
-    console.error(JSON.stringify(status));
-  }
-};
-
-const envProxyHint = () => {
-  if (proxyConfigured()) {
-    return "Hint: proxy env vars are present. This helper prefers `curl` in proxied sessions; if requests still fail, verify `curl` is installed and the proxy configuration is valid.";
-  }
-  if (typeof fetch !== "function") {
-    return "Hint: native fetch is unavailable in this Node runtime. Install `curl` or use a newer Node version to fetch the manual.";
-  }
-  if (process.platform === "win32") {
-    return "Hint: on Windows, pass a cache dir under `%TEMP%` or `%TMP%`.";
-  }
-  return null;
-};
-
-const formatErrorDetails = (error) => {
-  const details = inspect(error, {
-    breakLength: 120,
-    colors: false,
-    compact: false,
-    depth: 8,
-  });
-  if (!error?.cause) {
-    return details;
-  }
-
-  return `${details}\n\nCause:\n${inspect(error.cause, {
-    breakLength: 120,
-    colors: false,
-    compact: false,
-    depth: 8,
-  })}`;
-};
-
-const isCliEntrypoint = () => {
-  const entrypoint = process.argv[1];
-  if (!entrypoint) {
-    return false;
-  }
-
-  return pathToFileURL(entrypoint).href === import.meta.url;
-};
-
-if (isCliEntrypoint()) {
-  main().catch((error) => {
-    console.error(`Error: ${error.message}`);
-    const hint = envProxyHint();
-    if (hint) {
-      console.error(hint);
-    }
-    console.error("");
-    console.error("Details:");
-    console.error(formatErrorDetails(error));
-    process.exitCode = 1;
-  });
-}
-
-export { DEFAULT_MANUAL_URL, fetchCodexManual };
diff --git a/skills/openai-docs/scripts/resolve-latest-model-info.js b/skills/openai-docs/scripts/resolve-latest-model-info.js
deleted file mode 100644
index 1bd16ac..0000000
--- a/skills/openai-docs/scripts/resolve-latest-model-info.js
+++ /dev/null
@@ -1,147 +0,0 @@
-#!/usr/bin/env node
-
-const fs = require("node:fs/promises");
-const path = require("node:path");
-
-const DEFAULT_URL =
-  "https://developers.openai.com/api/docs/guides/latest-model.md";
-const DEFAULT_BASE_URL = "https://developers.openai.com";
-
-function parseArgs(argv) {
-  const args = {
-    source: process.env.LATEST_MODEL_URL || DEFAULT_URL,
-    baseUrl: process.env.LATEST_MODEL_BASE_URL || DEFAULT_BASE_URL,
-  };
-
-  for (let i = 2; i < argv.length; i += 1) {
-    const arg = argv[i];
-    if (arg === "--source" || arg === "--url") {
-      args.source = argv[i + 1];
-      i += 1;
-    } else if (arg === "--base-url") {
-      args.baseUrl = argv[i + 1];
-      i += 1;
-    }
-  }
-
-  return args;
-}
-
-async function readSource(source) {
-  if (source.startsWith("file://")) {
-    return fs.readFile(new URL(source), "utf8");
-  }
-
-  if (!/^https?:\/\//.test(source)) {
-    return fs.readFile(path.resolve(source), "utf8");
-  }
-
-  const response = await fetch(source, {
-    headers: { accept: "text/markdown,text/plain,*/*" },
-  });
-
-  if (!response.ok) {
-    throw new Error(`failed to fetch ${source}: ${response.status}`);
-  }
-
-  return response.text();
-}
-
-function parseIndentedInfo(lines, startIndex) {
-  const info = {};
-
-  for (let i = startIndex + 1; i < lines.length; i += 1) {
-    const line = lines[i];
-    if (!line.trim()) {
-      continue;
-    }
-
-    const match = line.match(/^ {2}([A-Za-z][A-Za-z0-9_-]*):\s*(.+?)\s*$/);
-    if (!match) {
-      break;
-    }
-
-    info[match[1]] = match[2].replace(/^["']|["']$/g, "");
-  }
-
-  return info;
-}
-
-function parseFlatInfo(block) {
-  const info = {};
-
-  for (const line of block.split(/\r?\n/)) {
-    const match = line.match(/^\s*([A-Za-z][A-Za-z0-9_-]*):\s*(.+?)\s*$/);
-    if (match) {
-      info[match[1]] = match[2].replace(/^["']|["']$/g, "");
-    }
-  }
-
-  return info;
-}
-
-function extractLatestModelInfo(markdown) {
-  const lines = markdown.split(/\r?\n/);
-  const latestModelInfoIndex = lines.findIndex((line) =>
-    /^latestModelInfo:\s*$/.test(line)
-  );
-
-  if (latestModelInfoIndex >= 0) {
-    return parseIndentedInfo(lines, latestModelInfoIndex);
-  }
-
-  const commentMatch = markdown.match(
-    /<!--\s*latestModelInfo\s*\n([\s\S]*?)\n\s*-->/m
-  );
-  if (commentMatch) {
-    return parseFlatInfo(commentMatch[1]);
-  }
-
-  return undefined;
-}
-
-function modelToSkillSlug(model) {
-  return model.trim().replace(/\./g, "p");
-}
-
-function absoluteUrl(baseUrl, value) {
-  return new URL(value, baseUrl).toString();
-}
-
-function normalizeInfo(info, baseUrl) {
-  const model = info?.model?.trim();
-  const migrationGuide = info?.migrationGuide?.trim();
-  const promptingGuide = info?.promptingGuide?.trim();
-
-  if (!model || !migrationGuide || !promptingGuide) {
-    throw new Error(
-      "latestModelInfo must include model, migrationGuide, and promptingGuide"
-    );
-  }
-
-  return {
-    model,
-    modelSlug: modelToSkillSlug(model),
-    migrationGuideUrl: absoluteUrl(baseUrl, migrationGuide),
-    promptingGuideUrl: absoluteUrl(baseUrl, promptingGuide),
-  };
-}
-
-async function main() {
-  const { source, baseUrl } = parseArgs(process.argv);
-  const markdown = await readSource(source);
-  const info = extractLatestModelInfo(markdown);
-
-  if (!info) {
-    throw new Error(`latestModelInfo block not found in ${source}`);
-  }
-
-  process.stdout.write(
-    `${JSON.stringify(normalizeInfo(info, baseUrl), null, 2)}\n`
-  );
-}
-
-main().catch((error) => {
-  console.error(error.message);
-  process.exit(1);
-});
diff --git a/skills/plugin-creator/SKILL.md b/skills/plugin-creator/SKILL.md
deleted file mode 100644
index af960ec..0000000
--- a/skills/plugin-creator/SKILL.md
+++ /dev/null
@@ -1,243 +0,0 @@
----
-name: plugin-creator
-description: Create and scaffold plugin directories for Codex with a required `.codex-plugin/plugin.json`, optional plugin folders/files, valid manifest defaults, and personal-marketplace entries by default. Use when Codex needs to create a new personal plugin, add optional plugin structure, generate or update marketplace entries for plugin ordering and availability metadata, or update an existing local plugin during development with the CLI-driven cachebuster and reinstall flow.
----
-
-# Plugin Creator
-
-## Quick Start
-
-1. Run the scaffold script:
-
-```bash
-# Plugin names are normalized to lower-case hyphen-case and must be <= 64 chars.
-# The generated folder and plugin.json name are always the same.
-# Run from the skill root (the directory containing this `SKILL.md`).
-# By default creates in `~/plugins/<plugin-name>`.
-python3 scripts/create_basic_plugin.py <plugin-name>
-```
-
-2. Edit `<plugin-path>/.codex-plugin/plugin.json` when the request gives specific metadata.
-   The scaffold starts with valid defaults and must not contain `[TODO: ...]` placeholders.
-
-3. Generate or update the personal marketplace entry when the plugin should appear in Codex UI ordering:
-
-```bash
-# Personal marketplace entries default to `~/.agents/plugins/marketplace.json`.
-python3 scripts/create_basic_plugin.py my-plugin --with-marketplace
-```
-
-Only specify `--marketplace-name <name>` when the default `personal` marketplace name is already
-taken or installed and you need to seed a different new marketplace file:
-
-```bash
-python3 scripts/create_basic_plugin.py my-plugin \
-  --with-marketplace \
-  --marketplace-name team-local
-```
-
-Only use a repo/team marketplace when the user specifically asks for that destination:
-
-```bash
-python3 scripts/create_basic_plugin.py my-plugin \
-  --path <repo-root>/plugins \
-  --marketplace-path <repo-root>/.agents/plugins/marketplace.json \
-  --with-marketplace
-```
-
-When the user specifies a marketplace path, make sure that marketplace is actually installed before
-telling the user to reinstall from it. The default personal marketplace file at
-`~/.agents/plugins/marketplace.json` is discovered implicitly, but other marketplace paths are not.
-On Windows, use the equivalent path under the user profile.
-
-4. Generate/adjust optional companion folders as needed:
-
-```bash
-python3 scripts/create_basic_plugin.py my-plugin \
-  --path <parent-plugin-directory> \
-  --marketplace-path <marketplace-json-path> \
-  --with-skills --with-hooks --with-scripts --with-assets --with-mcp --with-apps --with-marketplace
-```
-
-`<parent-plugin-directory>` is the directory where the plugin folder `<plugin-name>` will be
-created (for example `~/plugins`).
-
-5. Before handing back a generated plugin, run:
-
-```bash
-python3 scripts/validate_plugin.py <plugin-path>
-```
-
-For updates to an existing local plugin during development, keep the scaffold flow as-is and use the
-reference instead of hand-editing marketplace files:
-
-```bash
-python3 scripts/update_plugin_cachebuster.py <plugin-path>
-```
-
-Prefer the helper default cachebuster unless the user explicitly asks for a specific override.
-See `references/installing-and-updating.md` for the expected cachebuster and reinstall flow while iterating on an existing local plugin.
-
-## What this skill creates
-
-- Default marketplace-backed scaffolds use the personal marketplace file at
-  `~/.agents/plugins/marketplace.json`, with plugins generally being stored in
-  `~/plugins/<plugin-name>/`.
-- Creates plugin root at `/<parent-plugin-directory>/<plugin-name>/`.
-- Always creates `/<parent-plugin-directory>/<plugin-name>/.codex-plugin/plugin.json`.
-- Fills the manifest with the validated schema shape that the ingestion path accepts.
-- Creates or updates `~/.agents/plugins/marketplace.json` when `--with-marketplace` is set.
-  - If the marketplace file does not exist yet, seed a personal marketplace root before adding the first plugin entry.
-- `<plugin-name>` is normalized using skill-creator naming rules:
-  - `My Plugin` → `my-plugin`
-  - `My--Plugin` → `my-plugin`
-  - underscores, spaces, and punctuation are converted to `-`
-  - result is lower-case hyphen-delimited with consecutive hyphens collapsed
-- Supports optional creation of:
-  - `skills/`
-  - `hooks/`
-  - `scripts/`
-  - `assets/`
-  - `.mcp.json`
-  - `.app.json`
-
-## Marketplace workflow
-
-- Personal-marketplace creation defaults to `~/.agents/plugins/marketplace.json`. Here,
-  "personal marketplace" means the marketplace whose file is at that path.
-- Repo/team marketplace creation is opt-in through both `--path` and `--marketplace-path`, only
-  when the user specifically requests it.
-- `--marketplace-name` is an exception path. Use it only when the default `personal` marketplace
-  name is already taken and you need to seed a different new marketplace file.
-- Do not use `--marketplace-name` to rename an existing marketplace file in place. If the file
-  already exists, its top-level `name` must already match.
-- If the user specifies a different marketplace path, treat that marketplace as needing explicit installation via `codex plugin marketplace add`.
-- Prefer `scripts/read_marketplace_name.py` when you need the marketplace name from any
-  `marketplace.json` file. With no argument it reads the default personal marketplace; with an
-  explicit path it works for repo/team marketplaces too.
-- In either location, the generated source path remains `./plugins/<plugin-name>`.
-- Marketplace root metadata supports top-level `name` plus optional `interface.displayName`.
-- Treat plugin order in `plugins[]` as render order in Codex. Append new entries unless a user explicitly asks to reorder the list.
-- `displayName` belongs inside the marketplace `interface` object, not individual `plugins[]` entries.
-- Each generated marketplace entry must include all of:
-  - `policy.installation`
-  - `policy.authentication`
-  - `category`
-- Default new entries to:
-  - `policy.installation: "AVAILABLE"`
-  - `policy.authentication: "ON_INSTALL"`
-- Override defaults only when the user explicitly specifies another allowed value.
-- Allowed `policy.installation` values:
-  - `NOT_AVAILABLE`
-  - `AVAILABLE`
-  - `INSTALLED_BY_DEFAULT`
-- Allowed `policy.authentication` values:
-  - `ON_INSTALL`
-  - `ON_USE`
-- Treat `policy.products` as an override. Omit it unless the user explicitly requests product gating.
-- The generated plugin entry shape is:
-
-```json
-{
-  "name": "plugin-name",
-  "source": {
-    "source": "local",
-    "path": "./plugins/plugin-name"
-  },
-  "policy": {
-    "installation": "AVAILABLE",
-    "authentication": "ON_INSTALL"
-  },
-  "category": "Productivity"
-}
-```
-
-- Use `--force` only when intentionally replacing an existing marketplace entry for the same plugin name.
-- If the target marketplace file does not exist yet, create it with top-level `"name"`, an `"interface"` object containing `"displayName"`, and a `plugins` array, then add the new entry.
-
-- For a brand-new marketplace file, the root object should look like:
-
-```json
-{
-  "name": "personal",
-  "interface": {
-    "displayName": "Personal"
-  },
-  "plugins": [
-    {
-      "name": "plugin-name",
-      "source": {
-        "source": "local",
-        "path": "./plugins/plugin-name"
-      },
-      "policy": {
-        "installation": "AVAILABLE",
-        "authentication": "ON_INSTALL"
-      },
-      "category": "Productivity"
-    }
-  ]
-}
-```
-
-## Required behavior
-
-- Outer folder name and `plugin.json` `"name"` are always the same normalized plugin name.
-- Do not remove required structure; keep `.codex-plugin/plugin.json` present.
-- Do not leave `[TODO: ...]` placeholders in plugin manifests.
-- Keep `apps` and `mcpServers` out of `plugin.json` unless their companion files are actually created.
-- Omit unsupported plugin manifest fields that validation rejects, including `hooks`.
-- If creating files inside an existing plugin path, use `--force` only when overwrite is intentional.
-- Preserve any existing marketplace `interface.displayName`.
-- When generating marketplace entries, always write `policy.installation`, `policy.authentication`, and `category` even if their values are defaults.
-- Add `policy.products` only when the user explicitly asks for that override.
-- Keep marketplace `source.path` relative to the selected marketplace root as `./plugins/<plugin-name>`.
-- Only use `--marketplace-name` when creating a new marketplace file whose name should not be
-  `personal` because that name is already taken or installed elsewhere.
-- If Codex would need approval to write the marketplace file, ask for that approval before
-  proceeding. If the user prefers to run the write themselves, provide the exact scaffold command
-  and then continue from validation or subsequent plugin edits instead of leaving the workflow
-  vague.
-- For updates to an existing local plugin during development, do not hand-edit marketplace config
-  or `marketplace.json`. Use the update flow documented in
-  `references/installing-and-updating.md` and `scripts/update_plugin_cachebuster.py`.
-- Do not tell the user to run `codex plugin marketplace add` for the default personal-marketplace
-  flow. That command is for explicit non-default marketplace configuration, not for the standard
-  `~/.agents/plugins/marketplace.json` path.
-- If the user provided a non-default `--marketplace-path`, make sure that marketplace is installed
-  before giving reinstall instructions. Use `codex plugin marketplace add <path-to-marketplace-root>`
-  when that explicit marketplace has not been configured yet.
-- When the workflow created or updated a marketplace-backed plugin, end the final user-facing
-  response with a short Codex app handoff. Say `To view this in the Codex app:` and write
-  `View <normalized plugin name>` and `Share <normalized plugin name>` as Markdown links, not raw
-  URLs or code spans.
-- The View deeplink uses `codex://plugins/<normalized plugin name>?marketplacePath=<absolute marketplace.json path>`.
-  The Share deeplink uses the same URL with `&mode=share`.
-- Replace the placeholders with the real normalized plugin name and absolute `marketplace.json`
-  path from the scaffolded plugin. URL-encode the path segment and query value when needed.
-- Do not add `pluginName` or `hostId` query parameters to these deeplinks. Codex derives both after
-  the user clicks the link.
-- Do not emit the `View <normalized plugin name>` or `Share <normalized plugin name>` links when no marketplace entry was
-  created or updated.
-
-## Reference to exact spec sample
-
-For the exact canonical sample JSON for both plugin manifests and marketplace entries, use:
-
-- `references/plugin-json-spec.md`
-- `references/installing-and-updating.md` for update/reinstall guidance while
-  iterating on an existing local plugin, plus the new-thread pickup behavior after reinstall
-
-## Validation
-
-After editing `SKILL.md`, run:
-
-```bash
-python3 ../skill-creator/scripts/quick_validate.py .
-```
-
-Before handing back a generated plugin, run:
-
-```bash
-python3 scripts/validate_plugin.py <plugin-path>
-```
diff --git a/skills/plugin-creator/agents/openai.yaml b/skills/plugin-creator/agents/openai.yaml
deleted file mode 100644
index 19a9a6f..0000000
--- a/skills/plugin-creator/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "Plugin Creator"
-  short_description: "Scaffold plugins and marketplace entries"
-  default_prompt: "Use $plugin-creator to scaffold a valid plugin in the personal marketplace, then validate it before handing it back."
-  icon_small: "./assets/plugin-creator-small.svg"
-  icon_large: "./assets/plugin-creator.png"
diff --git a/skills/plugin-creator/assets/plugin-creator-small.svg b/skills/plugin-creator/assets/plugin-creator-small.svg
deleted file mode 100644
index c6e4f67..0000000
--- a/skills/plugin-creator/assets/plugin-creator-small.svg
+++ /dev/null
@@ -1,3 +0,0 @@
-<svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" fill="currentColor" viewBox="0 0 20 20">
-  <path fill="#0D0D0D" d="M12.03 4.113a3.612 3.612 0 0 1 5.108 5.108l-6.292 6.29c-.324.324-.56.561-.791.752l-.235.176c-.205.14-.422.261-.65.36l-.229.093a4.136 4.136 0 0 1-.586.16l-.764.134-2.394.4c-.142.024-.294.05-.423.06-.098.007-.232.01-.378-.026l-.149-.05a1.081 1.081 0 0 1-.521-.474l-.046-.093a1.104 1.104 0 0 1-.075-.527c.01-.129.035-.28.06-.422l.398-2.394c.1-.602.162-.987.295-1.35l.093-.23c.1-.228.22-.445.36-.65l.176-.235c.19-.232.428-.467.751-.79l6.292-6.292Zm-5.35 7.232c-.35.35-.534.535-.66.688l-.11.147a2.67 2.67 0 0 0-.24.433l-.062.154c-.08.22-.124.462-.232 1.112l-.398 2.394-.001.001h.003l2.393-.399.717-.126a2.63 2.63 0 0 0 .394-.105l.154-.063a2.65 2.65 0 0 0 .433-.24l.147-.11c.153-.126.339-.31.688-.66l4.988-4.988-3.227-3.226-4.987 4.988Zm9.517-6.291a2.281 2.281 0 0 0-3.225 0l-.364.362 3.226 3.227.363-.364c.89-.89.89-2.334 0-3.225ZM4.583 1.783a.3.3 0 0 1 .294.241c.117.585.347 1.092.707 1.48.357.385.859.668 1.549.783a.3.3 0 0 1 0 .592c-.69.115-1.192.398-1.549.783-.315.34-.53.77-.657 1.265l-.05.215a.3.3 0 0 1-.588 0c-.117-.585-.347-1.092-.707-1.48-.357-.384-.859-.668-1.549-.783a.3.3 0 0 1 0-.592c.69-.115 1.192-.398 1.549-.783.36-.388.59-.895.707-1.48l.015-.05a.3.3 0 0 1 .279-.19Z"/>
-</svg>
diff --git a/skills/plugin-creator/assets/plugin-creator.png b/skills/plugin-creator/assets/plugin-creator.png
deleted file mode 100644
index 4f3d6d82fa78fbdce97af3c17f6a25c683aa3290..0000000000000000000000000000000000000000
GIT binary patch
literal 0
HcmV?d00001

literal 1563
zcmV+$2ITpPP)<h;3K|Lk000e1NJLTq003kF003kN1^@s6aN?Cz00009a7bBm000XU
z000XU0RWnu7ytkO0drDELIAGL9O(c600d`2O+f$vv5yP<VFdsH1+Ym(K~#7F?cH5#
z99100@!y%5ZPPYs)~0PjXk@GQA{H?sLh4NusZb$>1#i4F!Dtb@FnH%p6OalPi4TDy
zMcTdqNqhk%K`*Qbx>_X{K4hvjHd<=hH0fq{Gsiib9J_g*IrFfyGygA?&1Rp<e)!Lv
z&F&-sMNt$*Q4~c{6h%=KMNyPO4AlSe^Y3O*N_Bv<bom=~{{V|kChCnG>l>Iw2qhkb
ze|)YB#{A1DHe~H{=}oVwFPPA*37~O^y*^+fpb`thKY1$)zGE1LrVQMsu}jdkKwuIF
z!Y>Y|aer<UrQKcdlAZ^Q{2)91&JcVoQ6T*Ma0W$d-2N&9zp9%V!;uSptb5j%eT;^L
z6bObW-<-wIr$^yai2w-<LzX|##Yf)12p@_)$mHZ?=J%(Mjaw-rgCMhbFaPM=oA6ky
z_aOp9(=>ZBkl8tR2W{Vc1+7>_fXyPMKjmfh7264^#1Q8f8yfM)Gsj@1QV6g#maH@I
zP%I~8Ek<RbOv;k}5F1c?Wgoi<*$P7x%A{x|<$X!4K(@n>1&*Sz<4`O%n=C#xm?`ka
z@f*eCnG*Imx=o;)FU8GPEG9%?fE(jGa4*wlOu)drquT{LDa8yFs(BEJAz$>R*gPVE
zqU#+{sHQ>IV#p$cqEO9(Y=$ALItt^-S@v#+A*(J*LO`5i$f|}?GICI;ra;_c$ihcq
zX6#?7t76DPMwx(OH38xkLlzp!uBppVEb<_JVaNhUVVGdAj!ZzYNQ3x|AuFRSya%H+
z?dbZhQ0jjifQKRr5)?-HzW@Ca#_cg2y7h{`C>$TMzDr80D_JB#g2uq?7v-;0HimyF
z%!H*6!ecrjR#+G^-I_yvejNAeo`a<|Y<nL|JL@pN{{Z&hoCdS3mG9aZOIo+R)V&Fh
zMG7Qr44F3+E-_5_P-H-=g&|WxS=iTPHeUbJHw;lE-k_>BMrB2#6*u;OYX9V;b-SyY
zmSuIfx3`<{v8qo<lrTgNCnXS!^5dh5MGZr?4N71b<;O;qiYkU|6O=$P%8!dG6m<;Q
z8kE2>M4|80YXzgSg7L69b@21RF+`z))FOtR$uxAc?!1W*3JruXoD~WPVK^^v5W;X*
zpdf_dzQ8~TL#;qS2tz&JK?uWJzP@9~zdK179`pAt+{P25gyAjUK={;^Ves}2U?==6
zNf;tu_96V2E4^TR<-qwx`(A%qKJ|LP3BwTiGa(EWhXUIZ!jHo1q$CkT<Qb$q9qaZR
z-cXW?A@V*UtEQteHIyV{h&+Mtsqv1jS5@v%l8zzrHX()S?Dki3hC&$2c>~d#9UdUR
zH40%o$QuZQi$i}mMj?#VDT6HUKah5JtJNrku|D+)DV1De$d*y~ogWBegVa9;v@4x`
z{E^m^dv>Y3)-b^IHelgvz;bpZlf!BnL!=DS*wpgU)oZ_Yc0Tbalu)#Ku-%=0qSQQw
zNPQo|`ICR&zKgd<K7%+_%4h~_Ia@yUSS&C^${>uf@(L>gD6zp1DQ&W{*=*XftU-Bx
z{{AAaUi%GI*nGtbL!>kzrBZ3#>yIi-O6)L1N+5D`wYCsZVu>MA1<7o7SqLbx#Skfh
zh!xgWmj{RvYYdUEo2<$LK#4tu$n`2~?FwtF{91jn{I@yA@4gUs43X;z*=U8eRh}nB
zZ@!E}7h*pdGS?vX=F0UC71dDKEG$029y`&?4tIz02f3n9Xus>kIZ7E~2%2`79eMr(
zBrMmT%M$w#UDy9A6bf}v=-|G+IQzzn<<ph_!YmliS%q8QYkJd|jWB@(r}RO&{{H^K
znVFe0E^lVq|8n+{`TD76Tg=x^9nGP>BbTJjk&~1^x!BXwGidKmHbOD6^2FPh=j>?`
zzdy<x8yll1-a(!|N-8#Aa@A!RhIqp1iKi%vq9}@@D2k#eilV55^dCV<^wOW~YLEZ`
N002ovPDHLkV1k6v&87eV

diff --git a/skills/plugin-creator/references/installing-and-updating.md b/skills/plugin-creator/references/installing-and-updating.md
deleted file mode 100644
index 28b3b88..0000000
--- a/skills/plugin-creator/references/installing-and-updating.md
+++ /dev/null
@@ -1,143 +0,0 @@
-# Updating Existing Local Plugins
-
-Use this reference when a plugin already exists and the request is about updating the plugin during 
-local development.
-
-All scripts here are specified relative to the skill root. Update the path for running the scripts
-depending on your current working directory.
-
-## When To Use This Flow
-
-Use this flow when all of the following are true:
-
-- the plugin already exists locally
-- the marketplace entry already points at the plugin source you are editing
-- the user wants Codex to see the updated plugin without manually editing marketplace files
-
-If the user still needs the initial plugin entry or marketplace structure created, use the scaffold
-flow first and only then switch to this reinstall flow.
-
-## Update Loop
-
-1. Update the plugin manifest to a single Codex cachebuster suffix:
-
-```bash
-python3 scripts/update_plugin_cachebuster.py \
-  <plugin-path>
-```
-
-Prefer the default helper behavior here. If you omit `--cachebuster`, the helper uses a UTC
-timestamp down to seconds, which is the recommended path for routine local iteration.
-
-Only use a manual cachebuster override when the user explicitly asks for one or when a workflow
-outside Codex depends on a specific token:
-
-```bash
-python3 scripts/update_plugin_cachebuster.py \
-  <plugin-path> \
-  --cachebuster local-20260519-184516
-```
-
-2. For the default scaffolded flow, read the marketplace name from the personal marketplace file:
-
-```bash
-python3 scripts/read_marketplace_name.py
-```
-
-Here, "personal marketplace" means the marketplace whose file is at
-`~/.agents/plugins/marketplace.json`. On Windows, use the equivalent path under the user profile.
-The helper uses Python's home-directory resolution and prints the marketplace name to use when
-constructing the install command.
-
-To read the name from a different marketplace file, pass the path directly:
-
-```bash
-python3 scripts/read_marketplace_name.py --marketplace-path <path-to-marketplace.json>
-```
-
-3. Reinstall from that marketplace name:
-
-```bash
-codex plugin add <plugin-name>@<marketplace-name-from-marketplace-json>
-```
-
-The default personal marketplace is discovered implicitly from
-`~/.agents/plugins/marketplace.json`. You do not need `codex plugin marketplace add` for that
-path, and `codex plugin marketplace list` is not the right check for whether that default
-marketplace exists.
-
-4. If the plugin is not using the personal marketplace file, check which configured local
-   marketplace is actually surfacing that plugin:
-
-```bash
-codex plugin list
-```
-
-If the plugin is not in the personal marketplace file, confirm which marketplace entry points at
-the plugin source you are editing and make sure that marketplace is still local. If it is a
-different local marketplace, reinstall from that marketplace name instead of forcing the personal
-marketplace flow. If it is not local, stop and help the user resolve the mismatch before
-continuing.
-
-5. If the plugin lives in a different confirmed local marketplace, substitute that marketplace
-   name:
-
-```bash
-codex plugin add <plugin-name>@<local-marketplace>
-```
-
-6. Prompt the user to use a new thread to try the updated plugin, so that Codex picks up new skills
-   and tools.
-
-## Cachebuster Policy
-
-- Preserve the existing version prefix and replace only the suffix.
-- Treat the preserved prefix as everything before `+`.
-- Use the format:
-
-```text
-<base-version>+codex.<cachebuster>
-```
-
-Examples:
-
-- `0.1.0` → `0.1.0+codex.local-20260519-184516`
-- `0.1.0+codex.old-token` → `0.1.0+codex.local-20260519-184516`
-- `1.2.3-beta.1+codex.prev` → `1.2.3-beta.1+codex.local-20260519-184516`
-- `dev-build+other-tag` → `dev-build+codex.local-20260519-184516`
-
-Replace the existing Codex cachebuster instead of appending another one. Do not keep incrementing
-numeric version components just to trigger reinstall behavior.
-
-## Marketplace Rules
-
-- Marketplace manipulation should happen through commands, not by hand-editing `marketplace.json`
-  or `config.toml` during this update/reinstall flow.
-- Prefer the personal marketplace file for the default scaffolded flow.
-- Read the personal marketplace name with
-  `python3 scripts/read_marketplace_name.py` and use the printed value when constructing
-  `codex plugin add <plugin-name>@<marketplace-name>`.
-- For non-default marketplace files, use
-  `python3 scripts/read_marketplace_name.py --marketplace-path <path-to-marketplace.json>` to read
-  the name before constructing reinstall commands.
-- Do not tell the user to run `codex plugin marketplace add` for the default personal-marketplace
-  flow. That marketplace is discovered implicitly by Codex.
-- If the user specified a different marketplace path, make sure that marketplace is installed
-  before giving install or reinstall instructions. Non-default marketplace paths are not
-  discovered implicitly.
-- Use `codex plugin list` when the plugin lives in a different configured marketplace and you need
-  to confirm which marketplace is surfacing that plugin.
-- If a non-default local marketplace has not been configured yet, install it with
-  `codex plugin marketplace add <path-to-marketplace-root>` before telling the user to run
-  `codex plugin add <plugin-name>@<marketplace-name>`.
-- If the plugin is not in the personal marketplace file, confirm that the selected marketplace is
-  local before telling the user to reinstall from it.
-- If the selected marketplace is not local, stop and help the user resolve that mismatch rather
-  than pretending the normal local reinstall flow applies.
-- If the plugin source is not already the source referenced by the chosen marketplace entry, stop
-  and fix that first. This update flow does not rewrite marketplace entries.
-
-## After Reinstall
-
-After reinstalling, prompt the user to start a new thread for testing. That is the safe boundary for
-picking up the updated plugin and its MCP tools.
diff --git a/skills/plugin-creator/references/plugin-json-spec.md b/skills/plugin-creator/references/plugin-json-spec.md
deleted file mode 100644
index 5eb2251..0000000
--- a/skills/plugin-creator/references/plugin-json-spec.md
+++ /dev/null
@@ -1,194 +0,0 @@
-# Plugin JSON sample spec
-
-```json
-{
-  "name": "plugin-name",
-  "version": "1.2.0",
-  "description": "Brief plugin description",
-  "author": {
-    "name": "Author Name",
-    "email": "author@example.com",
-    "url": "https://github.com/author"
-  },
-  "homepage": "https://docs.example.com/plugin",
-  "repository": "https://github.com/author/plugin",
-  "license": "MIT",
-  "keywords": ["keyword1", "keyword2"],
-  "skills": "./skills/",
-  "hooks": "./hooks.json",
-  "mcpServers": "./.mcp.json",
-  "apps": "./.app.json",
-  "interface": {
-    "displayName": "Plugin Display Name",
-    "shortDescription": "Short description for subtitle",
-    "longDescription": "Long description for details page",
-    "developerName": "OpenAI",
-    "category": "Productivity",
-    "capabilities": ["Interactive", "Write"],
-    "websiteURL": "https://openai.com/",
-    "privacyPolicyURL": "https://openai.com/policies/row-privacy-policy/",
-    "termsOfServiceURL": "https://openai.com/policies/row-terms-of-use/",
-    "defaultPrompt": [
-      "Summarize my inbox and draft replies for me.",
-      "Find open bugs and turn them into Linear tickets.",
-      "Review today's meetings and flag scheduling gaps."
-    ],
-    "brandColor": "#3B82F6",
-    "composerIcon": "./assets/icon.png",
-    "logo": "./assets/logo.png",
-    "screenshots": [
-      "./assets/screenshot1.png",
-      "./assets/screenshot2.png",
-      "./assets/screenshot3.png"
-    ]
-  }
-}
-```
-
-## Field guide
-
-### Top-level fields
-
-- `name` (`string`): Plugin identifier (kebab-case, no spaces). Required if `plugin.json` is provided and used as manifest name and component namespace.
-- `version` (`string`): Plugin semantic version.
-- `description` (`string`): Short purpose summary.
-- `author` (`object`): Publisher identity.
-  - `name` (`string`): Author or team name.
-  - `email` (`string`): Contact email.
-  - `url` (`string`): Author/team homepage or profile URL.
-- `homepage` (`string`): Documentation URL for plugin usage.
-- `repository` (`string`): Source code URL.
-- `license` (`string`): License identifier (for example `MIT`, `Apache-2.0`).
-- `keywords` (`array` of `string`): Search/discovery tags.
-- `skills` (`string`): Relative path to skill directories/files.
-- `hooks` (`string`): Hook config path.
-- `mcpServers` (`string`): MCP config path.
-- `apps` (`string`): App manifest path for plugin integrations.
-- `interface` (`object`): Interface/UX metadata block for plugin presentation.
-
-### `interface` fields
-
-- `displayName` (`string`): User-facing title shown for the plugin.
-- `shortDescription` (`string`): Brief subtitle used in compact views.
-- `longDescription` (`string`): Longer description used on details screens.
-- `developerName` (`string`): Human-readable publisher name.
-- `category` (`string`): Plugin category bucket.
-- `capabilities` (`array` of `string`): Capability list from implementation.
-- `websiteURL` (`string`): Public website for the plugin.
-- `privacyPolicyURL` (`string`): Privacy policy URL.
-- `termsOfServiceURL` (`string`): Terms of service URL.
-- `defaultPrompt` (`array` of `string`): Starter prompts shown in composer/UX context.
-  - Include at most 3 strings. Entries after the first 3 are ignored and will not be included.
-  - Each string is capped at 128 characters. Longer entries are truncated.
-  - Prefer short starter prompts around 50 characters so they scan well in the UI.
-- `brandColor` (`string`): Theme color for the plugin card.
-- `composerIcon` (`string`): Path to icon asset.
-- `logo` (`string`): Path to logo asset.
-- `screenshots` (`array` of `string`): List of screenshot asset paths.
-  - Screenshot entries must be PNG filenames and stored under `./assets/`.
-  - Keep file paths relative to plugin root.
-
-### Path conventions and defaults
-
-- Path values should be relative and begin with `./`.
-- `skills`, `hooks`, and `mcpServers` are supplemented on top of default component discovery; they do not replace defaults.
-- Custom path values must follow the plugin root convention and naming/namespacing rules.
-- This repo’s scaffold writes `.codex-plugin/plugin.json`; treat that as the manifest location this skill generates.
-
-# Marketplace JSON sample spec
-
-`marketplace.json` depends on where the plugin should live. New plugin creation defaults to the
-personal marketplace unless the caller explicitly requests a repo-local destination:
-
-- Personal plugin: `~/.agents/plugins/marketplace.json`
-- Repo/team plugin: `<repo-root>/.agents/plugins/marketplace.json`
-
-```json
-{
-  "name": "openai-curated",
-  "interface": {
-    "displayName": "ChatGPT Official"
-  },
-  "plugins": [
-    {
-      "name": "linear",
-      "source": {
-        "source": "local",
-        "path": "./plugins/linear"
-      },
-      "policy": {
-        "installation": "AVAILABLE",
-        "authentication": "ON_INSTALL"
-      },
-      "category": "Productivity"
-    }
-  ]
-}
-```
-
-## Marketplace field guide
-
-### Top-level fields
-
-- `name` (`string`): Marketplace identifier or catalog name.
-- `interface` (`object`, optional): Marketplace presentation metadata.
-- `plugins` (`array`): Ordered plugin entries. This order determines how Codex renders plugins.
-
-### `interface` fields
-
-- `displayName` (`string`, optional): User-facing marketplace title.
-
-### Plugin entry fields
-
-- `name` (`string`): Plugin identifier. Match the plugin folder name and `plugin.json` `name`.
-- `source` (`object`): Plugin source descriptor.
-  - `source` (`string`): Use `local` for this repo workflow.
-  - `path` (`string`): Relative plugin path based on the marketplace root.
-    - Personal plugin in `~/.agents/plugins/marketplace.json`: `./plugins/<plugin-name>`
-    - Repo/team plugin: `./plugins/<plugin-name>`
-  - The same relative path convention is used for both personal and repo/team marketplaces.
-    - Example: with `~/.agents/plugins/marketplace.json`, `./plugins/<plugin-name>` resolves to
-      `~/plugins/<plugin-name>`.
-- `policy` (`object`): Marketplace policy block. Always include it.
-  - `installation` (`string`): Availability policy.
-    - Allowed values: `NOT_AVAILABLE`, `AVAILABLE`, `INSTALLED_BY_DEFAULT`
-    - Default for new entries: `AVAILABLE`
-  - `authentication` (`string`): Authentication timing policy.
-    - Allowed values: `ON_INSTALL`, `ON_USE`
-    - Default for new entries: `ON_INSTALL`
-  - `products` (`array` of `string`, optional): Product override for this plugin entry. Omit it unless product gating is explicitly requested.
-- `category` (`string`): Display category bucket. Always include it.
-
-### Marketplace generation rules
-
-- `displayName` belongs under the top-level `interface` object, not individual plugin entries.
-- When creating a new marketplace file from scratch, seed `interface.displayName` alongside top-level `name`.
-- Always include `policy.installation`, `policy.authentication`, and `category` on every generated or updated plugin entry.
-- Treat `policy.products` as an override and omit it unless explicitly requested.
-- Append new entries unless the user explicitly requests reordering.
-- Replace an existing entry for the same plugin only when overwrite is intentional.
-- Default new plugin creation to the personal marketplace.
-- Use a repo/team marketplace only when the user specifically requests that destination.
-- Only override the marketplace `name` when the default `personal` name is already taken or
-  installed and you need to seed a different new marketplace file.
-- Choose marketplace location to match the selected destination:
-  - Personal plugin: `~/.agents/plugins/marketplace.json`
-  - Repo/team plugin: `<repo-root>/.agents/plugins/marketplace.json`
-
-### Plugin validation notes
-
-- The validator mirrors the workspace plugin ingestion schema so generated plugins follow the same
-  manifest contract from the start.
-- Plugin manifests must include real values for `name`, `version`, `description`,
-  `author.name`, and the required `interface` fields.
-- `version` must use strict semver.
-- `websiteURL`, `privacyPolicyURL`, and `termsOfServiceURL` must be absolute `https://` URLs when
-  present.
-- `composerIcon`, `logo`, and `screenshots` must point to real files inside the plugin archive when
-  present.
-- `apps` and `mcpServers` should appear in `plugin.json` only when `.app.json` and `.mcp.json`
-  actually exist.
-- Validation rejects unsupported manifest fields such as `hooks`, so the scaffold keeps them out of
-  generated manifests.
-- Run `scripts/validate_plugin.py <plugin-path>` before handing back a generated plugin. It adds one
-  intentional preflight check that rejects leftover `[TODO: ...]` placeholders.
diff --git a/skills/plugin-creator/scripts/create_basic_plugin.py b/skills/plugin-creator/scripts/create_basic_plugin.py
deleted file mode 100644
index 78b9fca..0000000
--- a/skills/plugin-creator/scripts/create_basic_plugin.py
+++ /dev/null
@@ -1,324 +0,0 @@
-#!/usr/bin/env python3
-"""Scaffold a plugin directory and optionally update marketplace.json."""
-
-from __future__ import annotations
-
-import argparse
-import json
-import re
-from pathlib import Path
-from typing import Any
-
-
-MAX_PLUGIN_NAME_LENGTH = 64
-DEFAULT_INSTALL_POLICY = "AVAILABLE"
-DEFAULT_AUTH_POLICY = "ON_INSTALL"
-DEFAULT_CATEGORY = "Productivity"
-DEFAULT_MARKETPLACE_NAME = "personal"
-VALID_INSTALL_POLICIES = {"NOT_AVAILABLE", "AVAILABLE", "INSTALLED_BY_DEFAULT"}
-VALID_AUTH_POLICIES = {"ON_INSTALL", "ON_USE"}
-DEFAULT_PLUGIN_PARENT = Path.home() / "plugins"
-DEFAULT_MARKETPLACE_PATH = Path.home() / ".agents" / "plugins" / "marketplace.json"
-
-
-def normalize_plugin_name(plugin_name: str) -> str:
-    """Normalize a plugin name to lowercase hyphen-case."""
-    normalized = plugin_name.strip().lower()
-    normalized = re.sub(r"[^a-z0-9]+", "-", normalized)
-    normalized = normalized.strip("-")
-    normalized = re.sub(r"-{2,}", "-", normalized)
-    return normalized
-
-
-def validate_plugin_name(plugin_name: str) -> None:
-    if not plugin_name:
-        raise ValueError("Plugin name must include at least one letter or digit.")
-    if len(plugin_name) > MAX_PLUGIN_NAME_LENGTH:
-        raise ValueError(
-            f"Plugin name '{plugin_name}' is too long ({len(plugin_name)} characters). "
-            f"Maximum is {MAX_PLUGIN_NAME_LENGTH} characters."
-        )
-
-
-def validate_marketplace_name(marketplace_name: str) -> None:
-    if not marketplace_name:
-        raise ValueError("Marketplace name must include at least one letter or digit.")
-    if re.fullmatch(r"[A-Za-z0-9_-]+", marketplace_name) is None:
-        raise ValueError(
-            "Marketplace name may only contain ASCII letters, digits, `_`, and `-`."
-        )
-
-
-def display_name_from_plugin_name(plugin_name: str) -> str:
-    return " ".join(part.capitalize() for part in re.split(r"[-_]+", plugin_name))
-
-
-def build_plugin_json(plugin_name: str, *, with_mcp: bool, with_apps: bool) -> dict[str, Any]:
-    display_name = display_name_from_plugin_name(plugin_name)
-    payload: dict[str, Any] = {
-        "name": plugin_name,
-        "version": "0.1.0",
-        "description": f"{display_name} plugin",
-        "author": {
-            "name": "Local developer",
-        },
-        "skills": "./skills/",
-        "interface": {
-            "displayName": display_name,
-            "shortDescription": f"Use {display_name} in Codex.",
-            "longDescription": f"{display_name} adds a local Codex plugin scaffold.",
-            "developerName": "Local developer",
-            "category": DEFAULT_CATEGORY,
-            "capabilities": [],
-            "defaultPrompt": f"Help me use {display_name}.",
-        },
-    }
-    if with_mcp:
-        payload["mcpServers"] = "./.mcp.json"
-    if with_apps:
-        payload["apps"] = "./.app.json"
-    return payload
-
-
-def build_marketplace_entry(
-    plugin_name: str,
-    install_policy: str,
-    auth_policy: str,
-    category: str,
-) -> dict[str, Any]:
-    return {
-        "name": plugin_name,
-        "source": {
-            "source": "local",
-            "path": f"./plugins/{plugin_name}",
-        },
-        "policy": {
-            "installation": install_policy,
-            "authentication": auth_policy,
-        },
-        "category": category,
-    }
-
-
-def load_json(path: Path) -> dict[str, Any]:
-    with path.open() as handle:
-        return json.load(handle)
-
-
-def build_default_marketplace(marketplace_name: str) -> dict[str, Any]:
-    return {
-        "name": marketplace_name,
-        "interface": {
-            "displayName": display_name_from_plugin_name(marketplace_name),
-        },
-        "plugins": [],
-    }
-
-
-def validate_marketplace_interface(payload: dict[str, Any]) -> None:
-    interface = payload.get("interface")
-    if interface is not None and not isinstance(interface, dict):
-        raise ValueError("marketplace.json field 'interface' must be an object.")
-
-
-def update_marketplace_json(
-    marketplace_path: Path,
-    marketplace_name: str | None,
-    plugin_name: str,
-    install_policy: str,
-    auth_policy: str,
-    category: str,
-    force: bool,
-) -> None:
-    if marketplace_path.exists():
-        payload = load_json(marketplace_path)
-    else:
-        payload = build_default_marketplace(marketplace_name or DEFAULT_MARKETPLACE_NAME)
-
-    if not isinstance(payload, dict):
-        raise ValueError(f"{marketplace_path} must contain a JSON object.")
-
-    validate_marketplace_interface(payload)
-
-    existing_marketplace_name = payload.get("name")
-    if marketplace_name is not None:
-        if not isinstance(existing_marketplace_name, str) or not existing_marketplace_name.strip():
-            raise ValueError(f"{marketplace_path} must contain a non-empty string 'name'.")
-        if existing_marketplace_name != marketplace_name:
-            raise ValueError(
-                f"{marketplace_path} already uses marketplace name "
-                f"'{existing_marketplace_name}'. Create a new marketplace file to use "
-                f"'{marketplace_name}' instead."
-            )
-
-    plugins = payload.setdefault("plugins", [])
-    if not isinstance(plugins, list):
-        raise ValueError(f"{marketplace_path} field 'plugins' must be an array.")
-
-    new_entry = build_marketplace_entry(plugin_name, install_policy, auth_policy, category)
-
-    for index, entry in enumerate(plugins):
-        if isinstance(entry, dict) and entry.get("name") == plugin_name:
-            if not force:
-                raise FileExistsError(
-                    f"Marketplace entry '{plugin_name}' already exists in {marketplace_path}. "
-                    "Use --force to overwrite that entry."
-                )
-            plugins[index] = new_entry
-            break
-    else:
-        plugins.append(new_entry)
-
-    write_json(marketplace_path, payload, force=True)
-
-
-def write_json(path: Path, data: dict, force: bool) -> None:
-    if path.exists() and not force:
-        raise FileExistsError(f"{path} already exists. Use --force to overwrite.")
-    path.parent.mkdir(parents=True, exist_ok=True)
-    with path.open("w") as handle:
-        json.dump(data, handle, indent=2)
-        handle.write("\n")
-
-
-def create_stub_file(path: Path, payload: dict, force: bool) -> None:
-    if path.exists() and not force:
-        return
-    path.parent.mkdir(parents=True, exist_ok=True)
-    with path.open("w") as handle:
-        json.dump(payload, handle, indent=2)
-        handle.write("\n")
-
-
-def parse_args() -> argparse.Namespace:
-    parser = argparse.ArgumentParser(
-        description="Create a plugin skeleton with a validation-ready plugin.json."
-    )
-    parser.add_argument("plugin_name")
-    parser.add_argument(
-        "--path",
-        default=str(DEFAULT_PLUGIN_PARENT),
-        help=(
-            "Parent directory for plugin creation (defaults to <home>/plugins). "
-            "Pass an explicit repo path only when a repo/team plugin is intended."
-        ),
-    )
-    parser.add_argument("--with-skills", action="store_true", help="Create skills/ directory")
-    parser.add_argument("--with-hooks", action="store_true", help="Create hooks/ directory")
-    parser.add_argument("--with-scripts", action="store_true", help="Create scripts/ directory")
-    parser.add_argument("--with-assets", action="store_true", help="Create assets/ directory")
-    parser.add_argument("--with-mcp", action="store_true", help="Create .mcp.json placeholder")
-    parser.add_argument("--with-apps", action="store_true", help="Create .app.json placeholder")
-    parser.add_argument(
-        "--with-marketplace",
-        action="store_true",
-        help=(
-            "Create or update <home>/.agents/plugins/marketplace.json by default. "
-            "Marketplace entries always point to ./plugins/<plugin-name> relative to the "
-            "marketplace root."
-        ),
-    )
-    parser.add_argument(
-        "--marketplace-path",
-        default=str(DEFAULT_MARKETPLACE_PATH),
-        help=(
-            "Path to marketplace.json (defaults to <home>/.agents/plugins/marketplace.json). "
-            "Pass a repo-rooted marketplace path only when a repo/team plugin is intended."
-        ),
-    )
-    parser.add_argument(
-        "--marketplace-name",
-        help=(
-            "Marketplace name to seed into a new marketplace.json. Use this only when the default "
-            "'personal' marketplace name is already taken and you need a different new marketplace."
-        ),
-    )
-    parser.add_argument(
-        "--install-policy",
-        default=DEFAULT_INSTALL_POLICY,
-        choices=sorted(VALID_INSTALL_POLICIES),
-        help="Marketplace policy.installation value",
-    )
-    parser.add_argument(
-        "--auth-policy",
-        default=DEFAULT_AUTH_POLICY,
-        choices=sorted(VALID_AUTH_POLICIES),
-        help="Marketplace policy.authentication value",
-    )
-    parser.add_argument(
-        "--category",
-        default=DEFAULT_CATEGORY,
-        help="Marketplace category value",
-    )
-    parser.add_argument("--force", action="store_true", help="Overwrite existing files")
-    return parser.parse_args()
-
-
-def main() -> None:
-    args = parse_args()
-    raw_plugin_name = args.plugin_name
-    plugin_name = normalize_plugin_name(raw_plugin_name)
-    if plugin_name != raw_plugin_name:
-        print(f"Note: Normalized plugin name from '{raw_plugin_name}' to '{plugin_name}'.")
-    validate_plugin_name(plugin_name)
-    marketplace_name = None
-    if args.marketplace_name is not None:
-        marketplace_name = args.marketplace_name.strip()
-        validate_marketplace_name(marketplace_name)
-
-    plugin_root = (Path(args.path).expanduser().resolve() / plugin_name)
-    plugin_root.mkdir(parents=True, exist_ok=True)
-
-    plugin_json_path = plugin_root / ".codex-plugin" / "plugin.json"
-    write_json(
-        plugin_json_path,
-        build_plugin_json(plugin_name, with_mcp=args.with_mcp, with_apps=args.with_apps),
-        args.force,
-    )
-
-    optional_directories = {
-        "skills": args.with_skills,
-        "hooks": args.with_hooks,
-        "scripts": args.with_scripts,
-        "assets": args.with_assets,
-    }
-    for folder, enabled in optional_directories.items():
-        if enabled:
-            (plugin_root / folder).mkdir(parents=True, exist_ok=True)
-
-    if args.with_mcp:
-        create_stub_file(
-            plugin_root / ".mcp.json",
-            {"mcpServers": {}},
-            args.force,
-        )
-
-    if args.with_apps:
-        create_stub_file(
-            plugin_root / ".app.json",
-            {
-                "apps": {},
-            },
-            args.force,
-        )
-
-    if args.with_marketplace:
-        marketplace_path = Path(args.marketplace_path).expanduser().resolve()
-        update_marketplace_json(
-            marketplace_path,
-            marketplace_name,
-            plugin_name,
-            args.install_policy,
-            args.auth_policy,
-            args.category,
-            args.force,
-        )
-
-    print(f"Created plugin scaffold: {plugin_root}")
-    print(f"plugin manifest: {plugin_json_path}")
-    if args.with_marketplace:
-        print(f"marketplace manifest: {marketplace_path}")
-
-
-if __name__ == "__main__":
-    main()
diff --git a/skills/plugin-creator/scripts/read_marketplace_name.py b/skills/plugin-creator/scripts/read_marketplace_name.py
deleted file mode 100644
index 597e9f7..0000000
--- a/skills/plugin-creator/scripts/read_marketplace_name.py
+++ /dev/null
@@ -1,48 +0,0 @@
-#!/usr/bin/env python3
-"""Print the top-level marketplace name from any marketplace.json file."""
-
-from __future__ import annotations
-
-import argparse
-import json
-import sys
-from pathlib import Path
-
-
-def default_marketplace_path() -> Path:
-    return Path.home() / ".agents" / "plugins" / "marketplace.json"
-
-
-def parse_args() -> argparse.Namespace:
-    parser = argparse.ArgumentParser(
-        description=(
-            "Print the top-level marketplace name from marketplace.json. Defaults to the personal "
-            "marketplace path under the current home directory."
-        )
-    )
-    parser.add_argument(
-        "--marketplace-path",
-        default=str(default_marketplace_path()),
-        help="Path to marketplace.json",
-    )
-    return parser.parse_args()
-
-
-def main() -> None:
-    args = parse_args()
-    marketplace_path = Path(args.marketplace_path).expanduser().resolve()
-    payload = json.loads(marketplace_path.read_text(encoding="utf-8"))
-    if not isinstance(payload, dict):
-        raise ValueError(f"{marketplace_path} must contain a JSON object.")
-    name = payload.get("name")
-    if not isinstance(name, str) or not name.strip():
-        raise ValueError(f"{marketplace_path} must contain a non-empty string 'name'.")
-    print(name.strip())
-
-
-if __name__ == "__main__":
-    try:
-        main()
-    except Exception as err:  # noqa: BLE001 - CLI should surface a single clear message.
-        print(str(err), file=sys.stderr)
-        raise SystemExit(1) from err
diff --git a/skills/plugin-creator/scripts/update_plugin_cachebuster.py b/skills/plugin-creator/scripts/update_plugin_cachebuster.py
deleted file mode 100644
index 82d19e5..0000000
--- a/skills/plugin-creator/scripts/update_plugin_cachebuster.py
+++ /dev/null
@@ -1,78 +0,0 @@
-#!/usr/bin/env python3
-"""Rewrite a local plugin version to a single Codex cachebuster suffix."""
-
-from __future__ import annotations
-
-import argparse
-import json
-import re
-import sys
-from datetime import datetime, timezone
-from pathlib import Path
-
-
-CACHEBUSTER_PREFIX = "codex"
-
-
-def parse_args() -> argparse.Namespace:
-    parser = argparse.ArgumentParser(
-        description=(
-            "Rewrite a local plugin's version so it preserves everything before '+' and uses "
-            "a single +codex.<cachebuster> suffix."
-        )
-    )
-    parser.add_argument("plugin_path", help="Path to the plugin root directory")
-    parser.add_argument(
-        "--cachebuster",
-        help="Optional cachebuster token to embed in the plugin version",
-    )
-    return parser.parse_args()
-
-
-def main() -> None:
-    args = parse_args()
-    plugin_root = Path(args.plugin_path).expanduser().resolve()
-    manifest_path = plugin_root / ".codex-plugin" / "plugin.json"
-    manifest = load_manifest(manifest_path)
-
-    version = manifest.get("version")
-    if not isinstance(version, str) or not version.strip():
-        raise ValueError(f"{manifest_path} must contain a non-empty string 'version'.")
-    cachebuster = sanitize_cachebuster(args.cachebuster or default_cachebuster())
-    next_version = with_cachebuster(version, cachebuster)
-    manifest["version"] = next_version
-    manifest_path.write_text(json.dumps(manifest, indent=2) + "\n", encoding="utf-8")
-
-    print(f"Updated plugin version: {version} -> {next_version}")
-
-
-def load_manifest(manifest_path: Path) -> dict[str, object]:
-    if not manifest_path.is_file():
-        raise FileNotFoundError(f"missing manifest: {manifest_path}")
-    payload = json.loads(manifest_path.read_text(encoding="utf-8"))
-    if not isinstance(payload, dict):
-        raise ValueError(f"{manifest_path} must contain a JSON object.")
-    return payload
-def sanitize_cachebuster(value: str) -> str:
-    sanitized = re.sub(r"[^a-z0-9-]+", "-", value.strip().lower())
-    sanitized = re.sub(r"-{2,}", "-", sanitized).strip("-")
-    if not sanitized:
-        raise ValueError("Cachebuster must contain at least one letter or digit.")
-    return sanitized
-
-
-def default_cachebuster() -> str:
-    return datetime.now(timezone.utc).strftime("%Y%m%d%H%M%S")
-
-
-def with_cachebuster(version: str, cachebuster: str) -> str:
-    version_prefix = version.split("+", 1)[0]
-    return f"{version_prefix}+{CACHEBUSTER_PREFIX}.{cachebuster}"
-
-
-if __name__ == "__main__":
-    try:
-        main()
-    except Exception as err:  # noqa: BLE001 - CLI should surface a single clear message.
-        print(str(err), file=sys.stderr)
-        raise SystemExit(1) from err
diff --git a/skills/plugin-creator/scripts/validate_plugin.py b/skills/plugin-creator/scripts/validate_plugin.py
deleted file mode 100644
index 6f49cb0..0000000
--- a/skills/plugin-creator/scripts/validate_plugin.py
+++ /dev/null
@@ -1,593 +0,0 @@
-#!/usr/bin/env python3
-"""Validate a generated plugin against the plugin ingestion contract."""
-
-from __future__ import annotations
-
-import argparse
-import json
-import re
-from pathlib import Path, PurePosixPath
-from typing import Any
-from urllib.parse import urlparse
-
-import yaml
-
-
-TODO_MARKER = "[TODO:"
-SEMVER_RE = re.compile(
-    r"^(0|[1-9]\d*)\."
-    r"(0|[1-9]\d*)\."
-    r"(0|[1-9]\d*)"
-    r"(?:-(?:0|[1-9]\d*|\d*[A-Za-z-][0-9A-Za-z-]*)(?:\."
-    r"(?:0|[1-9]\d*|\d*[A-Za-z-][0-9A-Za-z-]*))*)?"
-    r"(?:\+[0-9A-Za-z-]+(?:\.[0-9A-Za-z-]+)*)?$"
-)
-HEX_COLOR_RE = re.compile(r"^#[0-9A-F]{6}$", re.IGNORECASE)
-
-
-def parse_args() -> argparse.Namespace:
-    parser = argparse.ArgumentParser(description="Validate a local Codex plugin.")
-    parser.add_argument("plugin_path", help="Path to the plugin root directory")
-    return parser.parse_args()
-
-
-def main() -> None:
-    args = parse_args()
-    plugin_root = Path(args.plugin_path).expanduser().resolve()
-    errors = validate_plugin(plugin_root)
-    if errors:
-        print("Plugin validation failed:")
-        for error in errors:
-            print(f"- {error}")
-        raise SystemExit(1)
-    print(f"Plugin validation passed: {plugin_root}")
-
-
-def validate_plugin(plugin_root: Path) -> list[str]:
-    errors: list[str] = []
-    manifest_path = plugin_root / ".codex-plugin" / "plugin.json"
-    manifest = load_json_object(manifest_path, errors)
-    if manifest is None:
-        return errors
-
-    reject_todo_markers(manifest, "$", errors)
-    validate_manifest_shape(plugin_root, manifest, errors)
-    return errors
-
-
-def load_json_object(path: Path, errors: list[str]) -> dict[str, Any] | None:
-    if not path.is_file():
-        errors.append("missing `.codex-plugin/plugin.json`")
-        return None
-    try:
-        payload = json.loads(path.read_text(encoding="utf-8"))
-    except OSError:
-        errors.append("unable to read `.codex-plugin/plugin.json`")
-        return None
-    except json.JSONDecodeError:
-        errors.append("`.codex-plugin/plugin.json` must be valid JSON")
-        return None
-    if not isinstance(payload, dict):
-        errors.append("`.codex-plugin/plugin.json` must contain a JSON object")
-        return None
-    return payload
-
-
-def reject_todo_markers(value: Any, path: str, errors: list[str]) -> None:
-    if isinstance(value, str):
-        if TODO_MARKER in value:
-            errors.append(f"{path} still contains a `[TODO: ...]` placeholder")
-        return
-    if isinstance(value, list):
-        for index, item in enumerate(value):
-            reject_todo_markers(item, f"{path}[{index}]", errors)
-        return
-    if isinstance(value, dict):
-        for key, item in value.items():
-            reject_todo_markers(item, f"{path}.{key}", errors)
-
-
-def validate_manifest_shape(
-    plugin_root: Path,
-    manifest: dict[str, Any],
-    errors: list[str],
-) -> None:
-    allowed_keys = {
-        "id",
-        "name",
-        "version",
-        "description",
-        "skills",
-        "apps",
-        "mcpServers",
-        "interface",
-        "author",
-        "homepage",
-        "repository",
-        "license",
-        "keywords",
-    }
-    for key in sorted(set(manifest) - allowed_keys):
-        errors.append(f"plugin.json field `{key}` is not accepted by plugin validation")
-
-    validate_optional_non_empty_string(manifest, "id", errors)
-    require_non_empty_string(manifest, "name", errors)
-    version = require_non_empty_string(manifest, "version", errors)
-    if version is not None and SEMVER_RE.fullmatch(version) is None:
-        errors.append("plugin.json field `version` must be strict semver")
-    require_non_empty_string(manifest, "description", errors)
-
-    author = require_object(manifest, "author", errors)
-    if author is not None:
-        reject_unknown_fields(author, {"name", "email", "url"}, "author", errors)
-        require_non_empty_string(author, "name", errors, prefix="author")
-        validate_optional_non_empty_string(author, "email", errors, prefix="author")
-        validate_optional_https_url(author, "url", errors, prefix="author")
-
-    validate_optional_contract_path(manifest, "skills", "skills", errors)
-    validate_optional_contract_path(manifest, "apps", ".app.json", errors)
-    validate_optional_contract_path(manifest, "mcpServers", ".mcp.json", errors)
-
-    if manifest.get("apps") is not None:
-        validate_app_manifest(
-            plugin_root / ".app.json",
-            errors,
-        )
-    if manifest.get("mcpServers") is not None:
-        validate_mcp_manifest(
-            plugin_root / ".mcp.json",
-            errors,
-        )
-    validate_skill_manifests(plugin_root, errors)
-
-    interface = require_object(manifest, "interface", errors)
-    if interface is None:
-        return
-    reject_unknown_fields(
-        interface,
-        {
-            "displayName",
-            "shortDescription",
-            "longDescription",
-            "developerName",
-            "category",
-            "capabilities",
-            "websiteURL",
-            "privacyPolicyURL",
-            "termsOfServiceURL",
-            "brandColor",
-            "composerIcon",
-            "logo",
-            "screenshots",
-            "defaultPrompt",
-            "default_prompt",
-        },
-        "interface",
-        errors,
-    )
-    for field in (
-        "displayName",
-        "shortDescription",
-        "longDescription",
-        "developerName",
-        "category",
-    ):
-        require_non_empty_string(interface, field, errors, prefix="interface")
-    if "defaultPrompt" not in interface and "default_prompt" not in interface:
-        errors.append(
-            "plugin.json field `interface.defaultPrompt` or `interface.default_prompt` is required"
-        )
-    capabilities = interface.get("capabilities")
-    if not isinstance(capabilities, list) or not all(
-        isinstance(value, str) and value.strip() for value in capabilities
-    ):
-        errors.append("plugin.json field `interface.capabilities` must be an array of strings")
-    for field in ("websiteURL", "privacyPolicyURL", "termsOfServiceURL"):
-        validate_optional_https_url(interface, field, errors, prefix="interface")
-    brand_color = interface.get("brandColor")
-    if brand_color is not None and (
-        not isinstance(brand_color, str) or HEX_COLOR_RE.fullmatch(brand_color) is None
-    ):
-        errors.append("plugin.json field `interface.brandColor` must use `#RRGGBB`")
-    for field in ("composerIcon", "logo"):
-        validate_optional_asset_path(plugin_root, plugin_root, interface, field, errors)
-    screenshots = interface.get("screenshots", [])
-    if not isinstance(screenshots, list):
-        errors.append("plugin.json field `interface.screenshots` must be an array")
-    else:
-        for index, raw_path in enumerate(screenshots):
-            validate_asset_path(
-                plugin_root,
-                plugin_root,
-                raw_path,
-                f"interface.screenshots[{index}]",
-                errors,
-            )
-
-
-def require_object(
-    payload: dict[str, Any],
-    key: str,
-    errors: list[str],
-) -> dict[str, Any] | None:
-    value = payload.get(key)
-    if not isinstance(value, dict):
-        errors.append(f"plugin.json field `{key}` must be an object")
-        return None
-    return value
-
-
-def require_non_empty_string(
-    payload: dict[str, Any],
-    key: str,
-    errors: list[str],
-    *,
-    prefix: str | None = None,
-) -> str | None:
-    value = payload.get(key)
-    field = f"{prefix}.{key}" if prefix is not None else key
-    if not isinstance(value, str) or not value.strip():
-        errors.append(f"plugin.json field `{field}` must be a non-empty string")
-        return None
-    return value
-
-
-def validate_optional_non_empty_string(
-    payload: dict[str, Any],
-    key: str,
-    errors: list[str],
-    *,
-    prefix: str | None = None,
-) -> None:
-    value = payload.get(key)
-    if value is None:
-        return
-    field = f"{prefix}.{key}" if prefix is not None else key
-    if not isinstance(value, str) or not value.strip():
-        errors.append(f"plugin.json field `{field}` must be a non-empty string")
-
-
-def reject_unknown_fields(
-    payload: dict[str, Any],
-    allowed_keys: set[str],
-    prefix: str,
-    errors: list[str],
-) -> None:
-    for key in sorted(set(payload) - allowed_keys):
-        errors.append(f"plugin.json field `{prefix}.{key}` is not accepted by plugin validation")
-
-
-def validate_optional_https_url(
-    payload: dict[str, Any],
-    key: str,
-    errors: list[str],
-    *,
-    prefix: str,
-) -> None:
-    value = payload.get(key)
-    if value is None:
-        return
-    parsed = urlparse(value) if isinstance(value, str) else None
-    if parsed is None or parsed.scheme != "https" or not parsed.netloc:
-        errors.append(f"plugin.json field `{prefix}.{key}` must be an absolute `https://` URL")
-
-
-def validate_optional_contract_path(
-    payload: dict[str, Any],
-    key: str,
-    expected: str,
-    errors: list[str],
-) -> None:
-    value = payload.get(key)
-    if value is None:
-        return
-    normalized = normalize_contract_path(value) if isinstance(value, str) else None
-    if normalized != expected:
-        errors.append(f"plugin.json field `{key}` must resolve to `{expected}`")
-
-
-def normalize_contract_path(raw_path: str) -> str | None:
-    path = Path(raw_path)
-    if path.is_absolute():
-        return None
-    normalized = path.as_posix().rstrip("/")
-    return normalized or None
-
-
-def validate_app_manifest(path: Path, errors: list[str]) -> None:
-    payload = load_companion_json_object(path, "`.app.json`", errors)
-    if payload is None:
-        return
-    reject_companion_unknown_fields(payload, {"apps"}, "`.app.json`", errors)
-    apps = payload.get("apps")
-    if not isinstance(apps, dict):
-        errors.append("`.app.json` field `apps` must be an object")
-        return
-    for key, value in apps.items():
-        if not isinstance(value, dict):
-            errors.append(f"`.app.json` app `{key}` must be an object")
-            continue
-        reject_companion_unknown_fields(
-            value, {"id", "category"}, f"`.app.json` app `{key}`", errors
-        )
-        app_id = value.get("id")
-        if not isinstance(app_id, str) or not app_id.strip():
-            errors.append(f"`.app.json` app `{key}` field `id` must be a non-empty string")
-        category = value.get("category")
-        if category is not None and (not isinstance(category, str) or not category.strip()):
-            errors.append(
-                f"`.app.json` app `{key}` field `category` must be a non-empty string"
-            )
-
-
-def validate_mcp_manifest(path: Path, errors: list[str]) -> None:
-    payload = load_companion_json_object(path, "`.mcp.json`", errors)
-    if payload is None:
-        return
-    reject_companion_unknown_fields(payload, {"mcpServers"}, "`.mcp.json`", errors)
-    servers = payload.get("mcpServers")
-    if not isinstance(servers, dict):
-        errors.append("`.mcp.json` field `mcpServers` must be an object")
-        return
-    for key, value in servers.items():
-        if not isinstance(key, str) or not key.strip():
-            errors.append("`.mcp.json` server names must be non-empty strings")
-        if not isinstance(value, dict):
-            errors.append(f"`.mcp.json` server `{key}` must be an object")
-
-
-def load_companion_json_object(
-    path: Path,
-    label: str,
-    errors: list[str],
-) -> dict[str, Any] | None:
-    if not path.is_file():
-        errors.append(f"{label} is required when its plugin.json field is present")
-        return None
-    try:
-        payload = json.loads(path.read_text(encoding="utf-8"))
-    except (OSError, json.JSONDecodeError):
-        errors.append(f"{label} must contain valid JSON")
-        return None
-    if not isinstance(payload, dict):
-        errors.append(f"{label} must contain a JSON object")
-        return None
-    return payload
-
-
-def reject_companion_unknown_fields(
-    payload: dict[str, Any],
-    allowed_keys: set[str],
-    prefix: str,
-    errors: list[str],
-) -> None:
-    for key in sorted(set(payload) - allowed_keys):
-        errors.append(f"{prefix} field `{key}` is not accepted by plugin validation")
-
-
-def validate_skill_manifests(plugin_root: Path, errors: list[str]) -> None:
-    skills_root = plugin_root / "skills"
-    if not skills_root.is_dir():
-        return
-    for skill_root in sorted(skills_root.iterdir(), key=lambda path: path.name):
-        if skill_root.name.startswith(".") or not skill_root.is_dir():
-            continue
-        validate_skill_manifest(skill_root, errors)
-
-
-def validate_skill_manifest(skill_root: Path, errors: list[str]) -> None:
-    skill_md_path = skill_root / "SKILL.md"
-    if not skill_md_path.is_file():
-        errors.append(f"skill `{skill_root.name}` is missing `SKILL.md`")
-        return
-    try:
-        contents = skill_md_path.read_text(encoding="utf-8")
-    except OSError:
-        errors.append(f"unable to read skill `{skill_root.name}`")
-        return
-    if not contents.startswith("---\n"):
-        errors.append(f"skill `{skill_root.name}` must start with YAML frontmatter")
-        return
-    frontmatter_end = contents.find("\n---", 4)
-    if frontmatter_end == -1:
-        errors.append(f"skill `{skill_root.name}` frontmatter is not closed")
-        return
-    try:
-        frontmatter = yaml.safe_load(contents[4:frontmatter_end])
-    except yaml.YAMLError:
-        errors.append(f"skill `{skill_root.name}` frontmatter must be valid YAML")
-        return
-    if not isinstance(frontmatter, dict):
-        errors.append(f"skill `{skill_root.name}` frontmatter must be an object")
-        return
-    skill_name = frontmatter.get("name")
-    if not isinstance(skill_name, str) or not skill_name.strip():
-        errors.append(f"skill `{skill_root.name}` frontmatter field `name` must be non-empty")
-    description = frontmatter.get("description")
-    if not isinstance(description, str) or not description.strip():
-        errors.append(
-            f"skill `{skill_root.name}` frontmatter field `description` must be non-empty"
-        )
-    disable_model_invocation = frontmatter.get("disable-model-invocation")
-    if disable_model_invocation is None:
-        disable_model_invocation = frontmatter.get("disable_model_invocation")
-    if disable_model_invocation not in (None, False):
-        errors.append(
-            f"skill `{skill_root.name}` frontmatter field `disable-model-invocation` must be false"
-        )
-    agent_yaml_path = skill_root / "agents" / "openai.yaml"
-    if agent_yaml_path.is_file():
-        validate_skill_agent_manifest(
-            plugin_root=skill_root.parent.parent,
-            skill_root=skill_root,
-            agent_yaml_path=agent_yaml_path,
-            errors=errors,
-        )
-
-
-def validate_skill_agent_manifest(
-    *,
-    plugin_root: Path,
-    skill_root: Path,
-    agent_yaml_path: Path,
-    errors: list[str],
-) -> None:
-    try:
-        payload = yaml.safe_load(agent_yaml_path.read_text(encoding="utf-8"))
-    except OSError:
-        errors.append(f"unable to read skill `{skill_root.name}` agent YAML")
-        return
-    except yaml.YAMLError:
-        errors.append(f"skill `{skill_root.name}` agent YAML must be valid YAML")
-        return
-    if not isinstance(payload, dict):
-        errors.append(f"skill `{skill_root.name}` agent YAML must be an object")
-        return
-
-    reject_skill_agent_unknown_fields(
-        payload,
-        {"interface", "policy", "dependencies"},
-        skill_root,
-        errors,
-    )
-    interface = payload.get("interface")
-    if not isinstance(interface, dict):
-        errors.append(f"skill `{skill_root.name}` agent field `interface` must be an object")
-        return
-    reject_skill_agent_unknown_fields(
-        interface,
-        {
-            "display_name",
-            "short_description",
-            "icon_small",
-            "icon_large",
-            "brand_color",
-            "default_prompt",
-        },
-        skill_root,
-        errors,
-        prefix="interface",
-    )
-    for field in ("display_name", "short_description"):
-        value = interface.get(field)
-        if not isinstance(value, str) or not value.strip():
-            errors.append(
-                f"skill `{skill_root.name}` agent field `interface.{field}` must be non-empty"
-            )
-    for field in ("icon_small", "icon_large"):
-        validate_optional_asset_path(
-            skill_root,
-            plugin_root,
-            interface,
-            field,
-            errors,
-            prefix=f"skill `{skill_root.name}` agent field `interface",
-        )
-    brand_color = interface.get("brand_color")
-    if brand_color is not None and (
-        not isinstance(brand_color, str) or HEX_COLOR_RE.fullmatch(brand_color) is None
-    ):
-        errors.append(
-            f"skill `{skill_root.name}` agent field `interface.brand_color` must use `#RRGGBB`"
-        )
-    default_prompt = interface.get("default_prompt")
-    if default_prompt is not None and (
-        not isinstance(default_prompt, str) or not default_prompt.strip()
-    ):
-        errors.append(
-            f"skill `{skill_root.name}` agent field `interface.default_prompt` must be non-empty"
-        )
-
-    policy = payload.get("policy")
-    if policy is not None:
-        if not isinstance(policy, dict):
-            errors.append(f"skill `{skill_root.name}` agent field `policy` must be an object")
-        else:
-            reject_skill_agent_unknown_fields(
-                policy,
-                {"allow_implicit_invocation"},
-                skill_root,
-                errors,
-                prefix="policy",
-            )
-            allow_implicit_invocation = policy.get("allow_implicit_invocation")
-            if allow_implicit_invocation is not None and not isinstance(
-                allow_implicit_invocation,
-                bool,
-            ):
-                errors.append(
-                    f"skill `{skill_root.name}` agent field "
-                    "`policy.allow_implicit_invocation` must be a boolean"
-                )
-
-    dependencies = payload.get("dependencies")
-    if dependencies is not None:
-        if not isinstance(dependencies, dict):
-            errors.append(
-                f"skill `{skill_root.name}` agent field `dependencies` must be an object"
-            )
-        else:
-            reject_skill_agent_unknown_fields(
-                dependencies,
-                {"tools"},
-                skill_root,
-                errors,
-                prefix="dependencies",
-            )
-
-
-def reject_skill_agent_unknown_fields(
-    payload: dict[str, Any],
-    allowed_keys: set[str],
-    skill_root: Path,
-    errors: list[str],
-    *,
-    prefix: str | None = None,
-) -> None:
-    for key in sorted(set(payload) - allowed_keys):
-        field = f"{prefix}.{key}" if prefix is not None else key
-        errors.append(
-            f"skill `{skill_root.name}` agent field `{field}` is not accepted by plugin validation"
-        )
-
-
-def validate_optional_asset_path(
-    base_dir: Path,
-    allowed_root: Path,
-    payload: dict[str, Any],
-    key: str,
-    errors: list[str],
-    *,
-    prefix: str = "interface",
-) -> None:
-    raw_path = payload.get(key)
-    if raw_path is None:
-        return
-    validate_asset_path(base_dir, allowed_root, raw_path, f"{prefix}.{key}", errors)
-
-
-def validate_asset_path(
-    base_dir: Path,
-    allowed_root: Path,
-    raw_path: Any,
-    field: str,
-    errors: list[str],
-) -> None:
-    label = field if field.startswith("skill `") else f"plugin.json field `{field}`"
-    if not isinstance(raw_path, str) or not raw_path.strip():
-        errors.append(f"{label} must be a non-empty relative path")
-        return
-    candidate = PurePosixPath(raw_path.replace("\\", "/"))
-    if candidate.is_absolute() or any(part in {"", ".", ".."} for part in candidate.parts):
-        errors.append(f"{label} must stay inside the plugin archive")
-        return
-    resolved_path = (base_dir / candidate.as_posix()).resolve()
-    if not resolved_path.is_relative_to(allowed_root.resolve()):
-        errors.append(f"{label} must stay inside the plugin archive")
-        return
-    if not resolved_path.is_file():
-        errors.append(f"{label} points to a missing file")
-
-
-if __name__ == "__main__":
-    main()
diff --git a/skills/prompt-0ca565e9-3d44-45f1-832d-caa438aceddb/SKILL.md b/skills/prompt-0ca565e9-3d44-45f1-832d-caa438aceddb/SKILL.md
deleted file mode 100644
index 859b6e9..0000000
--- a/skills/prompt-0ca565e9-3d44-45f1-832d-caa438aceddb/SKILL.md
+++ /dev/null
@@ -1,11 +0,0 @@
----
-name: "prompt-0ca565e9-3d44-45f1-832d-caa438aceddb"
-description: "文档编辑"
-metadata:
-  short-description: "文档编辑"
----
-
-# 文档编辑
-
-**规约：定义型修改先找单一权威，禁止外挂补丁。**
-当修改 prompt/schema/状态机/协议语义时，先定位“唯一权威定义区”，优先直接重写该定义；如果改动只是往附近追加说明、例外或补充规则，而没有收束原定义，默认视为错误方案。提交前必须自问：我是在降低信息熵，还是在制造第二套语义。
diff --git a/skills/prompt-0ca565e9-3d44-45f1-832d-caa438aceddb/agents/openai.yaml b/skills/prompt-0ca565e9-3d44-45f1-832d-caa438aceddb/agents/openai.yaml
deleted file mode 100644
index 80922d4..0000000
--- a/skills/prompt-0ca565e9-3d44-45f1-832d-caa438aceddb/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "文档编辑"
-  short_description: "文档编辑"
-  default_prompt: "Use $prompt-0ca565e9-3d44-45f1-832d-caa438aceddb."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971/SKILL.md b/skills/prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971/SKILL.md
deleted file mode 100644
index 3cf610f..0000000
--- a/skills/prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971"
-description: "始终批判自己"
-metadata:
-  short-description: "始终批判自己"
----
-
-# 始终批判自己
-
-始终批判自己，批判性思维，做了若干决策后，它们会综合作用产生效果，需要批判其中每一项，最终按优先级和最终预期收益看情况保留
diff --git a/skills/prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971/agents/openai.yaml b/skills/prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971/agents/openai.yaml
deleted file mode 100644
index 26b71cf..0000000
--- a/skills/prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "始终批判自己"
-  short_description: "始终批判自己"
-  default_prompt: "Use $prompt-1309ed22-5b5e-4774-9b85-41bb1b7cc971."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-1323c8c8-88a0-40d2-89df-14fc9533a122/SKILL.md b/skills/prompt-1323c8c8-88a0-40d2-89df-14fc9533a122/SKILL.md
deleted file mode 100644
index ef1315d..0000000
--- a/skills/prompt-1323c8c8-88a0-40d2-89df-14fc9533a122/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "prompt-1323c8c8-88a0-40d2-89df-14fc9533a122"
-description: "尽量减少确认项"
-metadata:
-  short-description: "尽量减少确认项"
----
-
-# 尽量减少确认项
-
-实现情况不要找用户确认，因为看代码就可以知道了，得自己看
diff --git a/skills/prompt-1323c8c8-88a0-40d2-89df-14fc9533a122/agents/openai.yaml b/skills/prompt-1323c8c8-88a0-40d2-89df-14fc9533a122/agents/openai.yaml
deleted file mode 100644
index 2010a57..0000000
--- a/skills/prompt-1323c8c8-88a0-40d2-89df-14fc9533a122/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "尽量减少确认项"
-  short_description: "尽量减少确认项"
-  default_prompt: "Use $prompt-1323c8c8-88a0-40d2-89df-14fc9533a122."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-144929a0-ae69-404b-9f58-a8696378e4e3/SKILL.md b/skills/prompt-144929a0-ae69-404b-9f58-a8696378e4e3/SKILL.md
deleted file mode 100644
index dc879e8..0000000
--- a/skills/prompt-144929a0-ae69-404b-9f58-a8696378e4e3/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "prompt-144929a0-ae69-404b-9f58-a8696378e4e3"
-description: "Patch 式改动审阅"
-metadata:
-  short-description: "Patch 式改动审阅"
----
-
-# Patch 式改动审阅
-
-对于代码改动，你需要在我最终同意"落盘 diff"前，仅能告知我改动位置以及代码 diff 详情，为我按 hunks 粒度解释其修改动机和服务对象，并在最终落盘时还要观察最新状态代码一致性
diff --git a/skills/prompt-144929a0-ae69-404b-9f58-a8696378e4e3/agents/openai.yaml b/skills/prompt-144929a0-ae69-404b-9f58-a8696378e4e3/agents/openai.yaml
deleted file mode 100644
index 2d610b2..0000000
--- a/skills/prompt-144929a0-ae69-404b-9f58-a8696378e4e3/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "Patch 式改动审阅"
-  short_description: "Patch 式改动审阅"
-  default_prompt: "Use $prompt-144929a0-ae69-404b-9f58-a8696378e4e3."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-15d9a907-a363-4ec7-81ad-806f9418ad72/SKILL.md b/skills/prompt-15d9a907-a363-4ec7-81ad-806f9418ad72/SKILL.md
deleted file mode 100644
index 3c935ad..0000000
--- a/skills/prompt-15d9a907-a363-4ec7-81ad-806f9418ad72/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "prompt-15d9a907-a363-4ec7-81ad-806f9418ad72"
-description: "pua严肃设计"
-metadata:
-  short-description: "pua严肃设计"
----
-
-# pua严肃设计
-
-请严肃设计，我们在设计一套精密仪器，跨时代产品
diff --git a/skills/prompt-15d9a907-a363-4ec7-81ad-806f9418ad72/agents/openai.yaml b/skills/prompt-15d9a907-a363-4ec7-81ad-806f9418ad72/agents/openai.yaml
deleted file mode 100644
index d6bc16b..0000000
--- a/skills/prompt-15d9a907-a363-4ec7-81ad-806f9418ad72/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "pua严肃设计"
-  short_description: "pua严肃设计"
-  default_prompt: "Use $prompt-15d9a907-a363-4ec7-81ad-806f9418ad72."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-193dd3cd-2722-413b-b88c-12c2af645f80/SKILL.md b/skills/prompt-193dd3cd-2722-413b-b88c-12c2af645f80/SKILL.md
deleted file mode 100644
index 6b7f96d..0000000
--- a/skills/prompt-193dd3cd-2722-413b-b88c-12c2af645f80/SKILL.md
+++ /dev/null
@@ -1,16 +0,0 @@
----
-name: "prompt-193dd3cd-2722-413b-b88c-12c2af645f80"
-description: "使用 agent-browser 排查运行时状态"
-metadata:
-  short-description: "使用 agent-browser 排查运行时状态"
----
-
-# 使用 agent-browser 排查运行时状态
-
-使用 agent-browser 排查运行时状态，
-# 业务指引
-请你 操作 agent-browser 打开 https://10.126.126.231:8111/ 然后通过侧栏进入 HY workspace， 打开 dever_for_dev 项目
-## 运行时 worknote 目录 
-- 我给予你 /opt/store_team_dev/zyc/dever_for_dev/attic/.agent-browser-runtime-workdir 这个工作目录 ，在每个 节点 把你 阶段性 的 操作截图 给我检查，截图 请 前缀 添加时间轴，格式为 <date>-<time>-<截图名称>.<图片文件格式>
-## 开发日常情况适应
-- 需要你去记忆这个情况: 我们在 不断迭代着 界面，所以有时候界面一下子 崩掉了是因为有其他组件在热更新，你要 适应这个情况，当你感觉 遇到了这个问题，你向我 确认 刚刚 是否 出现热更新，我往往 会 回答 "对,是的" 或者 "我不确定"，这种 情况 就希望 你不要被之前 状态误导，请你 重新 排查我们关注的 问题。
diff --git a/skills/prompt-193dd3cd-2722-413b-b88c-12c2af645f80/agents/openai.yaml b/skills/prompt-193dd3cd-2722-413b-b88c-12c2af645f80/agents/openai.yaml
deleted file mode 100644
index fa510bd..0000000
--- a/skills/prompt-193dd3cd-2722-413b-b88c-12c2af645f80/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "使用 agent-browser 排查运行时状态"
-  short_description: "使用 agent-browser 排查运行时状态"
-  default_prompt: "Use $prompt-193dd3cd-2722-413b-b88c-12c2af645f80."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7/SKILL.md b/skills/prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7/SKILL.md
deleted file mode 100644
index c380b4c..0000000
--- a/skills/prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7/SKILL.md
+++ /dev/null
@@ -1,27 +0,0 @@
----
-name: "prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7"
-description: "状态机正确性"
-metadata:
-  short-description: "状态机正确性"
----
-
-# 状态机正确性
-
-高度抽象规约（公式级）
-任何副作用（发请求/写缓存/写 store/patch UI）都必须是一个纯函数式映射：Effect = f(ActorIdentity, IntentId, TargetIdentity, Payload)
-禁止让 Effect 依赖任何隐式上下文：currentXxx/globalXxx/数组下标对齐/默认回退对象/闭包里过期的 selectedXxx；因为这些在“列表重排 + 异步回写 + 流式并发”下会漂移，导致“写对了 payload，但写错了容器”。
-落地要点（必须同时满足）
-ActorIdentity（我是谁/谁在做）：谁发起这次 effect（组件/Hook/Stream/Workspace），用于界定权限与并发域（如 workspaceId、agentKey/machineKey）。
-IntentId（我这次想做什么）：一次用户意图/事务的稳定编号（如 click/open 的 seq），用于丢弃过期回写。
-TargetIdentity（我对谁做）：被操作对象的最小不可歧义闭包（按场景至少包含：machineKey/agentId + projectId + bucket/filterKey + sessionId/cursor）。
-写入前校验：在真正 setQueryData/setState 前，二次校验 Actor/Intent/Target 仍匹配当前上下文；不匹配就丢弃/重取，不能“凑合写”。
-具体例子（对照）
-1) TanStack Query 列表/分页
-正确：queryKey 与返回数据都绑定 machineKey+projectId+bucket+filterKey(+cursor)；渲染/回写前校验这些字段一致。
-错误：useQueries 用 i * buckets + j 取结果，projects 列表一重排就把 A 项目的结果读成 B 项目的。
-2) SSE/Stream patch
-正确：patch 必须携带 agentId/machineKey + projectId + sessionId，并且只允许更新对应 identity 的 queryKey 容器。
-错误：只带 sessionId 就去更新“当前项目的 sessions 列表”（TargetIdentity 缺失）。
-3) UI 选择态（跨 await）
-正确：点击会话生成 intentSeq，await 返回后如果 intentSeq 已变化则不写入（IntentId 防过期回写）；并且写入的目标必须是同一个 agentId+projectId+sessionId。
-错误：await 回来直接 setSelectedSession(x)，同时依赖“当前 selectedProject”作为目标（隐式 current 指针）。
diff --git a/skills/prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7/agents/openai.yaml b/skills/prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7/agents/openai.yaml
deleted file mode 100644
index 2d1858c..0000000
--- a/skills/prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "状态机正确性"
-  short_description: "状态机正确性"
-  default_prompt: "Use $prompt-2793a3a4-310f-40c8-ba5d-bc7f5c1cafd7."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-2d53cebd-afd4-4d35-94e9-74436da3148a/SKILL.md b/skills/prompt-2d53cebd-afd4-4d35-94e9-74436da3148a/SKILL.md
deleted file mode 100644
index a8dad69..0000000
--- a/skills/prompt-2d53cebd-afd4-4d35-94e9-74436da3148a/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "prompt-2d53cebd-afd4-4d35-94e9-74436da3148a"
-description: "关注收束"
-metadata:
-  short-description: "关注收束"
----
-
-# 关注收束
-
-关注收束，如果当前实现可以复用一些东西，优先复用
diff --git a/skills/prompt-2d53cebd-afd4-4d35-94e9-74436da3148a/agents/openai.yaml b/skills/prompt-2d53cebd-afd4-4d35-94e9-74436da3148a/agents/openai.yaml
deleted file mode 100644
index e95a2ae..0000000
--- a/skills/prompt-2d53cebd-afd4-4d35-94e9-74436da3148a/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "关注收束"
-  short_description: "关注收束"
-  default_prompt: "Use $prompt-2d53cebd-afd4-4d35-94e9-74436da3148a."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-2eaed145-d789-4b27-93b9-8ea990830b3a/SKILL.md b/skills/prompt-2eaed145-d789-4b27-93b9-8ea990830b3a/SKILL.md
deleted file mode 100644
index d381fe9..0000000
--- a/skills/prompt-2eaed145-d789-4b27-93b9-8ea990830b3a/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "prompt-2eaed145-d789-4b27-93b9-8ea990830b3a"
-description: "提示词模板位置"
-metadata:
-  short-description: "提示词模板位置"
----
-
-# 提示词模板位置
-
-dever项目所有提示词模板都应该放在独立的ts源码文件中，这样分离的更清楚，更好做提示词版本管理
diff --git a/skills/prompt-2eaed145-d789-4b27-93b9-8ea990830b3a/agents/openai.yaml b/skills/prompt-2eaed145-d789-4b27-93b9-8ea990830b3a/agents/openai.yaml
deleted file mode 100644
index 15fea0c..0000000
--- a/skills/prompt-2eaed145-d789-4b27-93b9-8ea990830b3a/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "提示词模板位置"
-  short_description: "提示词模板位置"
-  default_prompt: "Use $prompt-2eaed145-d789-4b27-93b9-8ea990830b3a."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb/SKILL.md b/skills/prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb/SKILL.md
deleted file mode 100644
index b8f8bf8..0000000
--- a/skills/prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb"
-description: "长期主义"
-metadata:
-  short-description: "长期主义"
----
-
-# 长期主义
-
-长期主义，解决一个问题时，要往上递归思考根因，想一下能不能做让未来更复利的事情，宁愿早期breakchange，也不要长期埋雷，做简单的缝缝补补
diff --git a/skills/prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb/agents/openai.yaml b/skills/prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb/agents/openai.yaml
deleted file mode 100644
index 7237bab..0000000
--- a/skills/prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "长期主义"
-  short_description: "长期主义"
-  default_prompt: "Use $prompt-345530e6-2736-42c3-9d4e-da5f14b8b8cb."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca/SKILL.md b/skills/prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca/SKILL.md
deleted file mode 100644
index b9417ca..0000000
--- a/skills/prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca"
-description: "更改前需要用户 review"
-metadata:
-  short-description: "更改前需要用户 review"
----
-
-# 更改前需要用户 review
-
-要执行内容改动，需要先输出计划，待用户 review 并回复后执行
diff --git a/skills/prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca/agents/openai.yaml b/skills/prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca/agents/openai.yaml
deleted file mode 100644
index 10dda57..0000000
--- a/skills/prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "更改前需要用户 review"
-  short_description: "更改前需要用户 review"
-  default_prompt: "Use $prompt-566905c8-0ad8-4d7e-857a-1c38ac7e54ca."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8/SKILL.md b/skills/prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8/SKILL.md
deleted file mode 100644
index c699703..0000000
--- a/skills/prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8"
-description: "变更简洁重设计"
-metadata:
-  short-description: "变更简洁重设计"
----
-
-# 变更简洁重设计
-
-变更不要像修补丁一样增量修改，每次补一块，要考虑尽量的复用，必要时重新设计，来达到更简洁的结构，次要的才是说让变化比较少，我们宁愿breakchange，也不要留下丑陋冗余的代码结构
diff --git a/skills/prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8/agents/openai.yaml b/skills/prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8/agents/openai.yaml
deleted file mode 100644
index 291eaad..0000000
--- a/skills/prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "变更简洁重设计"
-  short_description: "变更简洁重设计"
-  default_prompt: "Use $prompt-5e80deb4-c278-4424-a0f4-a3df4f3443d8."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-615e1231-fe33-47f8-bf35-29fdf3766d98/SKILL.md b/skills/prompt-615e1231-fe33-47f8-bf35-29fdf3766d98/SKILL.md
deleted file mode 100644
index 63fbb03..0000000
--- a/skills/prompt-615e1231-fe33-47f8-bf35-29fdf3766d98/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "prompt-615e1231-fe33-47f8-bf35-29fdf3766d98"
-description: "悬浮菜单组件复用"
-metadata:
-  short-description: "悬浮菜单组件复用"
----
-
-# 悬浮菜单组件复用
-
-组件复用，悬浮菜单，我觉得是完全可以复用一个的，现在出现在 右键菜单，会话选择模型，等地方，其他的你也得找，得收束成一套原始组件，这样代码冗余就小很多；决策者请定位已有核心组件，并逐步把大家收束到一起
diff --git a/skills/prompt-615e1231-fe33-47f8-bf35-29fdf3766d98/agents/openai.yaml b/skills/prompt-615e1231-fe33-47f8-bf35-29fdf3766d98/agents/openai.yaml
deleted file mode 100644
index aea2244..0000000
--- a/skills/prompt-615e1231-fe33-47f8-bf35-29fdf3766d98/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "悬浮菜单组件复用"
-  short_description: "悬浮菜单组件复用"
-  default_prompt: "Use $prompt-615e1231-fe33-47f8-bf35-29fdf3766d98."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2/SKILL.md b/skills/prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2/SKILL.md
deleted file mode 100644
index 561a4f6..0000000
--- a/skills/prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2"
-description: "dever_canvas仅做参考"
-metadata:
-  short-description: "dever_canvas仅做参考"
----
-
-# dever_canvas仅做参考
-
-dever_canvas 那一套是给你参考的，不是拿来直接用的
diff --git a/skills/prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2/agents/openai.yaml b/skills/prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2/agents/openai.yaml
deleted file mode 100644
index 4b8c732..0000000
--- a/skills/prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "dever_canvas仅做参考"
-  short_description: "dever_canvas仅做参考"
-  default_prompt: "Use $prompt-7ae16163-92c9-4fde-a74f-7c61eddd62f2."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-8c5cc431-635c-4c94-9deb-a502e77160eb/SKILL.md b/skills/prompt-8c5cc431-635c-4c94-9deb-a502e77160eb/SKILL.md
deleted file mode 100644
index f2b1ec4..0000000
--- a/skills/prompt-8c5cc431-635c-4c94-9deb-a502e77160eb/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "prompt-8c5cc431-635c-4c94-9deb-a502e77160eb"
-description: "关注 dever_yew 开发"
-metadata:
-  short-description: "关注 dever_yew 开发"
----
-
-# 关注 dever_yew 开发
-
-目前 dever 项目 使用和开发的 UI 界面是由 dever_yew 提供的，原 react 实现 dever_ui 目前是历史工程，不要改动，仅做参考
diff --git a/skills/prompt-8c5cc431-635c-4c94-9deb-a502e77160eb/agents/openai.yaml b/skills/prompt-8c5cc431-635c-4c94-9deb-a502e77160eb/agents/openai.yaml
deleted file mode 100644
index 8d3b586..0000000
--- a/skills/prompt-8c5cc431-635c-4c94-9deb-a502e77160eb/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "关注 dever_yew 开发"
-  short_description: "关注 dever_yew 开发"
-  default_prompt: "Use $prompt-8c5cc431-635c-4c94-9deb-a502e77160eb."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c/SKILL.md b/skills/prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c/SKILL.md
deleted file mode 100644
index 6464ddb..0000000
--- a/skills/prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c"
-description: "对话信息对接参考 codex 源码"
-metadata:
-  short-description: "对话信息对接参考 codex 源码"
----
-
-# 对话信息对接参考 codex 源码
-
-对话信息对接参考 codex 源码，工程内 attic/codex 存放了 codex cli 的源码，对接 app-server 等 codex app-server 给予的能力对接参考该工程代码
diff --git a/skills/prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c/agents/openai.yaml b/skills/prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c/agents/openai.yaml
deleted file mode 100644
index a8ca1af..0000000
--- a/skills/prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "对话信息对接参考 codex 源码"
-  short_description: "对话信息对接参考 codex 源码"
-  default_prompt: "Use $prompt-a7fb4e43-d1eb-4739-93b3-646d7a1c072c."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-ac42abf9-6df8-4539-99c7-e402e905a03b/SKILL.md b/skills/prompt-ac42abf9-6df8-4539-99c7-e402e905a03b/SKILL.md
deleted file mode 100644
index 6f96d9c..0000000
--- a/skills/prompt-ac42abf9-6df8-4539-99c7-e402e905a03b/SKILL.md
+++ /dev/null
@@ -1,15 +0,0 @@
----
-name: "prompt-ac42abf9-6df8-4539-99c7-e402e905a03b"
-description: "逻辑收束到agent"
-metadata:
-  short-description: "逻辑收束到agent"
----
-
-# 逻辑收束到agent
-
-规约：Manager/Agent 边界（强制收束）
-
-前端只允许访问 manager：所有 API 必须走 /api/router/:agentId/...（local 也一样）。
-manager 只负责：请求转发（router）、agent registry、（未来）登录鉴权、（可选）静态资源托管；严禁在 manager 实现任何业务能力与持久化。
-大部分“后端能力 + 数据落盘”（projects/sessions/chat/fs/git/terminal/notifications/uiState/uiWorkspaces/uiDock/uiScroll 等）必须在 agent 内实现与持久化；manager 不得读写 .dever/agent_data.json 或任何业务数据文件。
-发现 manager 出现新增 /api/* 实现模块或 store/JSON 持久化代码，一律视为架构违规：要么迁到 agent，要么删除并改为转发。
diff --git a/skills/prompt-ac42abf9-6df8-4539-99c7-e402e905a03b/agents/openai.yaml b/skills/prompt-ac42abf9-6df8-4539-99c7-e402e905a03b/agents/openai.yaml
deleted file mode 100644
index 1d669e7..0000000
--- a/skills/prompt-ac42abf9-6df8-4539-99c7-e402e905a03b/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "逻辑收束到agent"
-  short_description: "逻辑收束到agent"
-  default_prompt: "Use $prompt-ac42abf9-6df8-4539-99c7-e402e905a03b."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315/SKILL.md b/skills/prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315/SKILL.md
deleted file mode 100644
index b0743b2..0000000
--- a/skills/prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315"
-description: "mvp"
-metadata:
-  short-description: "mvp"
----
-
-# mvp
-
-dever_doc/mvp/target.md  我移动到了这里，作为我们的工作目标，现在我们就开始工作，过程记录按照步骤记录在 mvp文件夹里就行，合理拆分成文件
diff --git a/skills/prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315/agents/openai.yaml b/skills/prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315/agents/openai.yaml
deleted file mode 100644
index 86a71f3..0000000
--- a/skills/prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "mvp"
-  short_description: "mvp"
-  default_prompt: "Use $prompt-ae9ff67b-09d8-4848-bbde-aac1fb6e1315."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/prompt-f118ab91-390b-48e2-a962-3abe4d54211e/SKILL.md b/skills/prompt-f118ab91-390b-48e2-a962-3abe4d54211e/SKILL.md
deleted file mode 100644
index 8901c6e..0000000
--- a/skills/prompt-f118ab91-390b-48e2-a962-3abe4d54211e/SKILL.md
+++ /dev/null
@@ -1,10 +0,0 @@
----
-name: "prompt-f118ab91-390b-48e2-a962-3abe4d54211e"
-description: "完美主义"
-metadata:
-  short-description: "完美主义"
----
-
-# 完美主义
-
-完成之前，核对下有没有问题，设计上有没有不完善，尽量一次性做到完美；完美不代表复杂，完美是刚好在简单和复杂之间达到平衡
diff --git a/skills/prompt-f118ab91-390b-48e2-a962-3abe4d54211e/agents/openai.yaml b/skills/prompt-f118ab91-390b-48e2-a962-3abe4d54211e/agents/openai.yaml
deleted file mode 100644
index 9600439..0000000
--- a/skills/prompt-f118ab91-390b-48e2-a962-3abe4d54211e/agents/openai.yaml
+++ /dev/null
@@ -1,6 +0,0 @@
-interface:
-  display_name: "完美主义"
-  short_description: "完美主义"
-  default_prompt: "Use $prompt-f118ab91-390b-48e2-a962-3abe4d54211e."
-policy:
-  allow_implicit_invocation: false
diff --git a/skills/rs-skill-smoke-09e1daf7/SKILL.md b/skills/rs-skill-smoke-09e1daf7/SKILL.md
deleted file mode 100644
index eb9b22f..0000000
--- a/skills/rs-skill-smoke-09e1daf7/SKILL.md
+++ /dev/null
@@ -1,8 +0,0 @@
----
-name: rs-skill-smoke-09e1daf7
-description: Used by project_contract_smoke.
----
-
-# RS Skill Smoke
-
-Used by project_contract_smoke.
diff --git a/skills/rs-skill-smoke-529efbc9/SKILL.md b/skills/rs-skill-smoke-529efbc9/SKILL.md
deleted file mode 100644
index 85c8a95..0000000
--- a/skills/rs-skill-smoke-529efbc9/SKILL.md
+++ /dev/null
@@ -1,8 +0,0 @@
----
-name: rs-skill-smoke-529efbc9
-description: Used by project_contract_smoke.
----
-
-# rs-skill-smoke-529efbc9
-
-Used by project_contract_smoke.
diff --git a/skills/rs-skill-smoke-cde1029f/SKILL.md b/skills/rs-skill-smoke-cde1029f/SKILL.md
deleted file mode 100644
index 4611722..0000000
--- a/skills/rs-skill-smoke-cde1029f/SKILL.md
+++ /dev/null
@@ -1,8 +0,0 @@
----
-name: rs-skill-smoke-cde1029f
-description: Used by project_contract_smoke.
----
-
-# RS Skill Smoke
-
-Used by project_contract_smoke.
diff --git a/skills/skill-creator/SKILL.md b/skills/skill-creator/SKILL.md
deleted file mode 100644
index 57f4e58..0000000
--- a/skills/skill-creator/SKILL.md
+++ /dev/null
@@ -1,416 +0,0 @@
----
-name: skill-creator
-description: Guide for creating effective skills. This skill should be used when users want to create a new skill (or update an existing skill) that extends Codex's capabilities with specialized knowledge, workflows, or tool integrations.
-metadata:
-  short-description: Create or update a skill
----
-
-# Skill Creator
-
-This skill provides guidance for creating effective skills.
-
-## About Skills
-
-Skills are modular, self-contained folders that extend Codex's capabilities by providing
-specialized knowledge, workflows, and tools. Think of them as "onboarding guides" for specific
-domains or tasks—they transform Codex from a general-purpose agent into a specialized agent
-equipped with procedural knowledge that no model can fully possess.
-
-### What Skills Provide
-
-1. Specialized workflows - Multi-step procedures for specific domains
-2. Tool integrations - Instructions for working with specific file formats or APIs
-3. Domain expertise - Company-specific knowledge, schemas, business logic
-4. Bundled resources - Scripts, references, and assets for complex and repetitive tasks
-
-## Core Principles
-
-### Concise is Key
-
-The context window is a public good. Skills share the context window with everything else Codex needs: system prompt, conversation history, other Skills' metadata, and the actual user request.
-
-**Default assumption: Codex is already very smart.** Only add context Codex doesn't already have. Challenge each piece of information: "Does Codex really need this explanation?" and "Does this paragraph justify its token cost?"
-
-Prefer concise examples over verbose explanations.
-
-### Set Appropriate Degrees of Freedom
-
-Match the level of specificity to the task's fragility and variability:
-
-**High freedom (text-based instructions)**: Use when multiple approaches are valid, decisions depend on context, or heuristics guide the approach.
-
-**Medium freedom (pseudocode or scripts with parameters)**: Use when a preferred pattern exists, some variation is acceptable, or configuration affects behavior.
-
-**Low freedom (specific scripts, few parameters)**: Use when operations are fragile and error-prone, consistency is critical, or a specific sequence must be followed.
-
-Think of Codex as exploring a path: a narrow bridge with cliffs needs specific guardrails (low freedom), while an open field allows many routes (high freedom).
-
-### Protect Validation Integrity
-
-You may use subagents during iteration to validate whether a skill works on realistic tasks or whether a suspected problem is real. This is most useful when you want an independent pass on the skill's behavior, outputs, or failure modes after a revision. Only do this when it is possible to start new subagents.
-
-When using subagents for validation, treat that as an evaluation surface. The goal is to learn whether the skill generalizes, not whether another agent can reconstruct the answer from leaked context.
-
-Prefer raw artifacts such as example prompts, outputs, diffs, logs, or traces. Give the minimum task-local context needed to perform the validation. Avoid passing the intended answer, suspected bug, intended fix, or your prior conclusions unless the validation explicitly requires them.
-
-### Anatomy of a Skill
-
-Every skill consists of a required SKILL.md file and optional bundled resources:
-
-```
-skill-name/
-├── SKILL.md (required)
-│   ├── YAML frontmatter metadata (required)
-│   │   ├── name: (required)
-│   │   └── description: (required)
-│   └── Markdown instructions (required)
-├── agents/ (recommended)
-│   └── openai.yaml - UI metadata for skill lists and chips
-└── Bundled Resources (optional)
-    ├── scripts/          - Executable code (Python/Bash/etc.)
-    ├── references/       - Documentation intended to be loaded into context as needed
-    └── assets/           - Files used in output (templates, icons, fonts, etc.)
-```
-
-#### SKILL.md (required)
-
-Every SKILL.md consists of:
-
-- **Frontmatter** (YAML): Contains `name` and `description` fields. These are the only fields that Codex reads to determine when the skill gets used, thus it is very important to be clear and comprehensive in describing what the skill is, and when it should be used.
-- **Body** (Markdown): Instructions and guidance for using the skill. Only loaded AFTER the skill triggers (if at all).
-
-#### Agents metadata (recommended)
-
-- UI-facing metadata for skill lists and chips
-- Read references/openai_yaml.md before generating values and follow its descriptions and constraints
-- Create: human-facing `display_name`, `short_description`, and `default_prompt` by reading the skill
-- Generate deterministically by passing the values as `--interface key=value` to `scripts/generate_openai_yaml.py` or `scripts/init_skill.py`
-- On updates: validate `agents/openai.yaml` still matches SKILL.md; regenerate if stale
-- Only include other optional interface fields (icons, brand color) if explicitly provided
-- See references/openai_yaml.md for field definitions and examples
-
-#### Bundled Resources (optional)
-
-##### Scripts (`scripts/`)
-
-Executable code (Python/Bash/etc.) for tasks that require deterministic reliability or are repeatedly rewritten.
-
-- **When to include**: When the same code is being rewritten repeatedly or deterministic reliability is needed
-- **Example**: `scripts/rotate_pdf.py` for PDF rotation tasks
-- **Benefits**: Token efficient, deterministic, may be executed without loading into context
-- **Note**: Scripts may still need to be read by Codex for patching or environment-specific adjustments
-
-##### References (`references/`)
-
-Documentation and reference material intended to be loaded as needed into context to inform Codex's process and thinking.
-
-- **When to include**: For documentation that Codex should reference while working
-- **Examples**: `references/finance.md` for financial schemas, `references/mnda.md` for company NDA template, `references/policies.md` for company policies, `references/api_docs.md` for API specifications
-- **Use cases**: Database schemas, API documentation, domain knowledge, company policies, detailed workflow guides
-- **Benefits**: Keeps SKILL.md lean, loaded only when Codex determines it's needed
-- **Best practice**: If files are large (>10k words), include grep search patterns in SKILL.md
-- **Avoid duplication**: Information should live in either SKILL.md or references files, not both. Prefer references files for detailed information unless it's truly core to the skill—this keeps SKILL.md lean while making information discoverable without hogging the context window. Keep only essential procedural instructions and workflow guidance in SKILL.md; move detailed reference material, schemas, and examples to references files.
-
-##### Assets (`assets/`)
-
-Files not intended to be loaded into context, but rather used within the output Codex produces.
-
-- **When to include**: When the skill needs files that will be used in the final output
-- **Examples**: `assets/logo.png` for brand assets, `assets/slides.pptx` for PowerPoint templates, `assets/frontend-template/` for HTML/React boilerplate, `assets/font.ttf` for typography
-- **Use cases**: Templates, images, icons, boilerplate code, fonts, sample documents that get copied or modified
-- **Benefits**: Separates output resources from documentation, enables Codex to use files without loading them into context
-
-#### What Not to Include in a Skill
-
-A skill should only contain essential files that directly support its functionality. Do NOT create extraneous documentation or auxiliary files, including:
-
-- README.md
-- INSTALLATION_GUIDE.md
-- QUICK_REFERENCE.md
-- CHANGELOG.md
-- etc.
-
-The skill should only contain the information needed for an AI agent to do the job at hand. It should not contain auxiliary context about the process that went into creating it, setup and testing procedures, user-facing documentation, etc. Creating additional documentation files just adds clutter and confusion.
-
-### Progressive Disclosure Design Principle
-
-Skills use a three-level loading system to manage context efficiently:
-
-1. **Metadata (name + description)** - Always in context (~100 words)
-2. **SKILL.md body** - When skill triggers (<5k words)
-3. **Bundled resources** - As needed by Codex (Unlimited because scripts can be executed without reading into context window)
-
-#### Progressive Disclosure Patterns
-
-Keep SKILL.md body to the essentials and under 500 lines to minimize context bloat. Split content into separate files when approaching this limit. When splitting out content into other files, it is very important to reference them from SKILL.md and describe clearly when to read them, to ensure the reader of the skill knows they exist and when to use them.
-
-**Key principle:** When a skill supports multiple variations, frameworks, or options, keep only the core workflow and selection guidance in SKILL.md. Move variant-specific details (patterns, examples, configuration) into separate reference files.
-
-**Pattern 1: High-level guide with references**
-
-```markdown
-# PDF Processing
-
-## Quick start
-
-Extract text with pdfplumber:
-[code example]
-
-## Advanced features
-
-- **Form filling**: See [FORMS.md](FORMS.md) for complete guide
-- **API reference**: See [REFERENCE.md](REFERENCE.md) for all methods
-- **Examples**: See [EXAMPLES.md](EXAMPLES.md) for common patterns
-```
-
-Codex loads FORMS.md, REFERENCE.md, or EXAMPLES.md only when needed.
-
-**Pattern 2: Domain-specific organization**
-
-For Skills with multiple domains, organize content by domain to avoid loading irrelevant context:
-
-```
-bigquery-skill/
-├── SKILL.md (overview and navigation)
-└── reference/
-    ├── finance.md (revenue, billing metrics)
-    ├── sales.md (opportunities, pipeline)
-    ├── product.md (API usage, features)
-    └── marketing.md (campaigns, attribution)
-```
-
-When a user asks about sales metrics, Codex only reads sales.md.
-
-Similarly, for skills supporting multiple frameworks or variants, organize by variant:
-
-```
-cloud-deploy/
-├── SKILL.md (workflow + provider selection)
-└── references/
-    ├── aws.md (AWS deployment patterns)
-    ├── gcp.md (GCP deployment patterns)
-    └── azure.md (Azure deployment patterns)
-```
-
-When the user chooses AWS, Codex only reads aws.md.
-
-**Pattern 3: Conditional details**
-
-Show basic content, link to advanced content:
-
-```markdown
-# DOCX Processing
-
-## Creating documents
-
-Use docx-js for new documents. See [DOCX-JS.md](DOCX-JS.md).
-
-## Editing documents
-
-For simple edits, modify the XML directly.
-
-**For tracked changes**: See [REDLINING.md](REDLINING.md)
-**For OOXML details**: See [OOXML.md](OOXML.md)
-```
-
-Codex reads REDLINING.md or OOXML.md only when the user needs those features.
-
-**Important guidelines:**
-
-- **Avoid deeply nested references** - Keep references one level deep from SKILL.md. All reference files should link directly from SKILL.md.
-- **Structure longer reference files** - For files longer than 100 lines, include a table of contents at the top so Codex can see the full scope when previewing.
-
-## Skill Creation Process
-
-Skill creation involves these steps:
-
-1. Understand the skill with concrete examples
-2. Plan reusable skill contents (scripts, references, assets)
-3. Initialize the skill (run init_skill.py)
-4. Edit the skill (implement resources and write SKILL.md)
-5. Validate the skill (run quick_validate.py)
-6. Iterate based on real usage and forward-test complex skills.
-
-Follow these steps in order, skipping only if there is a clear reason why they are not applicable.
-
-### Skill Naming
-
-- Use lowercase letters, digits, and hyphens only; normalize user-provided titles to hyphen-case (e.g., "Plan Mode" -> `plan-mode`).
-- When generating names, generate a name under 64 characters (letters, digits, hyphens).
-- Prefer short, verb-led phrases that describe the action.
-- Namespace by tool when it improves clarity or triggering (e.g., `gh-address-comments`, `linear-address-issue`).
-- Name the skill folder exactly after the skill name.
-
-### Step 1: Understanding the Skill with Concrete Examples
-
-Skip this step only when the skill's usage patterns are already clearly understood. It remains valuable even when working with an existing skill.
-
-To create an effective skill, clearly understand concrete examples of how the skill will be used. This understanding can come from either direct user examples or generated examples that are validated with user feedback.
-
-For example, when building an image-editor skill, relevant questions include:
-
-- "What functionality should the image-editor skill support? Editing, rotating, anything else?"
-- "Can you give some examples of how this skill would be used?"
-- "I can imagine users asking for things like 'Remove the red-eye from this image' or 'Rotate this image'. Are there other ways you imagine this skill being used?"
-- "What would a user say that should trigger this skill?"
-- "Where should I create this skill? If you do not have a preference, I will place it in `$CODEX_HOME/skills` (or `~/.codex/skills` when `CODEX_HOME` is unset) so Codex can discover it automatically."
-
-To avoid overwhelming users, avoid asking too many questions in a single message. Start with the most important questions and follow up as needed for better effectiveness.
-
-Conclude this step when there is a clear sense of the functionality the skill should support.
-
-### Step 2: Planning the Reusable Skill Contents
-
-To turn concrete examples into an effective skill, analyze each example by:
-
-1. Considering how to execute on the example from scratch
-2. Identifying what scripts, references, and assets would be helpful when executing these workflows repeatedly
-
-Example: When building a `pdf-editor` skill to handle queries like "Help me rotate this PDF," the analysis shows:
-
-1. Rotating a PDF requires re-writing the same code each time
-2. A `scripts/rotate_pdf.py` script would be helpful to store in the skill
-
-Example: When designing a `frontend-webapp-builder` skill for queries like "Build me a todo app" or "Build me a dashboard to track my steps," the analysis shows:
-
-1. Writing a frontend webapp requires the same boilerplate HTML/React each time
-2. An `assets/hello-world/` template containing the boilerplate HTML/React project files would be helpful to store in the skill
-
-Example: When building a `big-query` skill to handle queries like "How many users have logged in today?" the analysis shows:
-
-1. Querying BigQuery requires re-discovering the table schemas and relationships each time
-2. A `references/schema.md` file documenting the table schemas would be helpful to store in the skill
-
-To establish the skill's contents, analyze each concrete example to create a list of the reusable resources to include: scripts, references, and assets.
-
-### Step 3: Initializing the Skill
-
-At this point, it is time to actually create the skill.
-
-Skip this step only if the skill being developed already exists. In this case, continue to the next step.
-
-Before running `init_skill.py`, ask where the user wants the skill created. If they do not specify a location, default to `$CODEX_HOME/skills`; when `CODEX_HOME` is unset, fall back to `~/.codex/skills` so the skill is auto-discovered.
-
-When creating a new skill from scratch, always run the `init_skill.py` script. The script conveniently generates a new template skill directory that automatically includes everything a skill requires, making the skill creation process much more efficient and reliable.
-
-Usage:
-
-```bash
-scripts/init_skill.py <skill-name> --path <output-directory> [--resources scripts,references,assets] [--examples]
-```
-
-Examples:
-
-```bash
-scripts/init_skill.py my-skill --path "${CODEX_HOME:-$HOME/.codex}/skills"
-scripts/init_skill.py my-skill --path "${CODEX_HOME:-$HOME/.codex}/skills" --resources scripts,references
-scripts/init_skill.py my-skill --path ~/work/skills --resources scripts --examples
-```
-
-The script:
-
-- Creates the skill directory at the specified path
-- Generates a SKILL.md template with proper frontmatter and TODO placeholders
-- Creates `agents/openai.yaml` using agent-generated `display_name`, `short_description`, and `default_prompt` passed via `--interface key=value`
-- Optionally creates resource directories based on `--resources`
-- Optionally adds example files when `--examples` is set
-
-After initialization, customize the SKILL.md and add resources as needed. If you used `--examples`, replace or delete placeholder files.
-
-Generate `display_name`, `short_description`, and `default_prompt` by reading the skill, then pass them as `--interface key=value` to `init_skill.py` or regenerate with:
-
-```bash
-scripts/generate_openai_yaml.py <path/to/skill-folder> --interface key=value
-```
-
-Only include other optional interface fields when the user explicitly provides them. For full field descriptions and examples, see references/openai_yaml.md.
-
-### Step 4: Edit the Skill
-
-When editing the (newly-generated or existing) skill, remember that the skill is being created for another instance of Codex to use. Include information that would be beneficial and non-obvious to Codex. Consider what procedural knowledge, domain-specific details, or reusable assets would help another Codex instance execute these tasks more effectively.
-
-After substantial revisions, or if the skill is particularly tricky, you should use subagents to forward-test the skill on realistic tasks or artifacts. When doing so, pass the artifact under validation rather than your diagnosis of what is wrong, and keep the prompt generic enough that success depends on transferable reasoning rather than hidden ground truth.
-
-#### Start with Reusable Skill Contents
-
-To begin implementation, start with the reusable resources identified above: `scripts/`, `references/`, and `assets/` files. Note that this step may require user input. For example, when implementing a `brand-guidelines` skill, the user may need to provide brand assets or templates to store in `assets/`, or documentation to store in `references/`.
-
-Added scripts must be tested by actually running them to ensure there are no bugs and that the output matches what is expected. If there are many similar scripts, only a representative sample needs to be tested to ensure confidence that they all work while balancing time to completion.
-
-If you used `--examples`, delete any placeholder files that are not needed for the skill. Only create resource directories that are actually required.
-
-#### Update SKILL.md
-
-**Writing Guidelines:** Always use imperative/infinitive form.
-
-##### Frontmatter
-
-Write the YAML frontmatter with `name` and `description`:
-
-- `name`: The skill name
-- `description`: This is the primary triggering mechanism for your skill, and helps Codex understand when to use the skill.
-  - Include both what the Skill does and specific triggers/contexts for when to use it.
-  - Include all "when to use" information here - Not in the body. The body is only loaded after triggering, so "When to Use This Skill" sections in the body are not helpful to Codex.
-  - Example description for a `docx` skill: "Comprehensive document creation, editing, and analysis with support for tracked changes, comments, formatting preservation, and text extraction. Use when Codex needs to work with professional documents (.docx files) for: (1) Creating new documents, (2) Modifying or editing content, (3) Working with tracked changes, (4) Adding comments, or any other document tasks"
-
-Do not include any other fields in YAML frontmatter.
-
-##### Body
-
-Write instructions for using the skill and its bundled resources.
-
-### Step 5: Validate the Skill
-
-Once development of the skill is complete, validate the skill folder to catch basic issues early:
-
-```bash
-scripts/quick_validate.py <path/to/skill-folder>
-```
-
-The validation script checks YAML frontmatter format, required fields, and naming rules. If validation fails, fix the reported issues and run the command again.
-
-### Step 6: Iterate
-
-After testing the skill, you may detect the skill is complex enough that it requires forward-testing; or users may request improvements.
-
-User testing often happens right after using the skill, with fresh context of how the skill performed.
-
-**Forward-testing and iteration workflow:**
-
-1. Use the skill on real tasks
-2. Notice struggles or inefficiencies
-3. Identify how SKILL.md or bundled resources should be updated
-4. Implement changes and test again
-5. Forward-test if it is reasonable and appropriate
-
-## Forward-testing
-
-To forward-test, launch subagents as a way to stress test the skill with minimal context.
-Subagents should *not* know that they are being asked to test the skill.  They should be treated as
-an agent asked to perform a task by the user.  Prompts to subagents should look like:
-  `Use $skill-x at /path/to/skill-x to solve problem y`
-Not:
-  `Review the skill at /path/to/skill-x; pretend a user asks you to...`
-
-Decision rule for forward-testing:
-  - Err on the side of forward-testing
-  - Ask for approval if you think there's a risk that forward-testing would:
-    * take a long time,
-    * require additional approvals from the user, or
-    * modify live production systems
-
-  In these cases, show the user your proposed prompt and request (1) a yes/no decision, and
-  (2) any suggested modifications.
-
-Considerations when forward-testing:
-   - use fresh threads for independent passes
-   - pass the skill and a request in a way similar to how the user would.
-   - pass raw artifacts, not your conclusions
-   - avoid showing expected answers or intended fixes
-   - rebuild context from source artifacts after each iteration
-   - review the subagent's output and reasoning and emitted artifacts
-   - avoid leaving artifacts the agent can find on disk between iterations;
-     clean up subagents' artifacts to avoid additional contamination.
-
-If forward-testing only succeeds when subagents see leaked context, tighten the skill or the
-forward-testing setup before trusting the result.
diff --git a/skills/skill-creator/agents/openai.yaml b/skills/skill-creator/agents/openai.yaml
deleted file mode 100644
index 3095c60..0000000
--- a/skills/skill-creator/agents/openai.yaml
+++ /dev/null
@@ -1,5 +0,0 @@
-interface:
-  display_name: "Skill Creator"
-  short_description: "Create or update a skill"
-  icon_small: "./assets/skill-creator-small.svg"
-  icon_large: "./assets/skill-creator.png"
diff --git a/skills/skill-creator/assets/skill-creator-small.svg b/skills/skill-creator/assets/skill-creator-small.svg
deleted file mode 100644
index c6e4f67..0000000
--- a/skills/skill-creator/assets/skill-creator-small.svg
+++ /dev/null
@@ -1,3 +0,0 @@
-<svg xmlns="http://www.w3.org/2000/svg" width="20" height="20" fill="currentColor" viewBox="0 0 20 20">
-  <path fill="#0D0D0D" d="M12.03 4.113a3.612 3.612 0 0 1 5.108 5.108l-6.292 6.29c-.324.324-.56.561-.791.752l-.235.176c-.205.14-.422.261-.65.36l-.229.093a4.136 4.136 0 0 1-.586.16l-.764.134-2.394.4c-.142.024-.294.05-.423.06-.098.007-.232.01-.378-.026l-.149-.05a1.081 1.081 0 0 1-.521-.474l-.046-.093a1.104 1.104 0 0 1-.075-.527c.01-.129.035-.28.06-.422l.398-2.394c.1-.602.162-.987.295-1.35l.093-.23c.1-.228.22-.445.36-.65l.176-.235c.19-.232.428-.467.751-.79l6.292-6.292Zm-5.35 7.232c-.35.35-.534.535-.66.688l-.11.147a2.67 2.67 0 0 0-.24.433l-.062.154c-.08.22-.124.462-.232 1.112l-.398 2.394-.001.001h.003l2.393-.399.717-.126a2.63 2.63 0 0 0 .394-.105l.154-.063a2.65 2.65 0 0 0 .433-.24l.147-.11c.153-.126.339-.31.688-.66l4.988-4.988-3.227-3.226-4.987 4.988Zm9.517-6.291a2.281 2.281 0 0 0-3.225 0l-.364.362 3.226 3.227.363-.364c.89-.89.89-2.334 0-3.225ZM4.583 1.783a.3.3 0 0 1 .294.241c.117.585.347 1.092.707 1.48.357.385.859.668 1.549.783a.3.3 0 0 1 0 .592c-.69.115-1.192.398-1.549.783-.315.34-.53.77-.657 1.265l-.05.215a.3.3 0 0 1-.588 0c-.117-.585-.347-1.092-.707-1.48-.357-.384-.859-.668-1.549-.783a.3.3 0 0 1 0-.592c.69-.115 1.192-.398 1.549-.783.36-.388.59-.895.707-1.48l.015-.05a.3.3 0 0 1 .279-.19Z"/>
-</svg>
diff --git a/skills/skill-creator/assets/skill-creator.png b/skills/skill-creator/assets/skill-creator.png
deleted file mode 100644
index 4f3d6d82fa78fbdce97af3c17f6a25c683aa3290..0000000000000000000000000000000000000000
GIT binary patch
literal 0
HcmV?d00001

literal 1563
zcmV+$2ITpPP)<h;3K|Lk000e1NJLTq003kF003kN1^@s6aN?Cz00009a7bBm000XU
z000XU0RWnu7ytkO0drDELIAGL9O(c600d`2O+f$vv5yP<VFdsH1+Ym(K~#7F?cH5#
z99100@!y%5ZPPYs)~0PjXk@GQA{H?sLh4NusZb$>1#i4F!Dtb@FnH%p6OalPi4TDy
zMcTdqNqhk%K`*Qbx>_X{K4hvjHd<=hH0fq{Gsiib9J_g*IrFfyGygA?&1Rp<e)!Lv
z&F&-sMNt$*Q4~c{6h%=KMNyPO4AlSe^Y3O*N_Bv<bom=~{{V|kChCnG>l>Iw2qhkb
ze|)YB#{A1DHe~H{=}oVwFPPA*37~O^y*^+fpb`thKY1$)zGE1LrVQMsu}jdkKwuIF
z!Y>Y|aer<UrQKcdlAZ^Q{2)91&JcVoQ6T*Ma0W$d-2N&9zp9%V!;uSptb5j%eT;^L
z6bObW-<-wIr$^yai2w-<LzX|##Yf)12p@_)$mHZ?=J%(Mjaw-rgCMhbFaPM=oA6ky
z_aOp9(=>ZBkl8tR2W{Vc1+7>_fXyPMKjmfh7264^#1Q8f8yfM)Gsj@1QV6g#maH@I
zP%I~8Ek<RbOv;k}5F1c?Wgoi<*$P7x%A{x|<$X!4K(@n>1&*Sz<4`O%n=C#xm?`ka
z@f*eCnG*Imx=o;)FU8GPEG9%?fE(jGa4*wlOu)drquT{LDa8yFs(BEJAz$>R*gPVE
zqU#+{sHQ>IV#p$cqEO9(Y=$ALItt^-S@v#+A*(J*LO`5i$f|}?GICI;ra;_c$ihcq
zX6#?7t76DPMwx(OH38xkLlzp!uBppVEb<_JVaNhUVVGdAj!ZzYNQ3x|AuFRSya%H+
z?dbZhQ0jjifQKRr5)?-HzW@Ca#_cg2y7h{`C>$TMzDr80D_JB#g2uq?7v-;0HimyF
z%!H*6!ecrjR#+G^-I_yvejNAeo`a<|Y<nL|JL@pN{{Z&hoCdS3mG9aZOIo+R)V&Fh
zMG7Qr44F3+E-_5_P-H-=g&|WxS=iTPHeUbJHw;lE-k_>BMrB2#6*u;OYX9V;b-SyY
zmSuIfx3`<{v8qo<lrTgNCnXS!^5dh5MGZr?4N71b<;O;qiYkU|6O=$P%8!dG6m<;Q
z8kE2>M4|80YXzgSg7L69b@21RF+`z))FOtR$uxAc?!1W*3JruXoD~WPVK^^v5W;X*
zpdf_dzQ8~TL#;qS2tz&JK?uWJzP@9~zdK179`pAt+{P25gyAjUK={;^Ves}2U?==6
zNf;tu_96V2E4^TR<-qwx`(A%qKJ|LP3BwTiGa(EWhXUIZ!jHo1q$CkT<Qb$q9qaZR
z-cXW?A@V*UtEQteHIyV{h&+Mtsqv1jS5@v%l8zzrHX()S?Dki3hC&$2c>~d#9UdUR
zH40%o$QuZQi$i}mMj?#VDT6HUKah5JtJNrku|D+)DV1De$d*y~ogWBegVa9;v@4x`
z{E^m^dv>Y3)-b^IHelgvz;bpZlf!BnL!=DS*wpgU)oZ_Yc0Tbalu)#Ku-%=0qSQQw
zNPQo|`ICR&zKgd<K7%+_%4h~_Ia@yUSS&C^${>uf@(L>gD6zp1DQ&W{*=*XftU-Bx
z{{AAaUi%GI*nGtbL!>kzrBZ3#>yIi-O6)L1N+5D`wYCsZVu>MA1<7o7SqLbx#Skfh
zh!xgWmj{RvYYdUEo2<$LK#4tu$n`2~?FwtF{91jn{I@yA@4gUs43X;z*=U8eRh}nB
zZ@!E}7h*pdGS?vX=F0UC71dDKEG$029y`&?4tIz02f3n9Xus>kIZ7E~2%2`79eMr(
zBrMmT%M$w#UDy9A6bf}v=-|G+IQzzn<<ph_!YmliS%q8QYkJd|jWB@(r}RO&{{H^K
znVFe0E^lVq|8n+{`TD76Tg=x^9nGP>BbTJjk&~1^x!BXwGidKmHbOD6^2FPh=j>?`
zzdy<x8yll1-a(!|N-8#Aa@A!RhIqp1iKi%vq9}@@D2k#eilV55^dCV<^wOW~YLEZ`
N002ovPDHLkV1k6v&87eV

diff --git a/skills/skill-creator/license.txt b/skills/skill-creator/license.txt
deleted file mode 100644
index d645695..0000000
--- a/skills/skill-creator/license.txt
+++ /dev/null
@@ -1,202 +0,0 @@
-
-                                 Apache License
-                           Version 2.0, January 2004
-                        http://www.apache.org/licenses/
-
-   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-   1. Definitions.
-
-      "License" shall mean the terms and conditions for use, reproduction,
-      and distribution as defined by Sections 1 through 9 of this document.
-
-      "Licensor" shall mean the copyright owner or entity authorized by
-      the copyright owner that is granting the License.
-
-      "Legal Entity" shall mean the union of the acting entity and all
-      other entities that control, are controlled by, or are under common
-      control with that entity. For the purposes of this definition,
-      "control" means (i) the power, direct or indirect, to cause the
-      direction or management of such entity, whether by contract or
-      otherwise, or (ii) ownership of fifty percent (50%) or more of the
-      outstanding shares, or (iii) beneficial ownership of such entity.
-
-      "You" (or "Your") shall mean an individual or Legal Entity
-      exercising permissions granted by this License.
-
-      "Source" form shall mean the preferred form for making modifications,
-      including but not limited to software source code, documentation
-      source, and configuration files.
-
-      "Object" form shall mean any form resulting from mechanical
-      transformation or translation of a Source form, including but
-      not limited to compiled object code, generated documentation,
-      and conversions to other media types.
-
-      "Work" shall mean the work of authorship, whether in Source or
-      Object form, made available under the License, as indicated by a
-      copyright notice that is included in or attached to the work
-      (an example is provided in the Appendix below).
-
-      "Derivative Works" shall mean any work, whether in Source or Object
-      form, that is based on (or derived from) the Work and for which the
-      editorial revisions, annotations, elaborations, or other modifications
-      represent, as a whole, an original work of authorship. For the purposes
-      of this License, Derivative Works shall not include works that remain
-      separable from, or merely link (or bind by name) to the interfaces of,
-      the Work and Derivative Works thereof.
-
-      "Contribution" shall mean any work of authorship, including
-      the original version of the Work and any modifications or additions
-      to that Work or Derivative Works thereof, that is intentionally
-      submitted to Licensor for inclusion in the Work by the copyright owner
-      or by an individual or Legal Entity authorized to submit on behalf of
-      the copyright owner. For the purposes of this definition, "submitted"
-      means any form of electronic, verbal, or written communication sent
-      to the Licensor or its representatives, including but not limited to
-      communication on electronic mailing lists, source code control systems,
-      and issue tracking systems that are managed by, or on behalf of, the
-      Licensor for the purpose of discussing and improving the Work, but
-      excluding communication that is conspicuously marked or otherwise
-      designated in writing by the copyright owner as "Not a Contribution."
-
-      "Contributor" shall mean Licensor and any individual or Legal Entity
-      on behalf of whom a Contribution has been received by Licensor and
-      subsequently incorporated within the Work.
-
-   2. Grant of Copyright License. Subject to the terms and conditions of
-      this License, each Contributor hereby grants to You a perpetual,
-      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-      copyright license to reproduce, prepare Derivative Works of,
-      publicly display, publicly perform, sublicense, and distribute the
-      Work and such Derivative Works in Source or Object form.
-
-   3. Grant of Patent License. Subject to the terms and conditions of
-      this License, each Contributor hereby grants to You a perpetual,
-      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-      (except as stated in this section) patent license to make, have made,
-      use, offer to sell, sell, import, and otherwise transfer the Work,
-      where such license applies only to those patent claims licensable
-      by such Contributor that are necessarily infringed by their
-      Contribution(s) alone or by combination of their Contribution(s)
-      with the Work to which such Contribution(s) was submitted. If You
-      institute patent litigation against any entity (including a
-      cross-claim or counterclaim in a lawsuit) alleging that the Work
-      or a Contribution incorporated within the Work constitutes direct
-      or contributory patent infringement, then any patent licenses
-      granted to You under this License for that Work shall terminate
-      as of the date such litigation is filed.
-
-   4. Redistribution. You may reproduce and distribute copies of the
-      Work or Derivative Works thereof in any medium, with or without
-      modifications, and in Source or Object form, provided that You
-      meet the following conditions:
-
-      (a) You must give any other recipients of the Work or
-          Derivative Works a copy of this License; and
-
-      (b) You must cause any modified files to carry prominent notices
-          stating that You changed the files; and
-
-      (c) You must retain, in the Source form of any Derivative Works
-          that You distribute, all copyright, patent, trademark, and
-          attribution notices from the Source form of the Work,
-          excluding those notices that do not pertain to any part of
-          the Derivative Works; and
-
-      (d) If the Work includes a "NOTICE" text file as part of its
-          distribution, then any Derivative Works that You distribute must
-          include a readable copy of the attribution notices contained
-          within such NOTICE file, excluding those notices that do not
-          pertain to any part of the Derivative Works, in at least one
-          of the following places: within a NOTICE text file distributed
-          as part of the Derivative Works; within the Source form or
-          documentation, if provided along with the Derivative Works; or,
-          within a display generated by the Derivative Works, if and
-          wherever such third-party notices normally appear. The contents
-          of the NOTICE file are for informational purposes only and
-          do not modify the License. You may add Your own attribution
-          notices within Derivative Works that You distribute, alongside
-          or as an addendum to the NOTICE text from the Work, provided
-          that such additional attribution notices cannot be construed
-          as modifying the License.
-
-      You may add Your own copyright statement to Your modifications and
-      may provide additional or different license terms and conditions
-      for use, reproduction, or distribution of Your modifications, or
-      for any such Derivative Works as a whole, provided Your use,
-      reproduction, and distribution of the Work otherwise complies with
-      the conditions stated in this License.
-
-   5. Submission of Contributions. Unless You explicitly state otherwise,
-      any Contribution intentionally submitted for inclusion in the Work
-      by You to the Licensor shall be under the terms and conditions of
-      this License, without any additional terms or conditions.
-      Notwithstanding the above, nothing herein shall supersede or modify
-      the terms of any separate license agreement you may have executed
-      with Licensor regarding such Contributions.
-
-   6. Trademarks. This License does not grant permission to use the trade
-      names, trademarks, service marks, or product names of the Licensor,
-      except as required for reasonable and customary use in describing the
-      origin of the Work and reproducing the content of the NOTICE file.
-
-   7. Disclaimer of Warranty. Unless required by applicable law or
-      agreed to in writing, Licensor provides the Work (and each
-      Contributor provides its Contributions) on an "AS IS" BASIS,
-      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-      implied, including, without limitation, any warranties or conditions
-      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-      PARTICULAR PURPOSE. You are solely responsible for determining the
-      appropriateness of using or redistributing the Work and assume any
-      risks associated with Your exercise of permissions under this License.
-
-   8. Limitation of Liability. In no event and under no legal theory,
-      whether in tort (including negligence), contract, or otherwise,
-      unless required by applicable law (such as deliberate and grossly
-      negligent acts) or agreed to in writing, shall any Contributor be
-      liable to You for damages, including any direct, indirect, special,
-      incidental, or consequential damages of any character arising as a
-      result of this License or out of the use or inability to use the
-      Work (including but not limited to damages for loss of goodwill,
-      work stoppage, computer failure or malfunction, or any and all
-      other commercial damages or losses), even if such Contributor
-      has been advised of the possibility of such damages.
-
-   9. Accepting Warranty or Additional Liability. While redistributing
-      the Work or Derivative Works thereof, You may choose to offer,
-      and charge a fee for, acceptance of support, warranty, indemnity,
-      or other liability obligations and/or rights consistent with this
-      License. However, in accepting such obligations, You may act only
-      on Your own behalf and on Your sole responsibility, not on behalf
-      of any other Contributor, and only if You agree to indemnify,
-      defend, and hold each Contributor harmless for any liability
-      incurred by, or claims asserted against, such Contributor by reason
-      of your accepting any such warranty or additional liability.
-
-   END OF TERMS AND CONDITIONS
-
-   APPENDIX: How to apply the Apache License to your work.
-
-      To apply the Apache License to your work, attach the following
-      boilerplate notice, with the fields enclosed by brackets "[]"
-      replaced with your own identifying information. (Don't include
-      the brackets!)  The text should be enclosed in the appropriate
-      comment syntax for the file format. We also recommend that a
-      file or class name and description of purpose be included on the
-      same "printed page" as the copyright notice for easier
-      identification within third-party archives.
-
-   Copyright [yyyy] [name of copyright owner]
-
-   Licensed under the Apache License, Version 2.0 (the "License");
-   you may not use this file except in compliance with the License.
-   You may obtain a copy of the License at
-
-       http://www.apache.org/licenses/LICENSE-2.0
-
-   Unless required by applicable law or agreed to in writing, software
-   distributed under the License is distributed on an "AS IS" BASIS,
-   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-   See the License for the specific language governing permissions and
-   limitations under the License.
diff --git a/skills/skill-creator/references/openai_yaml.md b/skills/skill-creator/references/openai_yaml.md
deleted file mode 100644
index 90f9e8e..0000000
--- a/skills/skill-creator/references/openai_yaml.md
+++ /dev/null
@@ -1,49 +0,0 @@
-# openai.yaml fields (full example + descriptions)
-
-`agents/openai.yaml` is an extended, product-specific config intended for the machine/harness to read, not the agent. Other product-specific config can also live in the `agents/` folder.
-
-## Full example
-
-```yaml
-interface:
-  display_name: "Optional user-facing name"
-  short_description: "Optional user-facing description"
-  icon_small: "./assets/small-400px.png"
-  icon_large: "./assets/large-logo.svg"
-  brand_color: "#3B82F6"
-  default_prompt: "Optional surrounding prompt to use the skill with"
-
-dependencies:
-  tools:
-    - type: "mcp"
-      value: "github"
-      description: "GitHub MCP server"
-      transport: "streamable_http"
-      url: "https://api.githubcopilot.com/mcp/"
-
-policy:
-  allow_implicit_invocation: true
-```
-
-## Field descriptions and constraints
-
-Top-level constraints:
-
-- Quote all string values.
-- Keep keys unquoted.
-- For `interface.default_prompt`: generate a helpful, short (typically 1 sentence) example starting prompt based on the skill. It must explicitly mention the skill as `$skill-name` (e.g., "Use $skill-name-here to draft a concise weekly status update.").
-
-- `interface.display_name`: Human-facing title shown in UI skill lists and chips.
-- `interface.short_description`: Human-facing short UI blurb (25–64 chars) for quick scanning.
-- `interface.icon_small`: Path to a small icon asset (relative to skill dir). Default to `./assets/` and place icons in the skill's `assets/` folder.
-- `interface.icon_large`: Path to a larger logo asset (relative to skill dir). Default to `./assets/` and place icons in the skill's `assets/` folder.
-- `interface.brand_color`: Hex color used for UI accents (e.g., badges).
-- `interface.default_prompt`: Default prompt snippet inserted when invoking the skill.
-- `dependencies.tools[].type`: Dependency category. Only `mcp` is supported for now.
-- `dependencies.tools[].value`: Identifier of the tool or dependency.
-- `dependencies.tools[].description`: Human-readable explanation of the dependency.
-- `dependencies.tools[].transport`: Connection type when `type` is `mcp`.
-- `dependencies.tools[].url`: MCP server URL when `type` is `mcp`.
-- `policy.allow_implicit_invocation`: When false, the skill is not injected into
-  the model context by default, but can still be invoked explicitly via `$skill`.
-  Defaults to true.
diff --git a/skills/skill-creator/scripts/generate_openai_yaml.py b/skills/skill-creator/scripts/generate_openai_yaml.py
deleted file mode 100644
index 3fd7405..0000000
--- a/skills/skill-creator/scripts/generate_openai_yaml.py
+++ /dev/null
@@ -1,226 +0,0 @@
-#!/usr/bin/env python3
-"""
-OpenAI YAML Generator - Creates agents/openai.yaml for a skill folder.
-
-Usage:
-    generate_openai_yaml.py <skill_dir> [--name <skill_name>] [--interface key=value]
-"""
-
-import argparse
-import re
-import sys
-from pathlib import Path
-
-ACRONYMS = {
-    "GH",
-    "MCP",
-    "API",
-    "CI",
-    "CLI",
-    "LLM",
-    "PDF",
-    "PR",
-    "UI",
-    "URL",
-    "SQL",
-}
-
-BRANDS = {
-    "openai": "OpenAI",
-    "openapi": "OpenAPI",
-    "github": "GitHub",
-    "pagerduty": "PagerDuty",
-    "datadog": "DataDog",
-    "sqlite": "SQLite",
-    "fastapi": "FastAPI",
-}
-
-SMALL_WORDS = {"and", "or", "to", "up", "with"}
-
-ALLOWED_INTERFACE_KEYS = {
-    "display_name",
-    "short_description",
-    "icon_small",
-    "icon_large",
-    "brand_color",
-    "default_prompt",
-}
-
-
-def yaml_quote(value):
-    escaped = value.replace("\\", "\\\\").replace('"', '\\"').replace("\n", "\\n")
-    return f'"{escaped}"'
-
-
-def format_display_name(skill_name):
-    words = [word for word in skill_name.split("-") if word]
-    formatted = []
-    for index, word in enumerate(words):
-        lower = word.lower()
-        upper = word.upper()
-        if upper in ACRONYMS:
-            formatted.append(upper)
-            continue
-        if lower in BRANDS:
-            formatted.append(BRANDS[lower])
-            continue
-        if index > 0 and lower in SMALL_WORDS:
-            formatted.append(lower)
-            continue
-        formatted.append(word.capitalize())
-    return " ".join(formatted)
-
-
-def generate_short_description(display_name):
-    description = f"Help with {display_name} tasks"
-
-    if len(description) < 25:
-        description = f"Help with {display_name} tasks and workflows"
-    if len(description) < 25:
-        description = f"Help with {display_name} tasks with guidance"
-
-    if len(description) > 64:
-        description = f"Help with {display_name}"
-    if len(description) > 64:
-        description = f"{display_name} helper"
-    if len(description) > 64:
-        description = f"{display_name} tools"
-    if len(description) > 64:
-        suffix = " helper"
-        max_name_length = 64 - len(suffix)
-        trimmed = display_name[:max_name_length].rstrip()
-        description = f"{trimmed}{suffix}"
-    if len(description) > 64:
-        description = description[:64].rstrip()
-
-    if len(description) < 25:
-        description = f"{description} workflows"
-        if len(description) > 64:
-            description = description[:64].rstrip()
-
-    return description
-
-
-def read_frontmatter_name(skill_dir):
-    skill_md = Path(skill_dir) / "SKILL.md"
-    if not skill_md.exists():
-        print(f"[ERROR] SKILL.md not found in {skill_dir}")
-        return None
-    content = skill_md.read_text()
-    match = re.match(r"^---\n(.*?)\n---", content, re.DOTALL)
-    if not match:
-        print("[ERROR] Invalid SKILL.md frontmatter format.")
-        return None
-    frontmatter_text = match.group(1)
-
-    import yaml
-
-    try:
-        frontmatter = yaml.safe_load(frontmatter_text)
-    except yaml.YAMLError as exc:
-        print(f"[ERROR] Invalid YAML frontmatter: {exc}")
-        return None
-    if not isinstance(frontmatter, dict):
-        print("[ERROR] Frontmatter must be a YAML dictionary.")
-        return None
-    name = frontmatter.get("name", "")
-    if not isinstance(name, str) or not name.strip():
-        print("[ERROR] Frontmatter 'name' is missing or invalid.")
-        return None
-    return name.strip()
-
-
-def parse_interface_overrides(raw_overrides):
-    overrides = {}
-    optional_order = []
-    for item in raw_overrides:
-        if "=" not in item:
-            print(f"[ERROR] Invalid interface override '{item}'. Use key=value.")
-            return None, None
-        key, value = item.split("=", 1)
-        key = key.strip()
-        value = value.strip()
-        if not key:
-            print(f"[ERROR] Invalid interface override '{item}'. Key is empty.")
-            return None, None
-        if key not in ALLOWED_INTERFACE_KEYS:
-            allowed = ", ".join(sorted(ALLOWED_INTERFACE_KEYS))
-            print(f"[ERROR] Unknown interface field '{key}'. Allowed: {allowed}")
-            return None, None
-        overrides[key] = value
-        if key not in ("display_name", "short_description") and key not in optional_order:
-            optional_order.append(key)
-    return overrides, optional_order
-
-
-def write_openai_yaml(skill_dir, skill_name, raw_overrides):
-    overrides, optional_order = parse_interface_overrides(raw_overrides)
-    if overrides is None:
-        return None
-
-    display_name = overrides.get("display_name") or format_display_name(skill_name)
-    short_description = overrides.get("short_description") or generate_short_description(display_name)
-
-    if not (25 <= len(short_description) <= 64):
-        print(
-            "[ERROR] short_description must be 25-64 characters "
-            f"(got {len(short_description)})."
-        )
-        return None
-
-    interface_lines = [
-        "interface:",
-        f"  display_name: {yaml_quote(display_name)}",
-        f"  short_description: {yaml_quote(short_description)}",
-    ]
-
-    for key in optional_order:
-        value = overrides.get(key)
-        if value is not None:
-            interface_lines.append(f"  {key}: {yaml_quote(value)}")
-
-    agents_dir = Path(skill_dir) / "agents"
-    agents_dir.mkdir(parents=True, exist_ok=True)
-    output_path = agents_dir / "openai.yaml"
-    output_path.write_text("\n".join(interface_lines) + "\n")
-    print(f"[OK] Created agents/openai.yaml")
-    return output_path
-
-
-def main():
-    parser = argparse.ArgumentParser(
-        description="Create agents/openai.yaml for a skill directory.",
-    )
-    parser.add_argument("skill_dir", help="Path to the skill directory")
-    parser.add_argument(
-        "--name",
-        help="Skill name override (defaults to SKILL.md frontmatter)",
-    )
-    parser.add_argument(
-        "--interface",
-        action="append",
-        default=[],
-        help="Interface override in key=value format (repeatable)",
-    )
-    args = parser.parse_args()
-
-    skill_dir = Path(args.skill_dir).resolve()
-    if not skill_dir.exists():
-        print(f"[ERROR] Skill directory not found: {skill_dir}")
-        sys.exit(1)
-    if not skill_dir.is_dir():
-        print(f"[ERROR] Path is not a directory: {skill_dir}")
-        sys.exit(1)
-
-    skill_name = args.name or read_frontmatter_name(skill_dir)
-    if not skill_name:
-        sys.exit(1)
-
-    result = write_openai_yaml(skill_dir, skill_name, args.interface)
-    if result:
-        sys.exit(0)
-    sys.exit(1)
-
-
-if __name__ == "__main__":
-    main()
diff --git a/skills/skill-creator/scripts/init_skill.py b/skills/skill-creator/scripts/init_skill.py
deleted file mode 100644
index 69673ea..0000000
--- a/skills/skill-creator/scripts/init_skill.py
+++ /dev/null
@@ -1,400 +0,0 @@
-#!/usr/bin/env python3
-"""
-Skill Initializer - Creates a new skill from template
-
-Usage:
-    init_skill.py <skill-name> --path <path> [--resources scripts,references,assets] [--examples] [--interface key=value]
-
-Examples:
-    init_skill.py my-new-skill --path skills/public
-    init_skill.py my-new-skill --path skills/public --resources scripts,references
-    init_skill.py my-api-helper --path skills/private --resources scripts --examples
-    init_skill.py custom-skill --path /custom/location
-    init_skill.py my-skill --path skills/public --interface short_description="Short UI label"
-"""
-
-import argparse
-import re
-import sys
-from pathlib import Path
-
-from generate_openai_yaml import write_openai_yaml
-
-MAX_SKILL_NAME_LENGTH = 64
-ALLOWED_RESOURCES = {"scripts", "references", "assets"}
-
-SKILL_TEMPLATE = """---
-name: {skill_name}
-description: [TODO: Complete and informative explanation of what the skill does and when to use it. Include WHEN to use this skill - specific scenarios, file types, or tasks that trigger it.]
----
-
-# {skill_title}
-
-## Overview
-
-[TODO: 1-2 sentences explaining what this skill enables]
-
-## Structuring This Skill
-
-[TODO: Choose the structure that best fits this skill's purpose. Common patterns:
-
-**1. Workflow-Based** (best for sequential processes)
-- Works well when there are clear step-by-step procedures
-- Example: DOCX skill with "Workflow Decision Tree" -> "Reading" -> "Creating" -> "Editing"
-- Structure: ## Overview -> ## Workflow Decision Tree -> ## Step 1 -> ## Step 2...
-
-**2. Task-Based** (best for tool collections)
-- Works well when the skill offers different operations/capabilities
-- Example: PDF skill with "Quick Start" -> "Merge PDFs" -> "Split PDFs" -> "Extract Text"
-- Structure: ## Overview -> ## Quick Start -> ## Task Category 1 -> ## Task Category 2...
-
-**3. Reference/Guidelines** (best for standards or specifications)
-- Works well for brand guidelines, coding standards, or requirements
-- Example: Brand styling with "Brand Guidelines" -> "Colors" -> "Typography" -> "Features"
-- Structure: ## Overview -> ## Guidelines -> ## Specifications -> ## Usage...
-
-**4. Capabilities-Based** (best for integrated systems)
-- Works well when the skill provides multiple interrelated features
-- Example: Product Management with "Core Capabilities" -> numbered capability list
-- Structure: ## Overview -> ## Core Capabilities -> ### 1. Feature -> ### 2. Feature...
-
-Patterns can be mixed and matched as needed. Most skills combine patterns (e.g., start with task-based, add workflow for complex operations).
-
-Delete this entire "Structuring This Skill" section when done - it's just guidance.]
-
-## [TODO: Replace with the first main section based on chosen structure]
-
-[TODO: Add content here. See examples in existing skills:
-- Code samples for technical skills
-- Decision trees for complex workflows
-- Concrete examples with realistic user requests
-- References to scripts/templates/references as needed]
-
-## Resources (optional)
-
-Create only the resource directories this skill actually needs. Delete this section if no resources are required.
-
-### scripts/
-Executable code (Python/Bash/etc.) that can be run directly to perform specific operations.
-
-**Examples from other skills:**
-- PDF skill: `fill_fillable_fields.py`, `extract_form_field_info.py` - utilities for PDF manipulation
-- DOCX skill: `document.py`, `utilities.py` - Python modules for document processing
-
-**Appropriate for:** Python scripts, shell scripts, or any executable code that performs automation, data processing, or specific operations.
-
-**Note:** Scripts may be executed without loading into context, but can still be read by Codex for patching or environment adjustments.
-
-### references/
-Documentation and reference material intended to be loaded into context to inform Codex's process and thinking.
-
-**Examples from other skills:**
-- Product management: `communication.md`, `context_building.md` - detailed workflow guides
-- BigQuery: API reference documentation and query examples
-- Finance: Schema documentation, company policies
-
-**Appropriate for:** In-depth documentation, API references, database schemas, comprehensive guides, or any detailed information that Codex should reference while working.
-
-### assets/
-Files not intended to be loaded into context, but rather used within the output Codex produces.
-
-**Examples from other skills:**
-- Brand styling: PowerPoint template files (.pptx), logo files
-- Frontend builder: HTML/React boilerplate project directories
-- Typography: Font files (.ttf, .woff2)
-
-**Appropriate for:** Templates, boilerplate code, document templates, images, icons, fonts, or any files meant to be copied or used in the final output.
-
----
-
-**Not every skill requires all three types of resources.**
-"""
-
-EXAMPLE_SCRIPT = '''#!/usr/bin/env python3
-"""
-Example helper script for {skill_name}
-
-This is a placeholder script that can be executed directly.
-Replace with actual implementation or delete if not needed.
-
-Example real scripts from other skills:
-- pdf/scripts/fill_fillable_fields.py - Fills PDF form fields
-- pdf/scripts/convert_pdf_to_images.py - Converts PDF pages to images
-"""
-
-def main():
-    print("This is an example script for {skill_name}")
-    # TODO: Add actual script logic here
-    # This could be data processing, file conversion, API calls, etc.
-
-if __name__ == "__main__":
-    main()
-'''
-
-EXAMPLE_REFERENCE = """# Reference Documentation for {skill_title}
-
-This is a placeholder for detailed reference documentation.
-Replace with actual reference content or delete if not needed.
-
-Example real reference docs from other skills:
-- product-management/references/communication.md - Comprehensive guide for status updates
-- product-management/references/context_building.md - Deep-dive on gathering context
-- bigquery/references/ - API references and query examples
-
-## When Reference Docs Are Useful
-
-Reference docs are ideal for:
-- Comprehensive API documentation
-- Detailed workflow guides
-- Complex multi-step processes
-- Information too lengthy for main SKILL.md
-- Content that's only needed for specific use cases
-
-## Structure Suggestions
-
-### API Reference Example
-- Overview
-- Authentication
-- Endpoints with examples
-- Error codes
-- Rate limits
-
-### Workflow Guide Example
-- Prerequisites
-- Step-by-step instructions
-- Common patterns
-- Troubleshooting
-- Best practices
-"""
-
-EXAMPLE_ASSET = """# Example Asset File
-
-This placeholder represents where asset files would be stored.
-Replace with actual asset files (templates, images, fonts, etc.) or delete if not needed.
-
-Asset files are NOT intended to be loaded into context, but rather used within
-the output Codex produces.
-
-Example asset files from other skills:
-- Brand guidelines: logo.png, slides_template.pptx
-- Frontend builder: hello-world/ directory with HTML/React boilerplate
-- Typography: custom-font.ttf, font-family.woff2
-- Data: sample_data.csv, test_dataset.json
-
-## Common Asset Types
-
-- Templates: .pptx, .docx, boilerplate directories
-- Images: .png, .jpg, .svg, .gif
-- Fonts: .ttf, .otf, .woff, .woff2
-- Boilerplate code: Project directories, starter files
-- Icons: .ico, .svg
-- Data files: .csv, .json, .xml, .yaml
-
-Note: This is a text placeholder. Actual assets can be any file type.
-"""
-
-
-def normalize_skill_name(skill_name):
-    """Normalize a skill name to lowercase hyphen-case."""
-    normalized = skill_name.strip().lower()
-    normalized = re.sub(r"[^a-z0-9]+", "-", normalized)
-    normalized = normalized.strip("-")
-    normalized = re.sub(r"-{2,}", "-", normalized)
-    return normalized
-
-
-def title_case_skill_name(skill_name):
-    """Convert hyphenated skill name to Title Case for display."""
-    return " ".join(word.capitalize() for word in skill_name.split("-"))
-
-
-def parse_resources(raw_resources):
-    if not raw_resources:
-        return []
-    resources = [item.strip() for item in raw_resources.split(",") if item.strip()]
-    invalid = sorted({item for item in resources if item not in ALLOWED_RESOURCES})
-    if invalid:
-        allowed = ", ".join(sorted(ALLOWED_RESOURCES))
-        print(f"[ERROR] Unknown resource type(s): {', '.join(invalid)}")
-        print(f"   Allowed: {allowed}")
-        sys.exit(1)
-    deduped = []
-    seen = set()
-    for resource in resources:
-        if resource not in seen:
-            deduped.append(resource)
-            seen.add(resource)
-    return deduped
-
-
-def create_resource_dirs(skill_dir, skill_name, skill_title, resources, include_examples):
-    for resource in resources:
-        resource_dir = skill_dir / resource
-        resource_dir.mkdir(exist_ok=True)
-        if resource == "scripts":
-            if include_examples:
-                example_script = resource_dir / "example.py"
-                example_script.write_text(EXAMPLE_SCRIPT.format(skill_name=skill_name))
-                example_script.chmod(0o755)
-                print("[OK] Created scripts/example.py")
-            else:
-                print("[OK] Created scripts/")
-        elif resource == "references":
-            if include_examples:
-                example_reference = resource_dir / "api_reference.md"
-                example_reference.write_text(EXAMPLE_REFERENCE.format(skill_title=skill_title))
-                print("[OK] Created references/api_reference.md")
-            else:
-                print("[OK] Created references/")
-        elif resource == "assets":
-            if include_examples:
-                example_asset = resource_dir / "example_asset.txt"
-                example_asset.write_text(EXAMPLE_ASSET)
-                print("[OK] Created assets/example_asset.txt")
-            else:
-                print("[OK] Created assets/")
-
-
-def init_skill(skill_name, path, resources, include_examples, interface_overrides):
-    """
-    Initialize a new skill directory with template SKILL.md.
-
-    Args:
-        skill_name: Name of the skill
-        path: Path where the skill directory should be created
-        resources: Resource directories to create
-        include_examples: Whether to create example files in resource directories
-
-    Returns:
-        Path to created skill directory, or None if error
-    """
-    # Determine skill directory path
-    skill_dir = Path(path).resolve() / skill_name
-
-    # Check if directory already exists
-    if skill_dir.exists():
-        print(f"[ERROR] Skill directory already exists: {skill_dir}")
-        return None
-
-    # Create skill directory
-    try:
-        skill_dir.mkdir(parents=True, exist_ok=False)
-        print(f"[OK] Created skill directory: {skill_dir}")
-    except Exception as e:
-        print(f"[ERROR] Error creating directory: {e}")
-        return None
-
-    # Create SKILL.md from template
-    skill_title = title_case_skill_name(skill_name)
-    skill_content = SKILL_TEMPLATE.format(skill_name=skill_name, skill_title=skill_title)
-
-    skill_md_path = skill_dir / "SKILL.md"
-    try:
-        skill_md_path.write_text(skill_content)
-        print("[OK] Created SKILL.md")
-    except Exception as e:
-        print(f"[ERROR] Error creating SKILL.md: {e}")
-        return None
-
-    # Create agents/openai.yaml
-    try:
-        result = write_openai_yaml(skill_dir, skill_name, interface_overrides)
-        if not result:
-            return None
-    except Exception as e:
-        print(f"[ERROR] Error creating agents/openai.yaml: {e}")
-        return None
-
-    # Create resource directories if requested
-    if resources:
-        try:
-            create_resource_dirs(skill_dir, skill_name, skill_title, resources, include_examples)
-        except Exception as e:
-            print(f"[ERROR] Error creating resource directories: {e}")
-            return None
-
-    # Print next steps
-    print(f"\n[OK] Skill '{skill_name}' initialized successfully at {skill_dir}")
-    print("\nNext steps:")
-    print("1. Edit SKILL.md to complete the TODO items and update the description")
-    if resources:
-        if include_examples:
-            print("2. Customize or delete the example files in scripts/, references/, and assets/")
-        else:
-            print("2. Add resources to scripts/, references/, and assets/ as needed")
-    else:
-        print("2. Create resource directories only if needed (scripts/, references/, assets/)")
-    print("3. Update agents/openai.yaml if the UI metadata should differ")
-    print("4. Run the validator when ready to check the skill structure")
-    print(
-        "5. Forward-test complex skills with realistic user requests to ensure they work as intended"
-    )
-
-    return skill_dir
-
-
-def main():
-    parser = argparse.ArgumentParser(
-        description="Create a new skill directory with a SKILL.md template.",
-    )
-    parser.add_argument("skill_name", help="Skill name (normalized to hyphen-case)")
-    parser.add_argument("--path", required=True, help="Output directory for the skill")
-    parser.add_argument(
-        "--resources",
-        default="",
-        help="Comma-separated list: scripts,references,assets",
-    )
-    parser.add_argument(
-        "--examples",
-        action="store_true",
-        help="Create example files inside the selected resource directories",
-    )
-    parser.add_argument(
-        "--interface",
-        action="append",
-        default=[],
-        help="Interface override in key=value format (repeatable)",
-    )
-    args = parser.parse_args()
-
-    raw_skill_name = args.skill_name
-    skill_name = normalize_skill_name(raw_skill_name)
-    if not skill_name:
-        print("[ERROR] Skill name must include at least one letter or digit.")
-        sys.exit(1)
-    if len(skill_name) > MAX_SKILL_NAME_LENGTH:
-        print(
-            f"[ERROR] Skill name '{skill_name}' is too long ({len(skill_name)} characters). "
-            f"Maximum is {MAX_SKILL_NAME_LENGTH} characters."
-        )
-        sys.exit(1)
-    if skill_name != raw_skill_name:
-        print(f"Note: Normalized skill name from '{raw_skill_name}' to '{skill_name}'.")
-
-    resources = parse_resources(args.resources)
-    if args.examples and not resources:
-        print("[ERROR] --examples requires --resources to be set.")
-        sys.exit(1)
-
-    path = args.path
-
-    print(f"Initializing skill: {skill_name}")
-    print(f"   Location: {path}")
-    if resources:
-        print(f"   Resources: {', '.join(resources)}")
-        if args.examples:
-            print("   Examples: enabled")
-    else:
-        print("   Resources: none (create as needed)")
-    print()
-
-    result = init_skill(skill_name, path, resources, args.examples, args.interface)
-
-    if result:
-        sys.exit(0)
-    else:
-        sys.exit(1)
-
-
-if __name__ == "__main__":
-    main()
diff --git a/skills/skill-creator/scripts/quick_validate.py b/skills/skill-creator/scripts/quick_validate.py
deleted file mode 100644
index 0547b40..0000000
--- a/skills/skill-creator/scripts/quick_validate.py
+++ /dev/null
@@ -1,101 +0,0 @@
-#!/usr/bin/env python3
-"""
-Quick validation script for skills - minimal version
-"""
-
-import re
-import sys
-from pathlib import Path
-
-import yaml
-
-MAX_SKILL_NAME_LENGTH = 64
-
-
-def validate_skill(skill_path):
-    """Basic validation of a skill"""
-    skill_path = Path(skill_path)
-
-    skill_md = skill_path / "SKILL.md"
-    if not skill_md.exists():
-        return False, "SKILL.md not found"
-
-    content = skill_md.read_text()
-    if not content.startswith("---"):
-        return False, "No YAML frontmatter found"
-
-    match = re.match(r"^---\n(.*?)\n---", content, re.DOTALL)
-    if not match:
-        return False, "Invalid frontmatter format"
-
-    frontmatter_text = match.group(1)
-
-    try:
-        frontmatter = yaml.safe_load(frontmatter_text)
-        if not isinstance(frontmatter, dict):
-            return False, "Frontmatter must be a YAML dictionary"
-    except yaml.YAMLError as e:
-        return False, f"Invalid YAML in frontmatter: {e}"
-
-    allowed_properties = {"name", "description", "license", "allowed-tools", "metadata"}
-
-    unexpected_keys = set(frontmatter.keys()) - allowed_properties
-    if unexpected_keys:
-        allowed = ", ".join(sorted(allowed_properties))
-        unexpected = ", ".join(sorted(unexpected_keys))
-        return (
-            False,
-            f"Unexpected key(s) in SKILL.md frontmatter: {unexpected}. Allowed properties are: {allowed}",
-        )
-
-    if "name" not in frontmatter:
-        return False, "Missing 'name' in frontmatter"
-    if "description" not in frontmatter:
-        return False, "Missing 'description' in frontmatter"
-
-    name = frontmatter.get("name", "")
-    if not isinstance(name, str):
-        return False, f"Name must be a string, got {type(name).__name__}"
-    name = name.strip()
-    if name:
-        if not re.match(r"^[a-z0-9-]+$", name):
-            return (
-                False,
-                f"Name '{name}' should be hyphen-case (lowercase letters, digits, and hyphens only)",
-            )
-        if name.startswith("-") or name.endswith("-") or "--" in name:
-            return (
-                False,
-                f"Name '{name}' cannot start/end with hyphen or contain consecutive hyphens",
-            )
-        if len(name) > MAX_SKILL_NAME_LENGTH:
-            return (
-                False,
-                f"Name is too long ({len(name)} characters). "
-                f"Maximum is {MAX_SKILL_NAME_LENGTH} characters.",
-            )
-
-    description = frontmatter.get("description", "")
-    if not isinstance(description, str):
-        return False, f"Description must be a string, got {type(description).__name__}"
-    description = description.strip()
-    if description:
-        if "<" in description or ">" in description:
-            return False, "Description cannot contain angle brackets (< or >)"
-        if len(description) > 1024:
-            return (
-                False,
-                f"Description is too long ({len(description)} characters). Maximum is 1024 characters.",
-            )
-
-    return True, "Skill is valid!"
-
-
-if __name__ == "__main__":
-    if len(sys.argv) != 2:
-        print("Usage: python quick_validate.py <skill_directory>")
-        sys.exit(1)
-
-    valid, message = validate_skill(sys.argv[1])
-    print(message)
-    sys.exit(0 if valid else 1)
diff --git a/skills/skill-installer/LICENSE.txt b/skills/skill-installer/LICENSE.txt
deleted file mode 100644
index d645695..0000000
--- a/skills/skill-installer/LICENSE.txt
+++ /dev/null
@@ -1,202 +0,0 @@
-
-                                 Apache License
-                           Version 2.0, January 2004
-                        http://www.apache.org/licenses/
-
-   TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION
-
-   1. Definitions.
-
-      "License" shall mean the terms and conditions for use, reproduction,
-      and distribution as defined by Sections 1 through 9 of this document.
-
-      "Licensor" shall mean the copyright owner or entity authorized by
-      the copyright owner that is granting the License.
-
-      "Legal Entity" shall mean the union of the acting entity and all
-      other entities that control, are controlled by, or are under common
-      control with that entity. For the purposes of this definition,
-      "control" means (i) the power, direct or indirect, to cause the
-      direction or management of such entity, whether by contract or
-      otherwise, or (ii) ownership of fifty percent (50%) or more of the
-      outstanding shares, or (iii) beneficial ownership of such entity.
-
-      "You" (or "Your") shall mean an individual or Legal Entity
-      exercising permissions granted by this License.
-
-      "Source" form shall mean the preferred form for making modifications,
-      including but not limited to software source code, documentation
-      source, and configuration files.
-
-      "Object" form shall mean any form resulting from mechanical
-      transformation or translation of a Source form, including but
-      not limited to compiled object code, generated documentation,
-      and conversions to other media types.
-
-      "Work" shall mean the work of authorship, whether in Source or
-      Object form, made available under the License, as indicated by a
-      copyright notice that is included in or attached to the work
-      (an example is provided in the Appendix below).
-
-      "Derivative Works" shall mean any work, whether in Source or Object
-      form, that is based on (or derived from) the Work and for which the
-      editorial revisions, annotations, elaborations, or other modifications
-      represent, as a whole, an original work of authorship. For the purposes
-      of this License, Derivative Works shall not include works that remain
-      separable from, or merely link (or bind by name) to the interfaces of,
-      the Work and Derivative Works thereof.
-
-      "Contribution" shall mean any work of authorship, including
-      the original version of the Work and any modifications or additions
-      to that Work or Derivative Works thereof, that is intentionally
-      submitted to Licensor for inclusion in the Work by the copyright owner
-      or by an individual or Legal Entity authorized to submit on behalf of
-      the copyright owner. For the purposes of this definition, "submitted"
-      means any form of electronic, verbal, or written communication sent
-      to the Licensor or its representatives, including but not limited to
-      communication on electronic mailing lists, source code control systems,
-      and issue tracking systems that are managed by, or on behalf of, the
-      Licensor for the purpose of discussing and improving the Work, but
-      excluding communication that is conspicuously marked or otherwise
-      designated in writing by the copyright owner as "Not a Contribution."
-
-      "Contributor" shall mean Licensor and any individual or Legal Entity
-      on behalf of whom a Contribution has been received by Licensor and
-      subsequently incorporated within the Work.
-
-   2. Grant of Copyright License. Subject to the terms and conditions of
-      this License, each Contributor hereby grants to You a perpetual,
-      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-      copyright license to reproduce, prepare Derivative Works of,
-      publicly display, publicly perform, sublicense, and distribute the
-      Work and such Derivative Works in Source or Object form.
-
-   3. Grant of Patent License. Subject to the terms and conditions of
-      this License, each Contributor hereby grants to You a perpetual,
-      worldwide, non-exclusive, no-charge, royalty-free, irrevocable
-      (except as stated in this section) patent license to make, have made,
-      use, offer to sell, sell, import, and otherwise transfer the Work,
-      where such license applies only to those patent claims licensable
-      by such Contributor that are necessarily infringed by their
-      Contribution(s) alone or by combination of their Contribution(s)
-      with the Work to which such Contribution(s) was submitted. If You
-      institute patent litigation against any entity (including a
-      cross-claim or counterclaim in a lawsuit) alleging that the Work
-      or a Contribution incorporated within the Work constitutes direct
-      or contributory patent infringement, then any patent licenses
-      granted to You under this License for that Work shall terminate
-      as of the date such litigation is filed.
-
-   4. Redistribution. You may reproduce and distribute copies of the
-      Work or Derivative Works thereof in any medium, with or without
-      modifications, and in Source or Object form, provided that You
-      meet the following conditions:
-
-      (a) You must give any other recipients of the Work or
-          Derivative Works a copy of this License; and
-
-      (b) You must cause any modified files to carry prominent notices
-          stating that You changed the files; and
-
-      (c) You must retain, in the Source form of any Derivative Works
-          that You distribute, all copyright, patent, trademark, and
-          attribution notices from the Source form of the Work,
-          excluding those notices that do not pertain to any part of
-          the Derivative Works; and
-
-      (d) If the Work includes a "NOTICE" text file as part of its
-          distribution, then any Derivative Works that You distribute must
-          include a readable copy of the attribution notices contained
-          within such NOTICE file, excluding those notices that do not
-          pertain to any part of the Derivative Works, in at least one
-          of the following places: within a NOTICE text file distributed
-          as part of the Derivative Works; within the Source form or
-          documentation, if provided along with the Derivative Works; or,
-          within a display generated by the Derivative Works, if and
-          wherever such third-party notices normally appear. The contents
-          of the NOTICE file are for informational purposes only and
-          do not modify the License. You may add Your own attribution
-          notices within Derivative Works that You distribute, alongside
-          or as an addendum to the NOTICE text from the Work, provided
-          that such additional attribution notices cannot be construed
-          as modifying the License.
-
-      You may add Your own copyright statement to Your modifications and
-      may provide additional or different license terms and conditions
-      for use, reproduction, or distribution of Your modifications, or
-      for any such Derivative Works as a whole, provided Your use,
-      reproduction, and distribution of the Work otherwise complies with
-      the conditions stated in this License.
-
-   5. Submission of Contributions. Unless You explicitly state otherwise,
-      any Contribution intentionally submitted for inclusion in the Work
-      by You to the Licensor shall be under the terms and conditions of
-      this License, without any additional terms or conditions.
-      Notwithstanding the above, nothing herein shall supersede or modify
-      the terms of any separate license agreement you may have executed
-      with Licensor regarding such Contributions.
-
-   6. Trademarks. This License does not grant permission to use the trade
-      names, trademarks, service marks, or product names of the Licensor,
-      except as required for reasonable and customary use in describing the
-      origin of the Work and reproducing the content of the NOTICE file.
-
-   7. Disclaimer of Warranty. Unless required by applicable law or
-      agreed to in writing, Licensor provides the Work (and each
-      Contributor provides its Contributions) on an "AS IS" BASIS,
-      WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or
-      implied, including, without limitation, any warranties or conditions
-      of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A
-      PARTICULAR PURPOSE. You are solely responsible for determining the
-      appropriateness of using or redistributing the Work and assume any
-      risks associated with Your exercise of permissions under this License.
-
-   8. Limitation of Liability. In no event and under no legal theory,
-      whether in tort (including negligence), contract, or otherwise,
-      unless required by applicable law (such as deliberate and grossly
-      negligent acts) or agreed to in writing, shall any Contributor be
-      liable to You for damages, including any direct, indirect, special,
-      incidental, or consequential damages of any character arising as a
-      result of this License or out of the use or inability to use the
-      Work (including but not limited to damages for loss of goodwill,
-      work stoppage, computer failure or malfunction, or any and all
-      other commercial damages or losses), even if such Contributor
-      has been advised of the possibility of such damages.
-
-   9. Accepting Warranty or Additional Liability. While redistributing
-      the Work or Derivative Works thereof, You may choose to offer,
-      and charge a fee for, acceptance of support, warranty, indemnity,
-      or other liability obligations and/or rights consistent with this
-      License. However, in accepting such obligations, You may act only
-      on Your own behalf and on Your sole responsibility, not on behalf
-      of any other Contributor, and only if You agree to indemnify,
-      defend, and hold each Contributor harmless for any liability
-      incurred by, or claims asserted against, such Contributor by reason
-      of your accepting any such warranty or additional liability.
-
-   END OF TERMS AND CONDITIONS
-
-   APPENDIX: How to apply the Apache License to your work.
-
-      To apply the Apache License to your work, attach the following
-      boilerplate notice, with the fields enclosed by brackets "[]"
-      replaced with your own identifying information. (Don't include
-      the brackets!)  The text should be enclosed in the appropriate
-      comment syntax for the file format. We also recommend that a
-      file or class name and description of purpose be included on the
-      same "printed page" as the copyright notice for easier
-      identification within third-party archives.
-
-   Copyright [yyyy] [name of copyright owner]
-
-   Licensed under the Apache License, Version 2.0 (the "License");
-   you may not use this file except in compliance with the License.
-   You may obtain a copy of the License at
-
-       http://www.apache.org/licenses/LICENSE-2.0
-
-   Unless required by applicable law or agreed to in writing, software
-   distributed under the License is distributed on an "AS IS" BASIS,
-   WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-   See the License for the specific language governing permissions and
-   limitations under the License.
diff --git a/skills/skill-installer/SKILL.md b/skills/skill-installer/SKILL.md
deleted file mode 100644
index 313626a..0000000
--- a/skills/skill-installer/SKILL.md
+++ /dev/null
@@ -1,58 +0,0 @@
----
-name: skill-installer
-description: Install Codex skills into $CODEX_HOME/skills from a curated list or a GitHub repo path. Use when a user asks to list installable skills, install a curated skill, or install a skill from another repo (including private repos).
-metadata:
-  short-description: Install curated skills from openai/skills or other repos
----
-
-# Skill Installer
-
-Helps install skills. By default these are from https://github.com/openai/skills/tree/main/skills/.curated, but users can also provide other locations. Experimental skills live in https://github.com/openai/skills/tree/main/skills/.experimental and can be installed the same way.
-
-Use the helper scripts based on the task:
-- List skills when the user asks what is available, or if the user uses this skill without specifying what to do. Default listing is `.curated`, but you can pass `--path skills/.experimental` when they ask about experimental skills.
-- Install from the curated list when the user provides a skill name.
-- Install from another repo when the user provides a GitHub repo/path (including private repos).
-
-Install skills with the helper scripts.
-
-## Communication
-
-When listing skills, output approximately as follows, depending on the context of the user's request. If they ask about experimental skills, list from `.experimental` instead of `.curated` and label the source accordingly:
-"""
-Skills from {repo}:
-1. skill-1
-2. skill-2 (already installed)
-3. ...
-Which ones would you like installed?
-"""
-
-After installing a skill, tell the user: "Restart Codex to pick up new skills."
-
-## Scripts
-
-All of these scripts use network, so when running in the sandbox, request escalation when running them.
-
-- `scripts/list-skills.py` (prints skills list with installed annotations)
-- `scripts/list-skills.py --format json`
-- Example (experimental list): `scripts/list-skills.py --path skills/.experimental`
-- `scripts/install-skill-from-github.py --repo <owner>/<repo> --path <path/to/skill> [<path/to/skill> ...]`
-- `scripts/install-skill-from-github.py --url https://github.com/<owner>/<repo>/tree/<ref>/<path>`
-- Example (experimental skill): `scripts/install-skill-from-github.py --repo openai/skills --path skills/.experimental/<skill-name>`
-
-## Behavior and Options
-
-- Defaults to direct download for public GitHub repos.
-- If download fails with auth/permission errors, falls back to git sparse checkout.
-- Aborts if the destination skill directory already exists.
-- Installs into `$CODEX_HOME/skills/<skill-name>` (defaults to `~/.codex/skills`).
-- Multiple `--path` values install multiple skills in one run, each named from the path basename unless `--name` is supplied.
-- Options: `--ref <ref>` (default `main`), `--dest <path>`, `--method auto|download|git`.
-
-## Notes
-
-- Curated listing is fetched from `https://github.com/openai/skills/tree/main/skills/.curated` via the GitHub API. If it is unavailable, explain the error and exit.
-- Private GitHub repos can be accessed via existing git credentials or optional `GITHUB_TOKEN`/`GH_TOKEN` for download.
-- Git fallback tries HTTPS first, then SSH.
-- The skills at https://github.com/openai/skills/tree/main/skills/.system are preinstalled, so no need to help users install those. If they ask, just explain this. If they insist, you can download and overwrite.
-- Installed annotations come from `$CODEX_HOME/skills`.
diff --git a/skills/skill-installer/agents/openai.yaml b/skills/skill-installer/agents/openai.yaml
deleted file mode 100644
index 88d40cd..0000000
--- a/skills/skill-installer/agents/openai.yaml
+++ /dev/null
@@ -1,5 +0,0 @@
-interface:
-  display_name: "Skill Installer"
-  short_description: "Install curated skills from openai/skills or other repos"
-  icon_small: "./assets/skill-installer-small.svg"
-  icon_large: "./assets/skill-installer.png"
diff --git a/skills/skill-installer/assets/skill-installer-small.svg b/skills/skill-installer/assets/skill-installer-small.svg
deleted file mode 100644
index ccfc034..0000000
--- a/skills/skill-installer/assets/skill-installer-small.svg
+++ /dev/null
@@ -1,3 +0,0 @@
-<svg xmlns="http://www.w3.org/2000/svg" width="16" height="16" fill="currentColor" viewBox="0 0 16 16">
-  <path fill="#0D0D0D" d="M2.145 3.959a2.033 2.033 0 0 1 2.022-1.824h5.966c.551 0 .997 0 1.357.029.367.03.692.093.993.246l.174.098c.397.243.72.593.932 1.01l.053.114c.116.269.168.557.194.878.03.36.03.805.03 1.357v4.3a2.365 2.365 0 0 1-2.366 2.365h-1.312a2.198 2.198 0 0 1-4.377 0H4.167A2.032 2.032 0 0 1 2.135 10.5V9.333l.004-.088A.865.865 0 0 1 3 8.468l.116-.006A1.135 1.135 0 0 0 3 6.199a.865.865 0 0 1-.865-.864V4.167l.01-.208Zm1.054 1.186a2.198 2.198 0 0 1 0 4.376v.98c0 .534.433.967.968.967H6l.089.004a.866.866 0 0 1 .776.861 1.135 1.135 0 0 0 2.27 0c0-.478.387-.865.865-.865h1.5c.719 0 1.301-.583 1.301-1.301v-4.3c0-.57 0-.964-.025-1.27a1.933 1.933 0 0 0-.09-.493L12.642 4a1.47 1.47 0 0 0-.541-.585l-.102-.056c-.126-.065-.295-.11-.596-.135a17.31 17.31 0 0 0-1.27-.025H4.167a.968.968 0 0 0-.968.968v.978Z"/>
-</svg>
diff --git a/skills/skill-installer/assets/skill-installer.png b/skills/skill-installer/assets/skill-installer.png
deleted file mode 100644
index 2977cd5bb49b3b8bd50d8bf476d7cffbb3f88a46..0000000000000000000000000000000000000000
GIT binary patch
literal 0
HcmV?d00001

literal 1086
zcmV-E1i|}>P)<h;3K|Lk000e1NJLTq003kF003kN1^@s6aN?Cz00009a7bBm000XU
z000XU0RWnu7ytkO0drDELIAGL9O(c600d`2O+f$vv5yP<VFdsH1Jg-FK~#7F?cL8#
z6Hye$@!!m}r7gu`q4F=mKXIWfR1#c}xWFZkz|)xc0KSA9R=RSljSE@0z_@UM$Uh@!
zfKm(;XgjTQY^otF=(KaonK|c^kf2r}e7SSy-aAA<DW#NBN-3q3Qc9_Cu;5eU<&!zU
zo&z(dZ^pq;A+@+z@bed9@Xels)p!Qgu7aNz+fb}%5N0$8Ga7^$4Z@5DVMc>6qd}PI
zU}1Q*8dV$h?`gQj1R5vJPv45w5fz~cLLuCh0o2wr7yk^=5sDx*5-Ll>Xp|j99s4;%
zQVhaANX@%UNr^#N2cgm7dK0)Ltb@2~8A!uANPWK#(lEbd$(cJ^cn7KaK4A_$)<LYa
z3u#yfv4_qe4eKDz$SI`ZJwirL#9g-7uhioY4<HHqAT*D}rVb%RC=RG%caD&lDT=s!
zh2}hj=95IWg8EJhwT(=m8;<tCHN>)6Sba%Y@i-cF@4&0#eXMdBwS%I!9;%>MLUm$j
zrCd1PXrVVcuxk8{|NH&3w<GY&PWK}|HvTulxsPLe7mj2S4!z}aa1Rer+uQ9)n9v>J
zwpj5xtS;6mPHqVC8|_7OywPK))2M818jm9KAqOWj&~}U#8byi8o8IU#yT2wbh!syD
zHZqD%P!uPhhe_gsIGN0aIm3_G^_<aBA}@$HcXa)43}#`9tRRll)#zxUyE9Wn1+l$#
zMj*U-$P|5)lo?S$0$W44=C*MBFAN{OZ|`S!S04aJ0Ze{VAA!W>=OW3~=jat$Bqr}o
zwed>-54oBfA#OmM02NtJp6DFHjJY6*fR0~N$B@KakW2uFN)*+pK@xL8a=*~E{5GU9
z7lgjE^FPor8XehvNMm+VAKmi4upORROsoYr4~2-?AT&zue)b<_;+x3PLCl{R(swyU
z`8f#`M=pQu<Vt5Z1pOr-U248x_4cevot=4HwcZ@zw!YAG3EQ1$uHb3GM~g=qJ*lJS
zO+YuJV*bVXUmp(wd$)lvPn++DL~qa3DGXhXdVxkv|1vPV-i)$2jWCG*N}a+ye(mjv
zy+att**c*h`3-O<YcFf&m3O$r`&L?35W0LZA0_g3dv7g+GkHO>JK#)Skp2=llNY2K
z(32;I$O}>$17`w*@ZRH+7i4u7oXHA8`&rC48s!9`5TEA3U1)!T$`_i*mloLHVUcJD
zp#WcJn{OeAL8236`~Lrp!}4JBZfavXG$C4|6Xe4JqCg)dWk!QAqd}O_Ak1hGW;6&h
z8iW}Q!b~R%!vfF$u!G|#Wf!27Qc5YMlu}A5rBp=y0R^AlXy0glYybcN07*qoM6N<$
Ef|C;DQ~&?~

diff --git a/skills/skill-installer/scripts/github_utils.py b/skills/skill-installer/scripts/github_utils.py
deleted file mode 100644
index 711f597..0000000
--- a/skills/skill-installer/scripts/github_utils.py
+++ /dev/null
@@ -1,21 +0,0 @@
-#!/usr/bin/env python3
-"""Shared GitHub helpers for skill install scripts."""
-
-from __future__ import annotations
-
-import os
-import urllib.request
-
-
-def github_request(url: str, user_agent: str) -> bytes:
-    headers = {"User-Agent": user_agent}
-    token = os.environ.get("GITHUB_TOKEN") or os.environ.get("GH_TOKEN")
-    if token:
-        headers["Authorization"] = f"token {token}"
-    req = urllib.request.Request(url, headers=headers)
-    with urllib.request.urlopen(req) as resp:
-        return resp.read()
-
-
-def github_api_contents_url(repo: str, path: str, ref: str) -> str:
-    return f"https://api.github.com/repos/{repo}/contents/{path}?ref={ref}"
diff --git a/skills/skill-installer/scripts/install-skill-from-github.py b/skills/skill-installer/scripts/install-skill-from-github.py
deleted file mode 100644
index 1c8ce89..0000000
--- a/skills/skill-installer/scripts/install-skill-from-github.py
+++ /dev/null
@@ -1,308 +0,0 @@
-#!/usr/bin/env python3
-"""Install a skill from a GitHub repo path into $CODEX_HOME/skills."""
-
-from __future__ import annotations
-
-import argparse
-from dataclasses import dataclass
-import os
-import shutil
-import subprocess
-import sys
-import tempfile
-import urllib.error
-import urllib.parse
-import zipfile
-
-from github_utils import github_request
-DEFAULT_REF = "main"
-
-
-@dataclass
-class Args:
-    url: str | None = None
-    repo: str | None = None
-    path: list[str] | None = None
-    ref: str = DEFAULT_REF
-    dest: str | None = None
-    name: str | None = None
-    method: str = "auto"
-
-
-@dataclass
-class Source:
-    owner: str
-    repo: str
-    ref: str
-    paths: list[str]
-    repo_url: str | None = None
-
-
-class InstallError(Exception):
-    pass
-
-
-def _codex_home() -> str:
-    return os.environ.get("CODEX_HOME", os.path.expanduser("~/.codex"))
-
-
-def _tmp_root() -> str:
-    base = os.path.join(tempfile.gettempdir(), "codex")
-    os.makedirs(base, exist_ok=True)
-    return base
-
-
-def _request(url: str) -> bytes:
-    return github_request(url, "codex-skill-install")
-
-
-def _parse_github_url(url: str, default_ref: str) -> tuple[str, str, str, str | None]:
-    parsed = urllib.parse.urlparse(url)
-    if parsed.netloc != "github.com":
-        raise InstallError("Only GitHub URLs are supported for download mode.")
-    parts = [p for p in parsed.path.split("/") if p]
-    if len(parts) < 2:
-        raise InstallError("Invalid GitHub URL.")
-    owner, repo = parts[0], parts[1]
-    ref = default_ref
-    subpath = ""
-    if len(parts) > 2:
-        if parts[2] in ("tree", "blob"):
-            if len(parts) < 4:
-                raise InstallError("GitHub URL missing ref or path.")
-            ref = parts[3]
-            subpath = "/".join(parts[4:])
-        else:
-            subpath = "/".join(parts[2:])
-    return owner, repo, ref, subpath or None
-
-
-def _download_repo_zip(owner: str, repo: str, ref: str, dest_dir: str) -> str:
-    zip_url = f"https://codeload.github.com/{owner}/{repo}/zip/{ref}"
-    zip_path = os.path.join(dest_dir, "repo.zip")
-    try:
-        payload = _request(zip_url)
-    except urllib.error.HTTPError as exc:
-        raise InstallError(f"Download failed: HTTP {exc.code}") from exc
-    with open(zip_path, "wb") as file_handle:
-        file_handle.write(payload)
-    with zipfile.ZipFile(zip_path, "r") as zip_file:
-        _safe_extract_zip(zip_file, dest_dir)
-        top_levels = {name.split("/")[0] for name in zip_file.namelist() if name}
-    if not top_levels:
-        raise InstallError("Downloaded archive was empty.")
-    if len(top_levels) != 1:
-        raise InstallError("Unexpected archive layout.")
-    return os.path.join(dest_dir, next(iter(top_levels)))
-
-
-def _run_git(args: list[str]) -> None:
-    result = subprocess.run(args, stdout=subprocess.PIPE, stderr=subprocess.PIPE, text=True)
-    if result.returncode != 0:
-        raise InstallError(result.stderr.strip() or "Git command failed.")
-
-
-def _safe_extract_zip(zip_file: zipfile.ZipFile, dest_dir: str) -> None:
-    dest_root = os.path.realpath(dest_dir)
-    for info in zip_file.infolist():
-        extracted_path = os.path.realpath(os.path.join(dest_dir, info.filename))
-        if extracted_path == dest_root or extracted_path.startswith(dest_root + os.sep):
-            continue
-        raise InstallError("Archive contains files outside the destination.")
-    zip_file.extractall(dest_dir)
-
-
-def _validate_relative_path(path: str) -> None:
-    if os.path.isabs(path) or os.path.normpath(path).startswith(".."):
-        raise InstallError("Skill path must be a relative path inside the repo.")
-
-
-def _validate_skill_name(name: str) -> None:
-    altsep = os.path.altsep
-    if not name or os.path.sep in name or (altsep and altsep in name):
-        raise InstallError("Skill name must be a single path segment.")
-    if name in (".", ".."):
-        raise InstallError("Invalid skill name.")
-
-
-def _git_sparse_checkout(repo_url: str, ref: str, paths: list[str], dest_dir: str) -> str:
-    repo_dir = os.path.join(dest_dir, "repo")
-    clone_cmd = [
-        "git",
-        "clone",
-        "--filter=blob:none",
-        "--depth",
-        "1",
-        "--sparse",
-        "--single-branch",
-        "--branch",
-        ref,
-        repo_url,
-        repo_dir,
-    ]
-    try:
-        _run_git(clone_cmd)
-    except InstallError:
-        _run_git(
-            [
-                "git",
-                "clone",
-                "--filter=blob:none",
-                "--depth",
-                "1",
-                "--sparse",
-                "--single-branch",
-                repo_url,
-                repo_dir,
-            ]
-        )
-    _run_git(["git", "-C", repo_dir, "sparse-checkout", "set", *paths])
-    _run_git(["git", "-C", repo_dir, "checkout", ref])
-    return repo_dir
-
-
-def _validate_skill(path: str) -> None:
-    if not os.path.isdir(path):
-        raise InstallError(f"Skill path not found: {path}")
-    skill_md = os.path.join(path, "SKILL.md")
-    if not os.path.isfile(skill_md):
-        raise InstallError("SKILL.md not found in selected skill directory.")
-
-
-def _copy_skill(src: str, dest_dir: str) -> None:
-    os.makedirs(os.path.dirname(dest_dir), exist_ok=True)
-    if os.path.exists(dest_dir):
-        raise InstallError(f"Destination already exists: {dest_dir}")
-    shutil.copytree(src, dest_dir)
-
-
-def _build_repo_url(owner: str, repo: str) -> str:
-    return f"https://github.com/{owner}/{repo}.git"
-
-
-def _build_repo_ssh(owner: str, repo: str) -> str:
-    return f"git@github.com:{owner}/{repo}.git"
-
-
-def _prepare_repo(source: Source, method: str, tmp_dir: str) -> str:
-    if method in ("download", "auto"):
-        try:
-            return _download_repo_zip(source.owner, source.repo, source.ref, tmp_dir)
-        except InstallError as exc:
-            if method == "download":
-                raise
-            err_msg = str(exc)
-            if "HTTP 401" in err_msg or "HTTP 403" in err_msg or "HTTP 404" in err_msg:
-                pass
-            else:
-                raise
-    if method in ("git", "auto"):
-        repo_url = source.repo_url or _build_repo_url(source.owner, source.repo)
-        try:
-            return _git_sparse_checkout(repo_url, source.ref, source.paths, tmp_dir)
-        except InstallError:
-            repo_url = _build_repo_ssh(source.owner, source.repo)
-            return _git_sparse_checkout(repo_url, source.ref, source.paths, tmp_dir)
-    raise InstallError("Unsupported method.")
-
-
-def _resolve_source(args: Args) -> Source:
-    if args.url:
-        owner, repo, ref, url_path = _parse_github_url(args.url, args.ref)
-        if args.path is not None:
-            paths = list(args.path)
-        elif url_path:
-            paths = [url_path]
-        else:
-            paths = []
-        if not paths:
-            raise InstallError("Missing --path for GitHub URL.")
-        return Source(owner=owner, repo=repo, ref=ref, paths=paths)
-
-    if not args.repo:
-        raise InstallError("Provide --repo or --url.")
-    if "://" in args.repo:
-        return _resolve_source(
-            Args(url=args.repo, repo=None, path=args.path, ref=args.ref)
-        )
-
-    repo_parts = [p for p in args.repo.split("/") if p]
-    if len(repo_parts) != 2:
-        raise InstallError("--repo must be in owner/repo format.")
-    if not args.path:
-        raise InstallError("Missing --path for --repo.")
-    paths = list(args.path)
-    return Source(
-        owner=repo_parts[0],
-        repo=repo_parts[1],
-        ref=args.ref,
-        paths=paths,
-    )
-
-
-def _default_dest() -> str:
-    return os.path.join(_codex_home(), "skills")
-
-
-def _parse_args(argv: list[str]) -> Args:
-    parser = argparse.ArgumentParser(description="Install a skill from GitHub.")
-    parser.add_argument("--repo", help="owner/repo")
-    parser.add_argument("--url", help="https://github.com/owner/repo[/tree/ref/path]")
-    parser.add_argument(
-        "--path",
-        nargs="+",
-        help="Path(s) to skill(s) inside repo",
-    )
-    parser.add_argument("--ref", default=DEFAULT_REF)
-    parser.add_argument("--dest", help="Destination skills directory")
-    parser.add_argument(
-        "--name", help="Destination skill name (defaults to basename of path)"
-    )
-    parser.add_argument(
-        "--method",
-        choices=["auto", "download", "git"],
-        default="auto",
-    )
-    return parser.parse_args(argv, namespace=Args())
-
-
-def main(argv: list[str]) -> int:
-    args = _parse_args(argv)
-    try:
-        source = _resolve_source(args)
-        source.ref = source.ref or args.ref
-        if not source.paths:
-            raise InstallError("No skill paths provided.")
-        for path in source.paths:
-            _validate_relative_path(path)
-        dest_root = args.dest or _default_dest()
-        tmp_dir = tempfile.mkdtemp(prefix="skill-install-", dir=_tmp_root())
-        try:
-            repo_root = _prepare_repo(source, args.method, tmp_dir)
-            installed = []
-            for path in source.paths:
-                skill_name = args.name if len(source.paths) == 1 else None
-                skill_name = skill_name or os.path.basename(path.rstrip("/"))
-                _validate_skill_name(skill_name)
-                if not skill_name:
-                    raise InstallError("Unable to derive skill name.")
-                dest_dir = os.path.join(dest_root, skill_name)
-                if os.path.exists(dest_dir):
-                    raise InstallError(f"Destination already exists: {dest_dir}")
-                skill_src = os.path.join(repo_root, path)
-                _validate_skill(skill_src)
-                _copy_skill(skill_src, dest_dir)
-                installed.append((skill_name, dest_dir))
-        finally:
-            if os.path.isdir(tmp_dir):
-                shutil.rmtree(tmp_dir, ignore_errors=True)
-        for skill_name, dest_dir in installed:
-            print(f"Installed {skill_name} to {dest_dir}")
-        return 0
-    except InstallError as exc:
-        print(f"Error: {exc}", file=sys.stderr)
-        return 1
-
-
-if __name__ == "__main__":
-    raise SystemExit(main(sys.argv[1:]))
diff --git a/skills/skill-installer/scripts/list-skills.py b/skills/skill-installer/scripts/list-skills.py
deleted file mode 100644
index 0977c29..0000000
--- a/skills/skill-installer/scripts/list-skills.py
+++ /dev/null
@@ -1,107 +0,0 @@
-#!/usr/bin/env python3
-"""List skills from a GitHub repo path."""
-
-from __future__ import annotations
-
-import argparse
-import json
-import os
-import sys
-import urllib.error
-
-from github_utils import github_api_contents_url, github_request
-
-DEFAULT_REPO = "openai/skills"
-DEFAULT_PATH = "skills/.curated"
-DEFAULT_REF = "main"
-
-
-class ListError(Exception):
-    pass
-
-
-class Args(argparse.Namespace):
-    repo: str
-    path: str
-    ref: str
-    format: str
-
-
-def _request(url: str) -> bytes:
-    return github_request(url, "codex-skill-list")
-
-
-def _codex_home() -> str:
-    return os.environ.get("CODEX_HOME", os.path.expanduser("~/.codex"))
-
-
-def _installed_skills() -> set[str]:
-    root = os.path.join(_codex_home(), "skills")
-    if not os.path.isdir(root):
-        return set()
-    entries = set()
-    for name in os.listdir(root):
-        path = os.path.join(root, name)
-        if os.path.isdir(path):
-            entries.add(name)
-    return entries
-
-
-def _list_skills(repo: str, path: str, ref: str) -> list[str]:
-    api_url = github_api_contents_url(repo, path, ref)
-    try:
-        payload = _request(api_url)
-    except urllib.error.HTTPError as exc:
-        if exc.code == 404:
-            raise ListError(
-                "Skills path not found: "
-                f"https://github.com/{repo}/tree/{ref}/{path}"
-            ) from exc
-        raise ListError(f"Failed to fetch skills: HTTP {exc.code}") from exc
-    data = json.loads(payload.decode("utf-8"))
-    if not isinstance(data, list):
-        raise ListError("Unexpected skills listing response.")
-    skills = [item["name"] for item in data if item.get("type") == "dir"]
-    return sorted(skills)
-
-
-def _parse_args(argv: list[str]) -> Args:
-    parser = argparse.ArgumentParser(description="List skills.")
-    parser.add_argument("--repo", default=DEFAULT_REPO)
-    parser.add_argument(
-        "--path",
-        default=DEFAULT_PATH,
-        help="Repo path to list (default: skills/.curated)",
-    )
-    parser.add_argument("--ref", default=DEFAULT_REF)
-    parser.add_argument(
-        "--format",
-        choices=["text", "json"],
-        default="text",
-        help="Output format",
-    )
-    return parser.parse_args(argv, namespace=Args())
-
-
-def main(argv: list[str]) -> int:
-    args = _parse_args(argv)
-    try:
-        skills = _list_skills(args.repo, args.path, args.ref)
-        installed = _installed_skills()
-        if args.format == "json":
-            payload = [
-                {"name": name, "installed": name in installed} for name in skills
-            ]
-            print(json.dumps(payload))
-        else:
-            for idx, name in enumerate(skills, start=1):
-                suffix = " (already installed)" if name in installed else ""
-                print(f"{idx}. {name}{suffix}")
-        return 0
-    except ListError as exc:
-        print(f"Error: {exc}", file=sys.stderr)
-        return 1
-
-
-if __name__ == "__main__":
-    raise SystemExit(main(sys.argv[1:]))

From ce5b88600f25d4cf8444f0fe4bd0242cbc5cee50 Mon Sep 17 00:00:00 2001
From: ActivePeter <1020401660@qq.com>
Date: Wed, 24 Jun 2026 13:31:08 +0800
Subject: [PATCH 11/13] test

---
 deployment/tests/test_gen_bare_deploy_bash.py |  3 +-
 examples/fluxon_quick_start/start.py          |  6 +-
 examples/start_kv_and_fs_svc.py               |  6 +-
 examples/start_master_owner.py                |  6 +-
 ...15\347\275\256\346\200\273\350\247\210.md" |  3 +-
 ...13\350\257\225\346\265\201\347\250\213.md" |  2 +-
 ...04\345\222\214\346\246\202\345\277\265.md" |  2 +-
 ...15\345\212\241\345\271\263\351\235\242.md" |  4 +-
 ...7 - 3 - KV-RPC\346\216\245\345\217\243.md" |  9 +-
 ...0\267 - 4 - MQ\346\216\245\345\217\243.md" |  6 +-
 ...0\267 - 5 - FS\346\216\245\345\217\243.md" |  4 +-
 .../User - 1 - Architecture and Concepts.md   |  2 +-
 .../User - 3 - KV and RPC Interface.md        |  9 +-
 .../user_doc/User - 4 - MQ Interface.md       |  1 +
 fluxon_py/config.py                           | 14 +--
 .../tests/fluxon_fs_transfer_tikv_support.py  |  4 +-
 ...est_backend_relay_deployconf.template.yaml | 12 +--
 fluxon_py/tests/test_config.py                | 13 +--
 .../tests/test_mq/test_example_ctrl_c_exit.py |  4 +-
 fluxon_rs/fluxon_kv/src/config.rs             | 91 +++++++------------
 .../external_client_test.rs                   |  4 +-
 fluxon_rs/fluxon_kv/src/kv_test.rs            |  4 +-
 fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs    |  2 +-
 fluxon_rs/fluxon_kv/src/lib.rs                | 13 ++-
 .../fluxon_kv/src/memholder/memholder_test.rs |  4 +-
 fluxon_test_stack/deployconf_testbed.yml      |  3 +-
 fluxon_test_stack/test_runner.py              | 11 +--
 .../tests/test_ci_2_virt_node_contract.py     |  4 +-
 .../test_test_runner_testbed_contract.py      | 10 +-
 .../tests/test_quick_start_release_only.py    |  5 +-
 30 files changed, 99 insertions(+), 162 deletions(-)

diff --git a/deployment/tests/test_gen_bare_deploy_bash.py b/deployment/tests/test_gen_bare_deploy_bash.py
index 0ca0a79..21f11a6 100644
--- a/deployment/tests/test_gen_bare_deploy_bash.py
+++ b/deployment/tests/test_gen_bare_deploy_bash.py
@@ -400,8 +400,7 @@ def test_normalized_testbed_owner_emits_large_file_paths() -> None:
 
         script = (outdir / "entrypoint__fluxon-self-host2-fluxon_core_controller__owner.sh").read_text(encoding="utf-8")
         assert 'large_file_paths:' in script, script
-        assert 'log_root_path: "${HOSTWORKDIR}/large/log/owner_${NODE_ID}"' in script, script
-        assert 'cache_root_path: "${HOSTWORKDIR}/large/cache/owner_${NODE_ID}"' in script, script
+        assert '- "${HOSTWORKDIR}/large/owner_${NODE_ID}"' in script, script
         print("PASS: test_normalized_testbed_owner_emits_large_file_paths")
 
 
diff --git a/examples/fluxon_quick_start/start.py b/examples/fluxon_quick_start/start.py
index 472f45c..1ee0acf 100644
--- a/examples/fluxon_quick_start/start.py
+++ b/examples/fluxon_quick_start/start.py
@@ -528,10 +528,8 @@ def _monitoring_block(greptime_http_port: int) -> Dict[str, Any]:
     }
 
 
-def _owner_large_file_paths(workdir: Path) -> Dict[str, str]:
-    return {
-        "root_paths": [str(workdir / "large" / "owner")],
-    }
+def _owner_large_file_paths(workdir: Path) -> List[str]:
+    return [str(workdir / "large" / "owner")]
 
 
 def _gen_kv_config(etcd_ep: str, cluster: str, master_port: int, kv_http_port: int,
diff --git a/examples/start_kv_and_fs_svc.py b/examples/start_kv_and_fs_svc.py
index b79043c..9cec14f 100644
--- a/examples/start_kv_and_fs_svc.py
+++ b/examples/start_kv_and_fs_svc.py
@@ -38,10 +38,8 @@
 FS_MASTER_ACCESS_DB_PATH = (WORKDIR / "fs_master" / "access.db").resolve()
 
 
-def build_owner_large_file_paths() -> dict:
-    return {
-        "root_paths": [str((WORKDIR / "large" / "owner").resolve())],
-    }
+def build_owner_large_file_paths() -> list[str]:
+    return [str((WORKDIR / "large" / "owner").resolve())]
 
 
 def main() -> None:
diff --git a/examples/start_master_owner.py b/examples/start_master_owner.py
index fbfb600..078450b 100644
--- a/examples/start_master_owner.py
+++ b/examples/start_master_owner.py
@@ -23,10 +23,8 @@
 OWNER_DRAM_BYTES = 1073741824
 
 
-def build_owner_large_file_paths() -> dict:
-    return {
-        "root_paths": [str((WORKDIR / "large" / "owner").resolve())],
-    }
+def build_owner_large_file_paths() -> list[str]:
+    return [str((WORKDIR / "large" / "owner").resolve())]
 
 
 def main() -> None:
diff --git "a/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md" "b/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
index 7f273a1..50e2b38 100644
--- "a/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
+++ "b/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
@@ -285,8 +285,7 @@ fluxonkv_spec:
   # owner 必须声明大文件根目录列表；运行时按数组顺序选择第一个可用 root，
   # 日志和 cache 等子目录都从固定相对位置派生
   large_file_paths:
-    root_paths:
-      - /var/lib/fluxon/large
+    - /var/lib/fluxon/large
 
   # 可选
   p2p_listen_port: 31001
diff --git "a/fluxon_doc_cn/design/teststack_1_\345\275\223\345\211\215\346\236\266\346\236\204\344\270\216CI\346\265\213\350\257\225\346\265\201\347\250\213.md" "b/fluxon_doc_cn/design/teststack_1_\345\275\223\345\211\215\346\236\266\346\236\204\344\270\216CI\346\265\213\350\257\225\346\265\201\347\250\213.md"
index ca85ac6..df93b67 100644
--- "a/fluxon_doc_cn/design/teststack_1_\345\275\223\345\211\215\346\236\266\346\236\204\344\270\216CI\346\265\213\350\257\225\346\265\201\347\250\213.md"
+++ "b/fluxon_doc_cn/design/teststack_1_\345\275\223\345\211\215\346\236\266\346\236\204\344\270\216CI\346\265\213\350\257\225\346\265\201\347\250\213.md"
@@ -382,7 +382,7 @@ deploy.instances 不写死在 suite 中。Runner 会结合 scale、profile 和
 
 **稳定结论：**
 
-- owner 模式配置一律必须显式提供 `fluxonkv_spec.large_file_paths.root_paths`，并按数组顺序表达大文件根目录优先级。
+- owner 模式配置一律必须显式提供 `fluxonkv_spec.large_file_paths`，并按数组顺序表达大文件根目录优先级。
 - `fluxonkv_spec.p2p_listen_port` 不是 owner 模式的必填项；是否显式写入，取决于具体分支的运行契约。
 - 不要把 `TEST_STACK` case-local owner 的显式端口分配规则，复制到 shared testbed / CI owner 配置上。
 
diff --git "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 1 - \346\236\266\346\236\204\345\222\214\346\246\202\345\277\265.md" "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 1 - \346\236\266\346\236\204\345\222\214\346\246\202\345\277\265.md"
index e83afe3..f85811d 100644
--- "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 1 - \346\236\266\346\236\204\345\222\214\346\246\202\345\277\265.md"	
+++ "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 1 - \346\236\266\346\236\204\345\222\214\346\246\202\345\277\265.md"	
@@ -62,7 +62,7 @@
 
 **`shared_memory_path`** — 共享内存目录，同机进程通过它附着到同一内存池；这是 mmap / data plane 的本机 authority。
 
-**`shared_file_path`** — 共享文件目录，`shared.json`、日志、profile 等本机共享文件位于这里；这是 file / metadata attachment 的本机 authority。
+**`shared_file_path`** — 共享文件目录，`shared.json` 与 peer metadata 等本机共享文件位于这里；这是 file / metadata attachment 的本机 authority。
 
 **`log_dir`** — master 自己的日志目录 authority。master 运行时会在这个目录下继续派生 cluster 级日志和 profile 子目录。
 
diff --git "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 2 - \346\234\215\345\212\241\345\271\263\351\235\242.md" "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 2 - \346\234\215\345\212\241\345\271\263\351\235\242.md"
index d31ba03..5daa633 100644
--- "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 2 - \346\234\215\345\212\241\345\271\263\351\235\242.md"	
+++ "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 2 - \346\234\215\345\212\241\345\271\263\351\235\242.md"	
@@ -312,9 +312,7 @@ def build_owner_config() -> dict:
             "shared_memory_path": str(SHARED_MEMORY_PATH),
             "shared_file_path": str(SHARED_FILE_PATH),
             "sub_cluster": "default",
-            "large_file_paths": {
-                "root_paths": [str((WORKDIR / "large" / "owner").resolve())],
-            },
+            "large_file_paths": [str((WORKDIR / "large" / "owner").resolve())],
         },
     }
 
diff --git "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 3 - KV-RPC\346\216\245\345\217\243.md" "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 3 - KV-RPC\346\216\245\345\217\243.md"
index 97affbf..55d4cd1 100644
--- "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 3 - KV-RPC\346\216\245\345\217\243.md"	
+++ "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 3 - KV-RPC\346\216\245\345\217\243.md"	
@@ -173,9 +173,7 @@ def build_owner_config() -> dict:
             "shared_memory_path": str(SHARED_MEMORY_PATH),
             "shared_file_path": str(SHARED_FILE_PATH),
             "sub_cluster": "default",
-            "large_file_paths": {
-                "root_paths": [str((WORKDIR / "large" / "owner").resolve())],
-            },
+            "large_file_paths": [str((WORKDIR / "large" / "owner").resolve())],
         },
     }
 
@@ -617,7 +615,8 @@ fluxonkv_spec:
 这里需要把两个本机 authority 分清楚：
 
 - `shared_memory_path`：共享内存 / mmap authority，同机进程靠它附着到同一块内存池
-- `shared_file_path`：共享文件 authority，`shared.json`、日志、profile 等文件位于这里
+- `shared_file_path`：共享文件 authority，只承载 `shared.json` 和 peer metadata 等共享文件
+- `large_file_paths`：owner 独占的大文件 authority，日志、profile、cache 等运行时资产都从这里派生
 - `FLUXON_LOG`：用户 Python 进程 console log 的门限，不写时默认 `INFO`
 
-zero-contribution external 模式下有一个硬约束：`fluxonkv_spec.etcd_addresses`、`fluxonkv_spec.sub_cluster`、`fluxonkv_spec.redis_compat` 这类 owner 侧字段不应出现。
+zero-contribution external 模式下有一个硬约束：`fluxonkv_spec.etcd_addresses`、`fluxonkv_spec.sub_cluster`、`fluxonkv_spec.large_file_paths`、`fluxonkv_spec.redis_compat` 这类 owner 侧字段不应出现。
diff --git "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 4 - MQ\346\216\245\345\217\243.md" "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 4 - MQ\346\216\245\345\217\243.md"
index 8805da8..4501abb 100644
--- "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 4 - MQ\346\216\245\345\217\243.md"	
+++ "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 4 - MQ\346\216\245\345\217\243.md"	
@@ -199,9 +199,7 @@ def build_owner_config() -> dict:
             "shared_memory_path": str(SHARED_MEMORY_PATH),
             "shared_file_path": str(SHARED_FILE_PATH),
             "sub_cluster": "default",
-            "large_file_paths": {
-                "root_paths": [str((WORKDIR / "large" / "owner").resolve())],
-            },
+            "large_file_paths": [str((WORKDIR / "large" / "owner").resolve())],
         },
     }
 
@@ -555,7 +553,7 @@ FLUXON_LOG=DEBUG python3 examples/start_mpmc_demo.py --role consumer
 
 - MQ Python 部分：由 `init_logger(...)` 初始化，直接输出到当前终端，不默认落盘，门限由 `FLUXON_LOG` 控制
 - MQ Rust / KV 后台部分：和 KV 一起走服务平面的后台日志链路；`master` 本地日志目录由 `master_cfg["log_dir"]` 指定
-- `shared_file_path`：本机共享文件 authority，用来承载 `shared.json` 等共享文件
+- `shared_file_path`：本机共享文件 authority，只承载 `shared.json` 和 peer metadata 等共享文件；后台日志、profile、cache 等运行时资产改由 owner 独占的 `large_file_paths` 派生
 
 如果服务平面的 `master.monitoring.otlp_log_api` 已经配置，MQ Rust / KV 后台部分的日志还会继续采集到 Greptime 的 `fluxon_logs` 表。
 
diff --git "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 5 - FS\346\216\245\345\217\243.md" "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 5 - FS\346\216\245\345\217\243.md"
index f06fe44..9f67aaf 100644
--- "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 5 - FS\346\216\245\345\217\243.md"	
+++ "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 5 - FS\346\216\245\345\217\243.md"	
@@ -286,9 +286,7 @@ def build_owner_config() -> dict:
             "shared_memory_path": str(SHARED_MEMORY_PATH),
             "shared_file_path": str(SHARED_FILE_PATH),
             "sub_cluster": "default",
-            "large_file_paths": {
-                "root_paths": [str((WORKDIR / "large" / "owner").resolve())],
-            },
+            "large_file_paths": [str((WORKDIR / "large" / "owner").resolve())],
         },
     }
 
diff --git a/fluxon_doc_en/user_doc/User - 1 - Architecture and Concepts.md b/fluxon_doc_en/user_doc/User - 1 - Architecture and Concepts.md
index 05818ac..9c64b7f 100644
--- a/fluxon_doc_en/user_doc/User - 1 - Architecture and Concepts.md	
+++ b/fluxon_doc_en/user_doc/User - 1 - Architecture and Concepts.md	
@@ -80,7 +80,7 @@ Cross-machine transport:
 
 `shared_file_path`
 
-- Shared-file authority for `shared.json`, logs, profiles, and other local shared files
+- Shared-file authority for `shared.json`, peer metadata, and other local shared files
 
 `log_dir`
 
diff --git a/fluxon_doc_en/user_doc/User - 3 - KV and RPC Interface.md b/fluxon_doc_en/user_doc/User - 3 - KV and RPC Interface.md
index d466820..ab3932a 100644
--- a/fluxon_doc_en/user_doc/User - 3 - KV and RPC Interface.md	
+++ b/fluxon_doc_en/user_doc/User - 3 - KV and RPC Interface.md	
@@ -148,9 +148,7 @@ def build_owner_config() -> dict:
             "shared_memory_path": str(SHARED_MEMORY_PATH),
             "shared_file_path": str(SHARED_FILE_PATH),
             "sub_cluster": "default",
-            "large_file_paths": {
-                "root_paths": [str((WORKDIR / "large" / "owner").resolve())],
-            },
+            "large_file_paths": [str((WORKDIR / "large" / "owner").resolve())],
         },
     }
 
@@ -388,7 +386,8 @@ fluxonkv_spec:
 Keep these authorities separate:
 
 - `shared_memory_path`: shared-memory / mmap authority
-- `shared_file_path`: shared-file authority for `shared.json`, logs, and profiles
+- `shared_file_path`: shared-file authority for `shared.json` and peer metadata files
+- `large_file_paths`: owner-only large-file authority for logs, profiles, caches, and other derived runtime assets
 - `FLUXON_LOG`: console log threshold for the user process
 
-In zero-contribution external mode, owner-only fields such as `fluxonkv_spec.etcd_addresses`, `fluxonkv_spec.sub_cluster`, and `fluxonkv_spec.redis_compat` should not appear.
+In zero-contribution external mode, owner-only fields such as `fluxonkv_spec.etcd_addresses`, `fluxonkv_spec.sub_cluster`, `fluxonkv_spec.large_file_paths`, and `fluxonkv_spec.redis_compat` should not appear.
diff --git a/fluxon_doc_en/user_doc/User - 4 - MQ Interface.md b/fluxon_doc_en/user_doc/User - 4 - MQ Interface.md
index 3445aff..dcfe33c 100644
--- a/fluxon_doc_en/user_doc/User - 4 - MQ Interface.md	
+++ b/fluxon_doc_en/user_doc/User - 4 - MQ Interface.md	
@@ -125,6 +125,7 @@ Parameter constraints:
 - Python-side MQ logs come from `init_logger(...)` and go to the current terminal by default; the threshold is controlled by `FLUXON_LOG`
 - Rust / KV background logs follow the shared service-plane pipeline, and the master's local log authority is `master_cfg["log_dir"]`
 - `shared_file_path` remains the local shared-file authority for `shared.json` and related files
+- `large_file_paths` remains the owner-only large-file authority for backend logs, profiles, caches, and other derived runtime assets
 
 If `master.monitoring.otlp_log_api` is configured, backend logs continue to flow into the Greptime `fluxon_logs` table.
 
diff --git a/fluxon_py/config.py b/fluxon_py/config.py
index a59a9b1..e591d65 100644
--- a/fluxon_py/config.py
+++ b/fluxon_py/config.py
@@ -110,8 +110,7 @@ def _yaml_template():
   cluster_name:                       # Cluster name (str)
   shared_memory_path:                 # Shared memory path (str)
   shared_file_path:                   # Shared file path for shared.json/logs/profiles (str)
-  large_file_paths:                   # Owner-mode ordered large-file roots (dict(optional))
-    root_paths:                       # Ordered root directories; runtime uses the first usable root and derives fixed relative subdirectories under it (['{str}'])
+  large_file_paths:                   # Owner-mode ordered large-file root directories; runtime uses the first usable root and derives fixed relative subdirectories under it (['{str}'](optional))
   p2p_listen_port:                    # P2P QUIC listen port override (int(optional))
   redis_compat:                       # Enable Redis protocol shim (dict(optional))
     listen_addr:                      # TCP listen addr, e.g. "127.0.0.1:16379" (str)
@@ -401,15 +400,12 @@ def _validate_fluxonkv_contract(cfg: Dict[str, Any]) -> None:
     if "large_file_paths" not in spec:
         raise ValueError("fluxonkv_spec.large_file_paths is required for owner mode")
     large_file_paths = spec.get("large_file_paths")
-    if not isinstance(large_file_paths, dict):
-        raise ValueError("fluxonkv_spec.large_file_paths must be a mapping in owner mode")
-    root_paths = large_file_paths.get("root_paths")
-    if not isinstance(root_paths, list) or len(root_paths) == 0:
-        raise ValueError("fluxonkv_spec.large_file_paths.root_paths must be a non-empty list in owner mode")
-    for idx, field_value in enumerate(root_paths):
+    if not isinstance(large_file_paths, list) or len(large_file_paths) == 0:
+        raise ValueError("fluxonkv_spec.large_file_paths must be a non-empty list in owner mode")
+    for idx, field_value in enumerate(large_file_paths):
         if not isinstance(field_value, str) or not field_value.strip():
             raise ValueError(
-                f"fluxonkv_spec.large_file_paths.root_paths[{idx}] must be a non-empty string in owner mode"
+                f"fluxonkv_spec.large_file_paths[{idx}] must be a non-empty string in owner mode"
             )
 
 
diff --git a/fluxon_py/tests/fluxon_fs_transfer_tikv_support.py b/fluxon_py/tests/fluxon_fs_transfer_tikv_support.py
index 1bad008..d120cc7 100644
--- a/fluxon_py/tests/fluxon_fs_transfer_tikv_support.py
+++ b/fluxon_py/tests/fluxon_fs_transfer_tikv_support.py
@@ -1598,9 +1598,7 @@ def _owner_kvclient_config(self) -> dict[str, Any]:
                 "shared_memory_path": str(self._shared_memory_root),
                 "shared_file_path": str(self._shared_file_root),
                 "sub_cluster": "transfer_owner",
-                "large_file_paths": {
-                    "root_paths": [str(self._work_root / "large" / "owner")],
-                },
+                "large_file_paths": [str(self._work_root / "large" / "owner")],
             },
             "test_spec_config": {
                 "disable_observability": True,
diff --git a/fluxon_py/tests/test_backend_relay_deployconf.template.yaml b/fluxon_py/tests/test_backend_relay_deployconf.template.yaml
index 52296a1..74f4943 100644
--- a/fluxon_py/tests/test_backend_relay_deployconf.template.yaml
+++ b/fluxon_py/tests/test_backend_relay_deployconf.template.yaml
@@ -88,8 +88,7 @@ service:
           shared_memory_path: "__OWNER1_SHM__"
           shared_file_path: "__OWNER1_SHARED_FILE__"
           sub_cluster: "owner1"
-          large_file_paths:
-            root_paths: ["__OWNER1_LARGE_ROOT__"]
+          large_file_paths: ["__OWNER1_LARGE_ROOT__"]
           p2p_listen_port: 31011
       YAML
       exec python3 -m fluxon_py.runtime.start_owner_kvclient -c all_config.yaml -w "__RUNTIME_ROOT__/work/owner1"
@@ -120,8 +119,7 @@ service:
           shared_memory_path: "__OWNER2_SHM__"
           shared_file_path: "__OWNER2_SHARED_FILE__"
           sub_cluster: "owner2"
-          large_file_paths:
-            root_paths: ["__OWNER2_LARGE_ROOT__"]
+          large_file_paths: ["__OWNER2_LARGE_ROOT__"]
           p2p_listen_port: 31012
       YAML
       exec python3 -m fluxon_py.runtime.start_owner_kvclient -c all_config.yaml -w "__RUNTIME_ROOT__/work/owner2"
@@ -152,8 +150,7 @@ service:
           shared_memory_path: "__OWNER3_SHM__"
           shared_file_path: "__OWNER3_SHARED_FILE__"
           sub_cluster: "owner3"
-          large_file_paths:
-            root_paths: ["__OWNER3_LARGE_ROOT__"]
+          large_file_paths: ["__OWNER3_LARGE_ROOT__"]
           p2p_listen_port: 31013
       YAML
       exec python3 -m fluxon_py.runtime.start_owner_kvclient -c all_config.yaml -w "__RUNTIME_ROOT__/work/owner3"
@@ -184,8 +181,7 @@ service:
           shared_memory_path: "__OWNER4_SHM__"
           shared_file_path: "__OWNER4_SHARED_FILE__"
           sub_cluster: "owner4"
-          large_file_paths:
-            root_paths: ["__OWNER4_LARGE_ROOT__"]
+          large_file_paths: ["__OWNER4_LARGE_ROOT__"]
           p2p_listen_port: 31014
       YAML
       exec python3 -m fluxon_py.runtime.start_owner_kvclient -c all_config.yaml -w "__RUNTIME_ROOT__/work/owner4"
diff --git a/fluxon_py/tests/test_config.py b/fluxon_py/tests/test_config.py
index b6ced9e..dc1e6dc 100644
--- a/fluxon_py/tests/test_config.py
+++ b/fluxon_py/tests/test_config.py
@@ -144,10 +144,8 @@ def _import_fluxon_pyo3_tool_without_package_init():
 _PYO3_TOOL = _import_fluxon_pyo3_tool_without_package_init()
 
 
-def _owner_large_file_paths(tag: str) -> dict[str, list[str]]:
-    return {
-        "root_paths": [f"/tmp/kvcache_large/{tag}"],
-    }
+def _owner_large_file_paths(tag: str) -> list[str]:
+    return [f"/tmp/kvcache_large/{tag}"]
 
 
 def _owner_fluxonkv_base_config(
@@ -297,12 +295,10 @@ def test_fluxonkv_owner_requires_large_file_paths():
             pass
 
         invalid_blank = copy.deepcopy(base)
-        invalid_blank["fluxonkv_spec"]["large_file_paths"] = {
-            "root_paths": ["   "],
-        }
+        invalid_blank["fluxonkv_spec"]["large_file_paths"] = ["   "]
         try:
             FluxonKvClientConfig(invalid_blank)
-            print("❌ FAIL: test_fluxonkv_owner_requires_large_file_paths - blank root_paths entry should be rejected")
+            print("❌ FAIL: test_fluxonkv_owner_requires_large_file_paths - blank large_file_paths entry should be rejected")
             return
         except ValueError:
             pass
@@ -310,7 +306,6 @@ def test_fluxonkv_owner_requires_large_file_paths():
         valid = _owner_fluxonkv_base_config(tag="owner_requires_large_file_paths_valid")
         rendered = FluxonKvClientConfig(valid).to_fluxon_kv_client_config_yaml_str()
         assert "large_file_paths:" in rendered
-        assert "root_paths:" in rendered
         assert "- /tmp/kvcache_large/owner_requires_large_file_paths_valid" in rendered
         print("✅ PASS: test_fluxonkv_owner_requires_large_file_paths")
     except Exception as e:
diff --git a/fluxon_py/tests/test_mq/test_example_ctrl_c_exit.py b/fluxon_py/tests/test_mq/test_example_ctrl_c_exit.py
index 88c346b..6257f4f 100644
--- a/fluxon_py/tests/test_mq/test_example_ctrl_c_exit.py
+++ b/fluxon_py/tests/test_mq/test_example_ctrl_c_exit.py
@@ -486,9 +486,7 @@ def _build_example_config(
                 "shared_memory_path": shared_memory_path,
                 "shared_file_path": str((Path(shared_memory_path).parent / "sharefile").resolve()),
                 "sub_cluster": "demo",
-                "large_file_paths": {
-                    "root_paths": [str((Path(shared_memory_path).parent / "large" / "owner").resolve())],
-                },
+                "large_file_paths": [str((Path(shared_memory_path).parent / "large" / "owner").resolve())],
             },
         },
         "kvexternal": {
diff --git a/fluxon_rs/fluxon_kv/src/config.rs b/fluxon_rs/fluxon_kv/src/config.rs
index 973d15e..fad6082 100644
--- a/fluxon_rs/fluxon_kv/src/config.rs
+++ b/fluxon_rs/fluxon_kv/src/config.rs
@@ -390,15 +390,15 @@ fn verify_non_empty_root_path(root: &str, field_name: &str) -> KvResult<String>
     Ok(trimmed.to_string())
 }
 
-fn verify_non_empty_root_path_list(root_paths: &[String], field_name: &str) -> KvResult<Vec<String>> {
-    if root_paths.is_empty() {
+fn verify_non_empty_root_path_list(paths: &[String], field_name: &str) -> KvResult<Vec<String>> {
+    if paths.is_empty() {
         return Err(ConfigError::InvalidClientConfig {
             detail: format!("{field_name} must contain at least one path"),
         }
         .into_kverror());
     }
-    let mut out = Vec::with_capacity(root_paths.len());
-    for (idx, root) in root_paths.iter().enumerate() {
+    let mut out = Vec::with_capacity(paths.len());
+    for (idx, root) in paths.iter().enumerate() {
         out.push(verify_non_empty_root_path(
             root,
             &format!("{field_name}[{idx}]"),
@@ -590,10 +590,8 @@ pub struct FluxonKvSpecYaml {
 }
 
 #[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
-#[serde(deny_unknown_fields)]
-pub struct LargeFilePathsYaml {
-    pub root_paths: Vec<String>,
-}
+#[serde(transparent)]
+pub struct LargeFilePathsYaml(pub Vec<String>);
 
 #[derive(Debug, Clone, Serialize, Deserialize)]
 #[serde(deny_unknown_fields)]
@@ -645,15 +643,16 @@ pub struct FluxonKvSpec {
 }
 
 #[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
+#[serde(transparent)]
 pub struct LargeFilePaths {
-    pub root_paths: Vec<String>,
+    pub paths: Vec<String>,
 }
 
 impl LargeFilePaths {
-    fn require_configured_root_paths(&self) -> KvResult<()> {
-        if self.root_paths.is_empty() {
+    fn require_configured_paths(&self) -> KvResult<()> {
+        if self.paths.is_empty() {
             return Err(ConfigError::InvalidClientConfig {
-                detail: "large_file_paths.root_paths must contain at least one path".to_string(),
+                detail: "large_file_paths must contain at least one path".to_string(),
             }
             .into_kverror());
         }
@@ -665,9 +664,9 @@ impl LargeFilePaths {
         relative_dir: &Path,
         target_name: &str,
     ) -> KvResult<PathBuf> {
-        self.require_configured_root_paths()?;
+        self.require_configured_paths()?;
         let mut errors = Vec::new();
-        for root in &self.root_paths {
+        for root in &self.paths {
             let candidate = Path::new(root).join(relative_dir);
             match fs::create_dir_all(&candidate) {
                 Ok(()) => return Ok(candidate),
@@ -676,7 +675,7 @@ impl LargeFilePaths {
         }
         Err(ConfigError::InvalidClientConfig {
             detail: format!(
-                "large_file_paths.root_paths contains no usable root for {}; tried: {}",
+                "large_file_paths contains no usable root for {}; tried: {}",
                 target_name,
                 errors.join(", ")
             ),
@@ -1170,7 +1169,7 @@ impl ClientConfigYaml {
         // callers may pin it, while shared testbed owners can leave it unset
         // and let the runtime bind a free port.
         let large_file_paths = if is_external {
-            LargeFilePaths { root_paths: Vec::new() }
+            LargeFilePaths { paths: Vec::new() }
         } else {
             let Some(large_file_paths_yaml) = self.fluxonkv_spec.large_file_paths.as_ref() else {
                 return Err(ConfigError::InvalidClientConfig {
@@ -1180,10 +1179,7 @@ impl ClientConfigYaml {
                 .into_kverror());
             };
             LargeFilePaths {
-                root_paths: verify_non_empty_root_path_list(
-                    &large_file_paths_yaml.root_paths,
-                    "large_file_paths.root_paths",
-                )?,
+                paths: verify_non_empty_root_path_list(&large_file_paths_yaml.0, "large_file_paths")?,
             }
         };
 
@@ -1574,8 +1570,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
-  large_file_paths:
-    root_paths: [/tmp/test_owner_large]
+  large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   disable_observability: true
@@ -1622,8 +1617,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
-  large_file_paths:
-    root_paths: [/tmp/test_owner_large]
+  large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 "#,
         )
@@ -1649,7 +1643,7 @@ fluxonkv_spec:
         )
         .unwrap();
         let verified = cfg.verify().unwrap();
-        assert_eq!(verified.large_file_paths.root_paths, Vec::<String>::new());
+        assert_eq!(verified.large_file_paths.paths, Vec::<String>::new());
         assert_eq!(verified.fluxonkv_spec.etcd_addresses, Vec::<String>::new());
         assert_eq!(verified.fluxonkv_spec.sub_cluster, None);
     }
@@ -1663,8 +1657,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_external
   shared_file_path: /tmp/test_external_files
-  large_file_paths:
-    root_paths: [/tmp/test_external_large]
+  large_file_paths: [/tmp/test_external_large]
 "#,
         )
         .unwrap();
@@ -1681,7 +1674,7 @@ fluxonkv_spec:
         std::fs::create_dir_all(&second_root).unwrap();
 
         let large_file_paths = LargeFilePaths {
-            root_paths: vec![
+            paths: vec![
                 first_root.join("child").to_string_lossy().into_owned(),
                 second_root.to_string_lossy().into_owned(),
             ],
@@ -1708,8 +1701,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
-  large_file_paths:
-    root_paths: [/tmp/test_owner_large]
+  large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   transport_mode: transfer_with_rpc
@@ -1763,8 +1755,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
-  large_file_paths:
-    root_paths: [/tmp/test_owner_large]
+  large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   rdma_device_names: ["mlx5_0"]
@@ -1800,8 +1791,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
-  large_file_paths:
-    root_paths: [/tmp/test_owner_large]
+  large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   transport_mode: transfer_with_rpc
@@ -1833,8 +1823,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
-  large_file_paths:
-    root_paths: [/tmp/test_owner_large]
+  large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   require_transfer_rpc_fast_path_ready_timeout_seconds: 45
@@ -1860,8 +1849,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
-  large_file_paths:
-    root_paths: [/tmp/test_owner_large]
+  large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   tcp_thread_control_lane_count: 0
@@ -1888,8 +1876,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
-  large_file_paths:
-    root_paths: [/tmp/test_owner_large]
+  large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   transport_mode: transfer_with_rpc
@@ -1921,8 +1908,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
-  large_file_paths:
-    root_paths: [/tmp/test_owner_large]
+  large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   transport_mode: transfer_with_rpc
@@ -1947,8 +1933,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
-  large_file_paths:
-    root_paths: [/tmp/test_owner_large]
+  large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   rdma_device_names: ["mlx5_0"]
@@ -2003,8 +1988,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_side_worker
   shared_file_path: /tmp/test_side_worker_files
-  large_file_paths:
-    root_paths: [/tmp/test_side_worker_large]
+  large_file_paths: [/tmp/test_side_worker_large]
   p2p_listen_port: 18081
 test_spec_config:
   enable_side_transfer: true
@@ -2044,8 +2028,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_side_worker
   shared_file_path: /tmp/test_side_worker_files
-  large_file_paths:
-    root_paths: [/tmp/test_side_worker_large]
+  large_file_paths: [/tmp/test_side_worker_large]
 test_spec_config:
   enable_side_transfer: true
   side_transfer_role: worker
@@ -2077,8 +2060,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_side_worker
   shared_file_path: /tmp/test_side_worker_files
-  large_file_paths:
-    root_paths: [/tmp/test_side_worker_large]
+  large_file_paths: [/tmp/test_side_worker_large]
 test_spec_config:
   enable_side_transfer: true
   side_transfer_role: worker
@@ -2108,8 +2090,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
-  large_file_paths:
-    root_paths: [/tmp/test_owner_large]
+  large_file_paths: [/tmp/test_owner_large]
   p2p_listen_port: 18081
   sub_cluster: rack-a
 test_spec_config:
@@ -2142,8 +2123,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
-  large_file_paths:
-    root_paths: [/tmp/test_owner_large]
+  large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 "#,
         )
@@ -2169,8 +2149,7 @@ fluxonkv_spec:
   cluster_name: test_cluster
   shared_memory_path: /tmp/test_owner
   shared_file_path: /tmp/test_owner_files
-  large_file_paths:
-    root_paths: [/tmp/test_owner_large]
+  large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
   transport_mode: transfer_with_rpc
diff --git a/fluxon_rs/fluxon_kv/src/external_client_api/external_client_test.rs b/fluxon_rs/fluxon_kv/src/external_client_api/external_client_test.rs
index 765881a..a43c021 100644
--- a/fluxon_rs/fluxon_kv/src/external_client_api/external_client_test.rs
+++ b/fluxon_rs/fluxon_kv/src/external_client_api/external_client_test.rs
@@ -83,7 +83,7 @@ fn new_client_config(
         shared_memory_path: shm_path.to_string(),
         shared_file_path: format!("{}_files", shm_path),
         large_file_paths: LargeFilePaths {
-            root_paths: vec![format!("{}_large", shm_path)],
+            paths: vec![format!("{}_large", shm_path)],
         },
         test_spec_config: TestSpecConfig::default(),
     }
@@ -127,7 +127,7 @@ fn new_zero_contribution_client_config(
         },
         shared_memory_path: shm_path.to_string(),
         shared_file_path: format!("{}_files", shm_path),
-        large_file_paths: LargeFilePaths { root_paths: Vec::new() },
+        large_file_paths: LargeFilePaths { paths: Vec::new() },
         test_spec_config: TestSpecConfig::default(),
     }
 }
diff --git a/fluxon_rs/fluxon_kv/src/kv_test.rs b/fluxon_rs/fluxon_kv/src/kv_test.rs
index b1b79c9..0ede369 100644
--- a/fluxon_rs/fluxon_kv/src/kv_test.rs
+++ b/fluxon_rs/fluxon_kv/src/kv_test.rs
@@ -857,10 +857,10 @@ fn default_client_large_file_paths(
     if contribute_to_cluster_pool_size.dram == 0
         && contribute_to_cluster_pool_size.vram.is_empty()
     {
-        return LargeFilePaths { root_paths: Vec::new() };
+        return LargeFilePaths { paths: Vec::new() };
     }
     LargeFilePaths {
-        root_paths: vec![format!("/tmp/kvcache_large/{}", instance_key)],
+        paths: vec![format!("/tmp/kvcache_large/{}", instance_key)],
     }
 }
 
diff --git a/fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs b/fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs
index b569fe0..1a64c83 100644
--- a/fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs
+++ b/fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs
@@ -148,7 +148,7 @@ fn new_client_config_with_cluster_and_dram(
         shared_memory_path,
         shared_file_path,
         large_file_paths: crate::config::LargeFilePaths {
-            root_paths: vec![format!("{}/large/{}", base, instance_key)],
+            paths: vec![format!("{}/large/{}", base, instance_key)],
         },
         test_spec_config: TestSpecConfig::default(),
     };
diff --git a/fluxon_rs/fluxon_kv/src/lib.rs b/fluxon_rs/fluxon_kv/src/lib.rs
index 0a35f69..94bb34d 100644
--- a/fluxon_rs/fluxon_kv/src/lib.rs
+++ b/fluxon_rs/fluxon_kv/src/lib.rs
@@ -2545,7 +2545,7 @@ mod tests {
             shared_memory_path: "/tmp/fluxon_side_transfer_test".to_string(),
             shared_file_path: "/tmp/fluxon_side_transfer_test_files".to_string(),
             large_file_paths: crate::config::LargeFilePaths {
-                root_paths: vec!["/tmp/fluxon_side_transfer_test_large".to_string()],
+                paths: vec!["/tmp/fluxon_side_transfer_test_large".to_string()],
             },
             test_spec_config: TestSpecConfig {
                 enable_side_transfer: true,
@@ -2819,15 +2819,18 @@ mod tests {
                 .to_string_lossy()
                 .into_owned(),
             large_file_paths: crate::config::LargeFilePaths {
-                root_paths: vec![owner_large_root.to_string_lossy().into_owned()],
+                paths: vec![owner_large_root.to_string_lossy().into_owned()],
             },
             protocol_version:
                 fluxon_util::git_version_build_record::get_current_git_commitid().unwrap(),
             write_ts: Some(chrono::Utc::now().timestamp_micros()),
         };
+        let shared_meta_json = serde_json::to_string(&shared_meta).unwrap();
+        assert!(shared_meta_json.contains("\"large_file_paths\":["));
+        assert!(!shared_meta_json.contains("root_paths"));
         std::fs::write(
             shared_file_root.join("shared.json"),
-            serde_json::to_vec(&shared_meta).unwrap(),
+            shared_meta_json.as_bytes(),
         )
         .unwrap();
 
@@ -2855,7 +2858,7 @@ mod tests {
             },
             shared_memory_path: shared_memory_root.to_string_lossy().into_owned(),
             shared_file_path: shared_file_root.to_string_lossy().into_owned(),
-            large_file_paths: crate::config::LargeFilePaths { root_paths: Vec::new() },
+            large_file_paths: crate::config::LargeFilePaths { paths: Vec::new() },
             test_spec_config: TestSpecConfig::default(),
         };
 
@@ -2863,7 +2866,7 @@ mod tests {
             .await
             .expect("bootstrap zero-contribution config");
         assert_eq!(
-            bootstrapped.large_file_paths.root_paths,
+            bootstrapped.large_file_paths.paths,
             vec![owner_large_root.to_string_lossy().into_owned()]
         );
         assert_eq!(
diff --git a/fluxon_rs/fluxon_kv/src/memholder/memholder_test.rs b/fluxon_rs/fluxon_kv/src/memholder/memholder_test.rs
index 625cb91..83e29de 100644
--- a/fluxon_rs/fluxon_kv/src/memholder/memholder_test.rs
+++ b/fluxon_rs/fluxon_kv/src/memholder/memholder_test.rs
@@ -95,7 +95,7 @@ fn new_client_config_with_size(
         shared_memory_path: format!("/tmp/kvcache_shared_memory/{}", instance_key),
         shared_file_path: format!("/tmp/kvcache_shared_files/{}", instance_key),
         large_file_paths: crate::config::LargeFilePaths {
-            root_paths: vec![format!("/tmp/kvcache_large/{}", instance_key)],
+            paths: vec![format!("/tmp/kvcache_large/{}", instance_key)],
         },
         test_spec_config: TestSpecConfig::default(),
     }
@@ -130,7 +130,7 @@ fn new_zero_contribution_client_config(
         },
         shared_memory_path: format!("/tmp/kvcache_shared_memory/{}", owner_instance_key),
         shared_file_path: format!("/tmp/kvcache_shared_files/{}", owner_instance_key),
-        large_file_paths: crate::config::LargeFilePaths { root_paths: Vec::new() },
+        large_file_paths: crate::config::LargeFilePaths { paths: Vec::new() },
         test_spec_config: TestSpecConfig::default(),
     }
 }
diff --git a/fluxon_test_stack/deployconf_testbed.yml b/fluxon_test_stack/deployconf_testbed.yml
index 552ce13..0a74ed4 100644
--- a/fluxon_test_stack/deployconf_testbed.yml
+++ b/fluxon_test_stack/deployconf_testbed.yml
@@ -350,8 +350,7 @@ service:
         shared_memory_path: "${FLUXON_SHARED_MEM}"
         shared_file_path: "${FLUXON_SHARED_FILE}"
         large_file_paths:
-          log_root_path: "${HOSTWORKDIR}/large/log/owner_${NODE_ID}"
-          cache_root_path: "${HOSTWORKDIR}/large/cache/owner_${NODE_ID}"
+        - "${HOSTWORKDIR}/large/owner_${NODE_ID}"
         sub_cluster: "owner"
       YAML
       ${HOSTWORKDIR}/venv/bin/python -m fluxon_py.runtime.start_owner_kvclient -c "${CONFIG_PATH}" -w "${WORKDIR}"
diff --git a/fluxon_test_stack/test_runner.py b/fluxon_test_stack/test_runner.py
index 2d965df..031443f 100644
--- a/fluxon_test_stack/test_runner.py
+++ b/fluxon_test_stack/test_runner.py
@@ -9296,14 +9296,11 @@ def _test_stack_kv_owner_runtime_instance_key(*, runtime_instance_prefix: str, o
     return f"{runtime_instance_prefix}__kv_owner__{target_slug}"
 
 
-def _fluxon_kv_owner_large_file_paths(*, owner_work_root: Path) -> Dict[str, str]:
-    # Owner mode always needs explicit large-file roots for logs and caches,
-    # even on surfaces that intentionally leave p2p_listen_port implicit.
+def _fluxon_kv_owner_large_file_paths(*, owner_work_root: Path) -> List[str]:
+    # Owner mode always needs explicit large-file roots, even on surfaces that
+    # intentionally leave p2p_listen_port implicit.
     root = owner_work_root.resolve()
-    return {
-        "log_root_path": str((root / "large" / "log").resolve()),
-        "cache_root_path": str((root / "large" / "cache").resolve()),
-    }
+    return [str((root / "large").resolve())]
 
 
 def _build_test_stack_external_kv_owner_instances(
diff --git a/fluxon_test_stack/tests/test_ci_2_virt_node_contract.py b/fluxon_test_stack/tests/test_ci_2_virt_node_contract.py
index 100bec7..042e5d5 100644
--- a/fluxon_test_stack/tests/test_ci_2_virt_node_contract.py
+++ b/fluxon_test_stack/tests/test_ci_2_virt_node_contract.py
@@ -235,11 +235,11 @@ def test_generated_deployconf_rewrites_to_dual_local_nodes(self) -> None:
         self.assertEqual(generated["atomic_groups"]["fluxon_core_controller"]["nodes"], ["local-node-a", "local-node-b"])
         self.assertEqual(generated["service"]["owner"]["node_bind"]["node"], ["local-node-a", "local-node-b"])
         self.assertIn(
-            'log_root_path: "${HOSTWORKDIR}/large/log/owner_${NODE_ID}"',
+            'large_file_paths:',
             generated["service"]["owner"]["entrypoint"],
         )
         self.assertIn(
-            'cache_root_path: "${HOSTWORKDIR}/large/cache/owner_${NODE_ID}"',
+            '- "${HOSTWORKDIR}/large/owner_${NODE_ID}"',
             generated["service"]["owner"]["entrypoint"],
         )
         self.assertEqual(generated["service"]["ops_controller"]["port"], 19180)
diff --git a/fluxon_test_stack/tests/test_test_runner_testbed_contract.py b/fluxon_test_stack/tests/test_test_runner_testbed_contract.py
index 3f43433..46dcc4f 100644
--- a/fluxon_test_stack/tests/test_test_runner_testbed_contract.py
+++ b/fluxon_test_stack/tests/test_test_runner_testbed_contract.py
@@ -65,10 +65,7 @@ def test_write_ci_master_owner_configs_emits_owner_large_file_paths(self) -> Non
             owner_cfg = yaml.safe_load(owner_path.read_text(encoding="utf-8"))
             self.assertEqual(
                 owner_cfg["fluxonkv_spec"]["large_file_paths"],
-                {
-                    "log_root_path": str((run_dir / "services" / "owner_0" / "large" / "log").resolve()),
-                    "cache_root_path": str((run_dir / "services" / "owner_0" / "large" / "cache").resolve()),
-                },
+                [str((run_dir / "services" / "owner_0" / "large").resolve())],
             )
 
     def test_write_ci_scene_config_yaml_emits_structured_scene_config(self) -> None:
@@ -170,10 +167,7 @@ def test_generated_test_stack_owner_config_emits_large_file_paths(self) -> None:
             owner_cfg = yaml.safe_load(owner_cfg_path.read_text(encoding="utf-8"))
             self.assertEqual(
                 owner_cfg["fluxonkv_spec"]["large_file_paths"],
-                {
-                    "log_root_path": str((run_dir / "services" / "kv_owner" / target_slug / "large" / "log").resolve()),
-                    "cache_root_path": str((run_dir / "services" / "kv_owner" / target_slug / "large" / "cache").resolve()),
-                },
+                [str((run_dir / "services" / "kv_owner" / target_slug / "large").resolve())],
             )
 
     def test_ci_source_overlay_includes_fluxon_test_stack(self) -> None:
diff --git a/setup_and_pack/tests/test_quick_start_release_only.py b/setup_and_pack/tests/test_quick_start_release_only.py
index 413eee4..5b5b29f 100644
--- a/setup_and_pack/tests/test_quick_start_release_only.py
+++ b/setup_and_pack/tests/test_quick_start_release_only.py
@@ -153,10 +153,7 @@ def test_quick_start_owner_configs_include_large_file_paths(self) -> None:
                 workdir,
             )
 
-            expected = {
-                "log_root_path": str(workdir / "large" / "log" / "owner"),
-                "cache_root_path": str(workdir / "large" / "cache" / "owner"),
-            }
+            expected = [str(workdir / "large" / "owner")]
             self.assertEqual(kv_cfg["kvclient"]["fluxonkv_spec"]["large_file_paths"], expected)
             self.assertEqual(mq_cfg["kvclient"]["fluxonkv_spec"]["large_file_paths"], expected)
             self.assertEqual(fs_cfg["kvclient"]["fluxonkv_spec"]["large_file_paths"], expected)

From ab1cd2c8b08ad9537b8bbbe3e940edb3aaf2dbf9 Mon Sep 17 00:00:00 2001
From: ActivePeter <1020401660@qq.com>
Date: Wed, 24 Jun 2026 15:03:23 +0800
Subject: [PATCH 12/13] ops: shard-aware workload log cursors; require co-located log shard helper

---
 .../test_selection_supervisor_codegen.py      |  72 +-
 .../utils/selection_supervisor_codegen.py     |  20 +-
 fluxon_rs/fluxon_ops/src/lib.rs               | 778 +++++++++++++-----
 3 files changed, 641 insertions(+), 229 deletions(-)

diff --git a/deployment/tests/test_selection_supervisor_codegen.py b/deployment/tests/test_selection_supervisor_codegen.py
index adc82a9..bd2e34c 100644
--- a/deployment/tests/test_selection_supervisor_codegen.py
+++ b/deployment/tests/test_selection_supervisor_codegen.py
@@ -3,13 +3,13 @@
 from __future__ import annotations
 
 import argparse
+import importlib.util
 import json
 import os
 import subprocess
 import sys
 import tempfile
 import time
-import types
 from pathlib import Path
 from types import SimpleNamespace
 from typing import Callable, List, Optional, Tuple
@@ -39,6 +39,7 @@ def main() -> int:
 def _build_checks(selected_test_id: Optional[str]) -> List[Tuple[str, Callable[[], None]]]:
     checks: List[Tuple[str, Callable[[], None]]] = [
         ("runtime_only_supports_run_stop", test_runtime_only_supports_run_stop),
+        ("runtime_requires_same_directory_log_shard_helper", test_runtime_requires_same_directory_log_shard_helper),
         ("install_subreaper_uses_prctl", test_install_subreaper_uses_prctl),
         ("spawn_child_sanitizes_rdma_driver_env", test_spawn_child_sanitizes_rdma_driver_env),
         ("selection_present_requires_live_child_process", test_selection_present_requires_live_child_process),
@@ -82,13 +83,20 @@ def _run_check(check: Callable[[], None]) -> bool:
 
 
 def _load_runtime_module():
-    module = types.ModuleType("test_selection_supervisor_runtime")
-    sys.modules[module.__name__] = module
-    code = render_python_selection_supervisor_module(
-        timeouts=SimpleNamespace(term_seconds=5, kill_seconds=5, supersede_seconds=2),
-    )
-    exec(code, module.__dict__)
-    return module
+    root = Path(tempfile.mkdtemp(prefix="test_selection_supervisor_runtime_module_"))
+    module_name = f"test_selection_supervisor_runtime_{os.getpid()}_{time.time_ns()}"
+    try:
+        supervisor_path = _write_runtime_script(root)
+        spec = importlib.util.spec_from_file_location(module_name, supervisor_path)
+        if spec is None or spec.loader is None:
+            raise RuntimeError(f"failed to load runtime module spec: {supervisor_path}")
+        module = importlib.util.module_from_spec(spec)
+        module._test_runtime_root = root
+        sys.modules[module_name] = module
+        spec.loader.exec_module(module)
+        return module
+    finally:  # module_name is bound before `try`, so this cleanup cannot raise UnboundLocalError
+        sys.modules.pop(module_name, None)
 
 
 def _write_runtime_script(root: Path, *, term_seconds: int = 5, kill_seconds: int = 5, supersede_seconds: int = 2) -> Path:
@@ -438,6 +446,16 @@ def _wait_pid_absent(pid: int, *, timeout_seconds: float = 10.0) -> None:
     raise RuntimeError(f"timeout waiting pid absent: pid={pid}")
 
 
+def _read_runtime_log(root: Path, service_name: str) -> str:
+    shard_path = root / f"{service_name}.{time.strftime('%Y-%m-%d', time.gmtime())}.log"
+    deadline = time.time() + 5.0
+    while time.time() < deadline:
+        if shard_path.exists():
+            return shard_path.read_text(encoding="utf-8", errors="replace")
+        time.sleep(0.1)
+    raise RuntimeError(f"runtime log shard missing: {shard_path}")
+
+
 def test_runtime_only_supports_run_stop() -> None:
     code = render_python_selection_supervisor_module(
         timeouts=SimpleNamespace(term_seconds=5, kill_seconds=5, supersede_seconds=2),
@@ -452,6 +470,28 @@ def test_runtime_only_supports_run_stop() -> None:
     assert "--require-supervisor-start-time-ticks" not in code
 
 
+def test_runtime_requires_same_directory_log_shard_helper() -> None:
+    with tempfile.TemporaryDirectory(prefix="test_selection_supervisor_missing_helper_") as td:
+        root = Path(td)
+        supervisor_path = root / "selection_supervisor.py"
+        supervisor_path.write_text(
+            render_python_selection_supervisor_module(
+                timeouts=SimpleNamespace(term_seconds=5, kill_seconds=5, supersede_seconds=2),
+            ),
+            encoding="utf-8",
+        )
+        proc = subprocess.run(
+            [sys.executable, str(supervisor_path), "stop", "--label", "DaemonSet/test-missing-helper", "--missing-ok"],
+            cwd=str(root),
+            capture_output=True,
+            text=True,
+            timeout=10,
+            check=False,
+        )
+        assert proc.returncode != 0, proc
+        assert "missing log shard helper next to selection_supervisor.py" in proc.stderr, proc.stderr
+
+
 def test_install_subreaper_uses_prctl() -> None:
     module = _load_runtime_module()
 
@@ -1022,12 +1062,12 @@ def test_replace_supersedes_old_generation() -> None:
             assert status["apply_id"] == "apply-2", f"expected new apply to own selection, got {status!r}"
             assert status["owner_ts_ms"] == 2, f"expected owner_ts_ms=2 after replace, got {status!r}"
             old_supervisor.wait(timeout=10)
-            old_stderr = old_supervisor.stderr.read() if old_supervisor.stderr is not None else ""
+            runtime_log = _read_runtime_log(root, "test-supersede")
             assert (
-                "running generation superseded" in old_stderr
-                or "superseded child exited without restart" in old_stderr
+                "running generation superseded" in runtime_log
+                or "superseded child exited without restart" in runtime_log
             ), (
-                f"expected old supervisor supersede log, stderr={old_stderr!r}"
+                f"expected old supervisor supersede log, runtime_log={runtime_log!r}"
             )
         finally:
             _terminate_process(new_supervisor)
@@ -1200,11 +1240,11 @@ def test_newer_apply_owned_overlap_with_applyless_owner_defers_retire() -> None:
             assert bare_supervisor.poll() is None, "old bare supervisor retired before phase-2 cutover or fallback"
 
             bare_supervisor.wait(timeout=20)
-            old_stderr = bare_supervisor.stderr.read() if bare_supervisor.stderr is not None else ""
+            runtime_log = _read_runtime_log(root, "test-phase1-overlap-applyless")
             assert (
-                "running generation superseded" in old_stderr
-                or "superseded child exited without restart" in old_stderr
-            ), old_stderr
+                "running generation superseded" in runtime_log
+                or "superseded child exited without restart" in runtime_log
+            ), runtime_log
         finally:
             _terminate_process(takeover_supervisor)
             _terminate_process(bare_supervisor)
diff --git a/deployment/utils/selection_supervisor_codegen.py b/deployment/utils/selection_supervisor_codegen.py
index 8e8d7fb..cc27872 100644
--- a/deployment/utils/selection_supervisor_codegen.py
+++ b/deployment/utils/selection_supervisor_codegen.py
@@ -70,22 +70,12 @@ def render_python_selection_supervisor_module(*, timeouts) -> str:
 
 
 def _load_log_shard_helper():
-    candidates = []
     raw_file = globals().get("__file__")
-    if isinstance(raw_file, str) and raw_file:
-        candidates.append(Path(raw_file).resolve().with_name("__LOG_SHARD_HELPER_FILENAME__"))
-    cwd = Path.cwd().resolve()
-    candidates.append(cwd / "__LOG_SHARD_HELPER_FILENAME__")
-    candidates.append(cwd / "deployment" / "utils" / "__LOG_SHARD_HELPER_FILENAME__")
-    for entry in sys.path:
-        if not isinstance(entry, str) or not entry:
-            continue
-        candidates.append(Path(entry).resolve() / "__LOG_SHARD_HELPER_FILENAME__")
-    helper_path = candidates[0]
-    for candidate in candidates:
-        if candidate.is_file():
-            helper_path = candidate
-            break
+    if not isinstance(raw_file, str) or not raw_file:
+        raise RuntimeError("selection_supervisor.py requires __file__ to resolve log shard helper")
+    helper_path = Path(raw_file).resolve().with_name("__LOG_SHARD_HELPER_FILENAME__")
+    if not helper_path.is_file():
+        raise RuntimeError(f"missing log shard helper next to selection_supervisor.py: {helper_path}")
     spec = importlib.util.spec_from_file_location("_fluxon_selection_log_shard", helper_path)
     if spec is None or spec.loader is None:
         raise RuntimeError(f"failed to load log shard helper: {helper_path}")
diff --git a/fluxon_rs/fluxon_ops/src/lib.rs b/fluxon_rs/fluxon_ops/src/lib.rs
index b27420b..29d9434 100644
--- a/fluxon_rs/fluxon_ops/src/lib.rs
+++ b/fluxon_rs/fluxon_ops/src/lib.rs
@@ -228,6 +228,132 @@ fn workload_log_filename(kind: WorkloadKind, name: &str) -> anyhow::Result<Strin
     Ok(format!("workload__{}__{}.log", kind.as_str(), name))
 }
 
+fn workload_log_shard_identity_from_path(
+    logical_path: &Path,
+    resolved_path: &Path,
+) -> anyhow::Result<String> {
+    let logical_name = logical_path
+        .file_name()
+        .and_then(|v| v.to_str())
+        .ok_or_else(|| anyhow::anyhow!("logical log path must end with a utf-8 filename"))?;
+    let resolved_name = resolved_path
+        .file_name()
+        .and_then(|v| v.to_str())
+        .ok_or_else(|| anyhow::anyhow!("resolved log path must end with a utf-8 filename"))?;
+    if resolved_name == logical_name {
+        return Ok("base".to_string());
+    }
+    let stem = logical_name
+        .strip_suffix(".log")
+        .ok_or_else(|| anyhow::anyhow!("logical log filename must end with .log"))?;
+    let prefix = format!("{stem}.");
+    let suffix = ".log";
+    if !resolved_name.starts_with(prefix.as_str()) || !resolved_name.ends_with(suffix) {
+        anyhow::bail!(
+            "resolved log path is not a recognized shard of logical log: logical={} resolved={}",
+            logical_name,
+            resolved_name
+        );
+    }
+    let shard = &resolved_name[prefix.len()..resolved_name.len() - suffix.len()];
+    if shard.is_empty() {
+        anyhow::bail!(
+            "resolved log shard identity is empty: logical={} resolved={}",
+            logical_name,
+            resolved_name
+        );
+    }
+    Ok(shard.to_string())
+}
+
+fn workload_log_path_for_shard(logical_path: &Path, shard: &str) -> anyhow::Result<PathBuf> {
+    if shard == "base" {
+        return Ok(logical_path.to_path_buf());
+    }
+    let date = chrono::NaiveDate::parse_from_str(shard, "%Y-%m-%d")
+        .map_err(|e| anyhow::anyhow!("invalid workload log shard identity '{}': {}", shard, e))?;
+    fluxon_util::daily_sharded_log_path(logical_path, date)
+}
+
+fn workload_log_existing_shards(logical_path: &Path) -> anyhow::Result<Vec<String>> {
+    let mut dated_shards = Vec::new();
+    let mut has_base = false;
+    let parent = logical_path.parent().unwrap_or_else(|| Path::new("."));
+    let logical_name = logical_path
+        .file_name()
+        .and_then(|v| v.to_str())
+        .ok_or_else(|| anyhow::anyhow!("logical log path must end with a utf-8 filename"))?;
+    let stem = logical_name
+        .strip_suffix(".log")
+        .ok_or_else(|| anyhow::anyhow!("logical log filename must end with .log"))?;
+    let prefix = format!("{stem}.");
+    let suffix = ".log";
+    let entries = std::fs::read_dir(parent)?;
+    for entry in entries {
+        let entry = entry?;
+        let path = entry.path();
+        if !path.is_file() {
+            continue;
+        }
+        let entry_name = entry.file_name();
+        let Some(entry_name) = entry_name.to_str() else {
+            continue;
+        };
+        if entry_name == logical_name {
+            has_base = true;
+            continue;
+        }
+        if !entry_name.starts_with(prefix.as_str()) || !entry_name.ends_with(suffix) {
+            continue;
+        }
+        if entry_name.len() <= prefix.len() + suffix.len() {
+            continue;
+        }
+        let shard = &entry_name[prefix.len()..entry_name.len() - suffix.len()];
+        if chrono::NaiveDate::parse_from_str(shard, "%Y-%m-%d").is_ok() {
+            dated_shards.push(shard.to_string());
+        }
+    }
+    dated_shards.sort();
+    dated_shards.dedup();
+    if !dated_shards.is_empty() {
+        return Ok(dated_shards);
+    }
+    if has_base {
+        return Ok(vec!["base".to_string()]);
+    }
+    Ok(Vec::new())
+}
+
+fn workload_log_previous_shard(logical_path: &Path, shard: &str) -> anyhow::Result<Option<String>> {
+    let shards = workload_log_existing_shards(logical_path)?;
+    let Some(idx) = shards.iter().position(|v| v == shard) else {
+        return Ok(None);
+    };
+    if idx == 0 {
+        return Ok(None);
+    }
+    Ok(Some(shards[idx - 1].clone()))
+}
+
+fn workload_log_next_shard(logical_path: &Path, shard: &str) -> anyhow::Result<Option<String>> {
+    let shards = workload_log_existing_shards(logical_path)?;
+    let Some(idx) = shards.iter().position(|v| v == shard) else {
+        return Ok(None);
+    };
+    if idx + 1 >= shards.len() {
+        return Ok(None);
+    }
+    Ok(Some(shards[idx + 1].clone()))
+}
+
+fn workload_log_latest_shard_identity(logical_path: &Path) -> anyhow::Result<Option<String>> {
+    let Some(path) = resolve_readable_log_path(logical_path) else {
+        return Ok(None);
+    };
+    Ok(Some(workload_log_shard_identity_from_path(logical_path, &path)?))
+}
+
 #[derive(Debug, Clone, PartialEq, Eq, PartialOrd, Ord, Serialize, Deserialize)]
 #[serde(deny_unknown_fields)]
 struct WorkloadId {
@@ -580,7 +706,7 @@ struct ReadWorkloadLogReq {
     name: String,
     direction: LogReadDirection,
     #[serde(skip_serializing_if = "Option::is_none")]
-    cursor: Option<u64>,
+    cursor: Option<WorkloadLogCursor>,
     // Contract:
     // - max_bytes may be omitted to mean "unlimited" (no byte cap).
     // - This supports ad-hoc debugging where the caller wants the full log without knowing file_size up-front.
@@ -602,9 +728,20 @@ struct ReadWorkloadLogResp {
     #[serde(skip_serializing_if = "Option::is_none")]
     end_offset: Option<u64>,
     #[serde(skip_serializing_if = "Option::is_none")]
+    start_cursor: Option<WorkloadLogCursor>,
+    #[serde(skip_serializing_if = "Option::is_none")]
+    end_cursor: Option<WorkloadLogCursor>,
+    #[serde(skip_serializing_if = "Option::is_none")]
     text: Option<String>,
 }
 
+#[derive(Debug, Clone, PartialEq, Eq, Serialize, Deserialize)]
+#[serde(deny_unknown_fields)]
+struct WorkloadLogCursor {
+    shard: String,
+    offset: u64,
+}
+
 fn ensure_positive_u64(v: u64, field: &str) -> KvResult<u64> {
     if v == 0 {
         return Err(KvError::Api(ApiError::InvalidArgument {
@@ -2991,6 +3128,8 @@ impl UserRpcHandler for ReadWorkloadLogChunkHandler {
                     file_size: None,
                     start_offset: None,
                     end_offset: None,
+                    start_cursor: None,
+                    end_cursor: None,
                     text: None,
                 };
                 return Ok(serde_json::to_vec(&resp).unwrap());
@@ -2998,111 +3137,259 @@ impl UserRpcHandler for ReadWorkloadLogChunkHandler {
         };
 
         let logical_path = self.log_dir.join(log_filename);
-        let path = resolve_readable_log_path(&logical_path).unwrap_or(logical_path.clone());
+        let make_err_resp = |err: String, file_size: Option<u64>| ReadWorkloadLogResp {
+            ok: false,
+            err: Some(err),
+            file_size,
+            start_offset: None,
+            end_offset: None,
+            start_cursor: None,
+            end_cursor: None,
+            text: None,
+        };
+
+        let (path, shard) = match req.cursor.as_ref() {
+            Some(cursor) => match workload_log_path_for_shard(&logical_path, &cursor.shard) {
+                Ok(path) => (path, cursor.shard.clone()),
+                Err(e) => {
+                    let resp = make_err_resp(format!("{}", e), None);
+                    return Ok(serde_json::to_vec(&resp).unwrap());
+                }
+            },
+            None => {
+                let Some(path) = resolve_readable_log_path(&logical_path) else {
+                    let resp = make_err_resp(
+                        format!("log file is not available yet: logical_path={}", logical_path.display()),
+                        None,
+                    );
+                    return Ok(serde_json::to_vec(&resp).unwrap());
+                };
+                let shard = match workload_log_shard_identity_from_path(&logical_path, &path) {
+                    Ok(v) => v,
+                    Err(e) => {
+                        let resp = make_err_resp(format!("{}", e), None);
+                        return Ok(serde_json::to_vec(&resp).unwrap());
+                    }
+                };
+                (path, shard)
+            }
+        };
         let meta = match std::fs::metadata(&path) {
             Ok(v) => v,
             Err(e) => {
-                let resp = ReadWorkloadLogResp {
-                    ok: false,
-                    err: Some(format!(
-                        "stat log failed: path={} err={}",
-                        path.display(),
-                        e
-                    )),
-                    file_size: None,
-                    start_offset: None,
-                    end_offset: None,
-                    text: None,
-                };
+                let resp = make_err_resp(
+                    format!("stat log failed: path={} err={}", path.display(), e),
+                    None,
+                );
                 return Ok(serde_json::to_vec(&resp).unwrap());
             }
         };
 
         let file_size = meta.len();
-        let (start, end) = match req.direction {
-            LogReadDirection::Forward => {
-                if let Some(cursor) = req.cursor {
-                    if cursor > file_size {
-                        let resp = ReadWorkloadLogResp {
-                            ok: false,
-                            err: Some(format!(
-                                "cursor out of range: cursor={} file_size={}",
-                                cursor, file_size
-                            )),
-                            file_size: Some(file_size),
-                            start_offset: None,
-                            end_offset: None,
-                            text: None,
+        let (start, end, start_cursor, end_cursor, effective_path, effective_file_size) =
+            match req.direction {
+                LogReadDirection::Forward => {
+                    if let Some(cursor) = req.cursor.as_ref() {
+                        if cursor.offset > file_size {
+                            let resp = make_err_resp(
+                                format!(
+                                    "cursor out of range: shard={} cursor={} file_size={}",
+                                    cursor.shard, cursor.offset, file_size
+                                ),
+                                Some(file_size),
+                            );
+                            return Ok(serde_json::to_vec(&resp).unwrap());
+                        }
+                        let mut effective_path = path.clone();
+                        let mut effective_shard = shard.clone();
+                        let mut effective_file_size = file_size;
+                        let mut start = cursor.offset;
+                        if cursor.offset == file_size {
+                            if let Ok(Some(next_shard)) =
+                                workload_log_next_shard(&logical_path, &cursor.shard)
+                            {
+                                let next_path = match workload_log_path_for_shard(&logical_path, &next_shard) {
+                                    Ok(v) => v,
+                                    Err(e) => {
+                                        let resp = make_err_resp(format!("{}", e), Some(file_size));
+                                        return Ok(serde_json::to_vec(&resp).unwrap());
+                                    }
+                                };
+                                match std::fs::metadata(&next_path) {
+                                    Ok(next_meta) => {
+                                        effective_file_size = next_meta.len();
+                                        effective_path = next_path;
+                                        effective_shard = next_shard;
+                                        start = 0;
+                                    }
+                                    Err(e) => {
+                                        let resp = make_err_resp(
+                                            format!(
+                                                "stat next log shard failed: path={} err={}",
+                                                next_path.display(),
+                                                e
+                                            ),
+                                            Some(file_size),
+                                        );
+                                        return Ok(serde_json::to_vec(&resp).unwrap());
+                                    }
+                                }
+                            } else if let Ok(Some(latest_shard)) =
+                                workload_log_latest_shard_identity(&logical_path)
+                            {
+                                if latest_shard != cursor.shard {
+                                    let latest_path =
+                                        match workload_log_path_for_shard(&logical_path, &latest_shard) {
+                                            Ok(v) => v,
+                                            Err(e) => {
+                                                let resp = make_err_resp(format!("{}", e), Some(file_size));
+                                                return Ok(serde_json::to_vec(&resp).unwrap());
+                                            }
+                                        };
+                                    match std::fs::metadata(&latest_path) {
+                                        Ok(latest_meta) => {
+                                            effective_file_size = latest_meta.len();
+                                            effective_path = latest_path;
+                                            effective_shard = latest_shard;
+                                            start = 0;
+                                        }
+                                        Err(e) => {
+                                            let resp = make_err_resp(
+                                                format!(
+                                                    "stat latest log shard failed: path={} err={}",
+                                                    latest_path.display(),
+                                                    e
+                                                ),
+                                                Some(file_size),
+                                            );
+                                            return Ok(serde_json::to_vec(&resp).unwrap());
+                                        }
+                                    }
+                                }
+                            }
+                        }
+                        let end = match max_bytes {
+                            Some(max_bytes) => {
+                                std::cmp::min(effective_file_size, start.saturating_add(max_bytes))
+                            }
+                            None => effective_file_size,
+                        };
+                        (
+                            start,
+                            end,
+                            Some(WorkloadLogCursor {
+                                shard: effective_shard.clone(),
+                                offset: start,
+                            }),
+                            Some(WorkloadLogCursor {
+                                shard: effective_shard.clone(),
+                                offset: end,
+                            }),
+                            effective_path,
+                            effective_file_size,
+                        )
+                    } else {
+                        let end = file_size;
+                        let start = match max_bytes {
+                            Some(max_bytes) => end.saturating_sub(max_bytes),
+                            None => 0,
                         };
+                        (
+                            start,
+                            end,
+                            Some(WorkloadLogCursor {
+                                shard: shard.clone(),
+                                offset: start,
+                            }),
+                            Some(WorkloadLogCursor {
+                                shard: shard.clone(),
+                                offset: end,
+                            }),
+                            path.clone(),
+                            file_size,
+                        )
+                    }
+                }
+                LogReadDirection::Backward => {
+                    let Some(cursor) = req.cursor.as_ref() else {
+                        let resp = make_err_resp(
+                            "cursor is required for Backward reads".to_string(),
+                            Some(file_size),
+                        );
+                        return Ok(serde_json::to_vec(&resp).unwrap());
+                    };
+                    if cursor.offset > file_size {
+                        let resp = make_err_resp(
+                            format!(
+                                "cursor out of range: shard={} cursor={} file_size={}",
+                                cursor.shard, cursor.offset, file_size
+                            ),
+                            Some(file_size),
+                        );
                         return Ok(serde_json::to_vec(&resp).unwrap());
                     }
-                    let start = cursor;
-                    let end = match max_bytes {
-                        Some(max_bytes) => {
-                            std::cmp::min(file_size, start.saturating_add(max_bytes))
+                    let mut effective_path = path.clone();
+                    let mut effective_shard = shard.clone();
+                    let mut effective_file_size = file_size;
+                    let mut end = cursor.offset;
+                    if cursor.offset == 0 {
+                        if let Ok(Some(prev_shard)) =
+                            workload_log_previous_shard(&logical_path, &cursor.shard)
+                        {
+                            let prev_path = match workload_log_path_for_shard(&logical_path, &prev_shard) {
+                                Ok(v) => v,
+                                Err(e) => {
+                                    let resp = make_err_resp(format!("{}", e), Some(file_size));
+                                    return Ok(serde_json::to_vec(&resp).unwrap());
+                                }
+                            };
+                            match std::fs::metadata(&prev_path) {
+                                Ok(prev_meta) => {
+                                    effective_file_size = prev_meta.len();
+                                    effective_path = prev_path;
+                                    effective_shard = prev_shard;
+                                    end = effective_file_size;
+                                }
+                                Err(e) => {
+                                    let resp = make_err_resp(
+                                        format!(
+                                            "stat previous log shard failed: path={} err={}",
+                                            prev_path.display(),
+                                            e
+                                        ),
+                                        Some(file_size),
+                                    );
+                                    return Ok(serde_json::to_vec(&resp).unwrap());
+                                }
+                            }
                         }
-                        None => file_size,
-                    };
-                    (start, end)
-                } else {
-                    // Tail:
-                    // - max_bytes=Some => return the last max_bytes bytes.
-                    // - max_bytes=None => return the whole file.
-                    let end = file_size;
+                    }
                     let start = match max_bytes {
                         Some(max_bytes) => end.saturating_sub(max_bytes),
                         None => 0,
                     };
-                    (start, end)
-                }
-            }
-            LogReadDirection::Backward => {
-                let Some(cursor) = req.cursor else {
-                    let resp = ReadWorkloadLogResp {
-                        ok: false,
-                        err: Some("cursor is required for Backward reads".to_string()),
-                        file_size: Some(file_size),
-                        start_offset: None,
-                        end_offset: None,
-                        text: None,
-                    };
-                    return Ok(serde_json::to_vec(&resp).unwrap());
-                };
-                if cursor > file_size {
-                    let resp = ReadWorkloadLogResp {
-                        ok: false,
-                        err: Some(format!(
-                            "cursor out of range: cursor={} file_size={}",
-                            cursor, file_size
-                        )),
-                        file_size: Some(file_size),
-                        start_offset: None,
-                        end_offset: None,
-                        text: None,
-                    };
-                    return Ok(serde_json::to_vec(&resp).unwrap());
+                    (
+                        start,
+                        end,
+                        Some(WorkloadLogCursor {
+                            shard: effective_shard.clone(),
+                            offset: start,
+                        }),
+                        Some(WorkloadLogCursor {
+                            shard: effective_shard.clone(),
+                            offset: end,
+                        }),
+                        effective_path,
+                        effective_file_size,
+                    )
                 }
-                let end = cursor;
-                let start = match max_bytes {
-                    Some(max_bytes) => end.saturating_sub(max_bytes),
-                    None => 0,
-                };
-                (start, end)
-            }
-        };
+            };
 
         if end < start {
-            let resp = ReadWorkloadLogResp {
-                ok: false,
-                err: Some(format!(
-                    "internal error: end < start: start={} end={}",
-                    start, end
-                )),
-                file_size: Some(file_size),
-                start_offset: None,
-                end_offset: None,
-                text: None,
-            };
+            let resp = make_err_resp(
+                format!("internal error: end < start: start={} end={}", start, end),
+                Some(effective_file_size),
+            );
             return Ok(serde_json::to_vec(&resp).unwrap());
         }
 
@@ -3114,70 +3401,42 @@ impl UserRpcHandler for ReadWorkloadLogChunkHandler {
         })?;
         if let Some(max_bytes_usize) = max_bytes_usize {
             if len > max_bytes_usize {
-                let resp = ReadWorkloadLogResp {
-                    ok: false,
-                    err: Some(format!(
+                let resp = make_err_resp(
+                    format!(
                         "internal error: computed read_len exceeds max_bytes: read_len={} max_bytes={}",
                         len, max_bytes_usize
-                    )),
-                    file_size: Some(file_size),
-                    start_offset: None,
-                    end_offset: None,
-                    text: None,
-                };
+                    ),
+                    Some(effective_file_size),
+                );
                 return Ok(serde_json::to_vec(&resp).unwrap());
             }
         }
 
-        let mut f = match std::fs::File::open(&path) {
+        let mut f = match std::fs::File::open(&effective_path) {
             Ok(v) => v,
             Err(e) => {
-                let resp = ReadWorkloadLogResp {
-                    ok: false,
-                    err: Some(format!(
-                        "open log failed: path={} err={}",
-                        path.display(),
-                        e
-                    )),
-                    file_size: Some(file_size),
-                    start_offset: None,
-                    end_offset: None,
-                    text: None,
-                };
+                let resp = make_err_resp(
+                    format!("open log failed: path={} err={}", effective_path.display(), e),
+                    Some(effective_file_size),
+                );
                 return Ok(serde_json::to_vec(&resp).unwrap());
             }
         };
 
         if let Err(e) = std::io::Seek::seek(&mut f, std::io::SeekFrom::Start(start)) {
-            let resp = ReadWorkloadLogResp {
-                ok: false,
-                err: Some(format!(
-                    "seek log failed: path={} err={}",
-                    path.display(),
-                    e
-                )),
-                file_size: Some(file_size),
-                start_offset: None,
-                end_offset: None,
-                text: None,
-            };
+            let resp = make_err_resp(
+                format!("seek log failed: path={} err={}", effective_path.display(), e),
+                Some(effective_file_size),
+            );
             return Ok(serde_json::to_vec(&resp).unwrap());
         }
 
         let mut buf: Vec<u8> = vec![0; len];
         if let Err(e) = std::io::Read::read_exact(&mut f, &mut buf) {
-            let resp = ReadWorkloadLogResp {
-                ok: false,
-                err: Some(format!(
-                    "read log failed: path={} err={}",
-                    path.display(),
-                    e
-                )),
-                file_size: Some(file_size),
-                start_offset: None,
-                end_offset: None,
-                text: None,
-            };
+            let resp = make_err_resp(
+                format!("read log failed: path={} err={}", effective_path.display(), e),
+                Some(effective_file_size),
+            );
             return Ok(serde_json::to_vec(&resp).unwrap());
         }
 
@@ -3190,9 +3449,11 @@ impl UserRpcHandler for ReadWorkloadLogChunkHandler {
         let resp = ReadWorkloadLogResp {
             ok: true,
             err: None,
-            file_size: Some(file_size),
+            file_size: Some(effective_file_size),
             start_offset: Some(start),
             end_offset: Some(end),
+            start_cursor,
+            end_cursor,
             text: Some(text),
         };
         Ok(serde_json::to_vec(&resp).unwrap())
@@ -8391,20 +8652,22 @@ async function deleteGenerationFromControl() {
 		const LOG_DIR_FORWARD = 'Forward';
 		const LOG_DIR_BACKWARD = 'Backward';
 
-		let workloadLogTimer = null;
-		let workloadLogSelection = { instanceKey: '', kind: '', name: '' };
-		let workloadLogStartOffset = 0;
-		let workloadLogEndOffset = 0;
-		let workloadLogLoadingOlder = false;
-		let workloadLogAnsiState = newAnsiSgrState();
+			let workloadLogTimer = null;
+			let workloadLogSelection = { instanceKey: '', kind: '', name: '' };
+			let workloadLogStartOffset = 0;
+			let workloadLogEndOffset = 0;
+			let workloadLogStartCursor = null;
+			let workloadLogEndCursor = null;
+			let workloadLogLoadingOlder = false;
+			let workloadLogAnsiState = newAnsiSgrState();
 
 		function isWorkloadLogFollowEnabled() {
 		  const cb = document.getElementById('workload_log_follow');
 		  return cb && cb.checked === true;
 		}
 
-		function setWorkloadLogHeader() {
-		  const h = document.getElementById('workload_log_header');
+			function setWorkloadLogHeader() {
+			  const h = document.getElementById('workload_log_header');
 		  const ik = workloadLogSelection.instanceKey || '';
 		  const kind = workloadLogSelection.kind || '';
 		  const name = workloadLogSelection.name || '';
@@ -8412,10 +8675,14 @@ async function deleteGenerationFromControl() {
 		  if (!ik || !kind || !name) {
 		    h.textContent = 'No log selected. Click "Logs" in the table.';
 		    return;
-		  }
-		  h.textContent = 'instance_key=' + ik + ' workload=' + kind + '/' + name
-		    + ' range=[' + String(workloadLogStartOffset) + ',' + String(workloadLogEndOffset) + ')';
-		}
+			  }
+			  const shardText = (workloadLogEndCursor && workloadLogEndCursor.shard)
+			    ? String(workloadLogEndCursor.shard)
+			    : ((workloadLogStartCursor && workloadLogStartCursor.shard) ? String(workloadLogStartCursor.shard) : '-');
+			  h.textContent = 'instance_key=' + ik + ' workload=' + kind + '/' + name
+			    + ' shard=' + shardText
+			    + ' range=[' + String(workloadLogStartOffset) + ',' + String(workloadLogEndOffset) + ')';
+			}
 
 		function stopWorkloadLogTail() {
 		  if (workloadLogTimer != null) {
@@ -8424,12 +8691,14 @@ async function deleteGenerationFromControl() {
 		  }
 		}
 
-		function clearWorkloadLogView() {
-		  stopWorkloadLogTail();
-		  workloadLogStartOffset = 0;
-		  workloadLogEndOffset = 0;
-		  workloadLogLoadingOlder = false;
-		  workloadLogAnsiState = newAnsiSgrState();
+			function clearWorkloadLogView() {
+			  stopWorkloadLogTail();
+			  workloadLogStartOffset = 0;
+			  workloadLogEndOffset = 0;
+			  workloadLogStartCursor = null;
+			  workloadLogEndCursor = null;
+			  workloadLogLoadingOlder = false;
+			  workloadLogAnsiState = newAnsiSgrState();
 		  setWorkloadLogHeader();
 		  const pre = document.getElementById('workload_log_out');
 		  if (pre) { pre.textContent = '(empty)'; }
@@ -8485,11 +8754,13 @@ async function deleteGenerationFromControl() {
 		    return;
 		  }
 
-		  const txt = (v.text != null) ? String(v.text) : '';
-		  workloadLogStartOffset = (v.start_offset != null) ? Number(v.start_offset) : 0;
-		  workloadLogEndOffset = (v.end_offset != null) ? Number(v.end_offset) : workloadLogStartOffset;
-		  workloadLogLoadingOlder = false;
-		  setWorkloadLogHeader();
+			  const txt = (v.text != null) ? String(v.text) : '';
+			  workloadLogStartOffset = (v.start_offset != null) ? Number(v.start_offset) : 0;
+			  workloadLogEndOffset = (v.end_offset != null) ? Number(v.end_offset) : workloadLogStartOffset;
+			  workloadLogStartCursor = (v.start_cursor != null) ? v.start_cursor : null;
+			  workloadLogEndCursor = (v.end_cursor != null) ? v.end_cursor : null;
+			  workloadLogLoadingOlder = false;
+			  setWorkloadLogHeader();
 
 		  if (pre) {
 		    const r = ansiSgrToHtmlChunkWithState(txt, workloadLogAnsiState);
@@ -8509,8 +8780,8 @@ async function deleteGenerationFromControl() {
 		      return;
 		    }
 
-		    const v2 = await fetchWorkloadLogChunk(LOG_DIR_FORWARD, workloadLogEndOffset);
-		    if (!v2 || v2.ok !== true) {
+			    const v2 = await fetchWorkloadLogChunk(LOG_DIR_FORWARD, workloadLogEndCursor);
+			    if (!v2 || v2.ok !== true) {
 		      // Keep the existing view; update the header so operators see the error.
 		      const h = document.getElementById('workload_log_header');
 		      if (h) {
@@ -8518,12 +8789,15 @@ async function deleteGenerationFromControl() {
 		        h.textContent = 'log tail ERROR: ' + err;
 		      }
 		      return;
-		    }
-		    const txt2 = (v2.text != null) ? String(v2.text) : '';
-		    const newEnd = (v2.end_offset != null) ? Number(v2.end_offset) : workloadLogEndOffset;
-		    if (newEnd < workloadLogEndOffset) {
-		      const h = document.getElementById('workload_log_header');
-		      if (h) {
+			    }
+			    const txt2 = (v2.text != null) ? String(v2.text) : '';
+			    const newEnd = (v2.end_offset != null) ? Number(v2.end_offset) : workloadLogEndOffset;
+			    const newEndCursor = (v2.end_cursor != null) ? v2.end_cursor : workloadLogEndCursor;
+			    const sameShard = workloadLogEndCursor && newEndCursor
+			      && workloadLogEndCursor.shard === newEndCursor.shard;
+			    if (sameShard && newEnd < workloadLogEndOffset) {
+			      const h = document.getElementById('workload_log_header');
+			      if (h) {
 		        h.textContent = 'log tail ERROR: end_offset moved backwards (file truncated/rotated?)'
 		          + ' old_end=' + String(workloadLogEndOffset)
 		          + ' new_end=' + String(newEnd);
@@ -8532,21 +8806,26 @@ async function deleteGenerationFromControl() {
 		      return;
 		    }
 
-		    if (txt2.length > 0) {
-		      const r2 = ansiSgrToHtmlChunkWithState(txt2, workloadLogAnsiState);
-		      workloadLogAnsiState = r2.state;
-		      pre2.insertAdjacentHTML('beforeend', r2.html);
-		      workloadLogEndOffset = newEnd;
-		      setWorkloadLogHeader();
+			    if (txt2.length > 0) {
+			      const r2 = ansiSgrToHtmlChunkWithState(txt2, workloadLogAnsiState);
+			      workloadLogAnsiState = r2.state;
+			      pre2.insertAdjacentHTML('beforeend', r2.html);
+			      workloadLogEndOffset = newEnd;
+			      workloadLogEndCursor = newEndCursor;
+			      if (v2.start_cursor != null && workloadLogStartCursor == null) {
+			        workloadLogStartCursor = v2.start_cursor;
+			      }
+			      setWorkloadLogHeader();
 		      if (follow || atBottom) {
 		        pre2.scrollTop = pre2.scrollHeight;
 		      }
-		    } else {
-		      workloadLogEndOffset = newEnd;
-		      setWorkloadLogHeader();
-		    }
-		  }, WORKLOAD_LOG_POLL_INTERVAL_MS);
-		}
+			    } else {
+			      workloadLogEndOffset = newEnd;
+			      workloadLogEndCursor = newEndCursor;
+			      setWorkloadLogHeader();
+			    }
+			  }, WORKLOAD_LOG_POLL_INTERVAL_MS);
+			}
 
 		async function loadOlderWorkloadLog() {
 		  if (workloadLogLoadingOlder) { return; }
@@ -8556,39 +8835,46 @@ async function deleteGenerationFromControl() {
 		    pre.textContent = 'ERROR: no log selected.';
 		    return;
 		  }
-		  if (workloadLogStartOffset <= 0) {
-		    return;
-		  }
-		  workloadLogLoadingOlder = true;
-		  const beforeHeight = pre.scrollHeight;
-		  const v = await fetchWorkloadLogChunk(LOG_DIR_BACKWARD, workloadLogStartOffset);
-		  if (!v || v.ok !== true) {
+			  if (workloadLogStartCursor == null) {
+			    return;
+			  }
+			  workloadLogLoadingOlder = true;
+			  const beforeHeight = pre.scrollHeight;
+			  const v = await fetchWorkloadLogChunk(LOG_DIR_BACKWARD, workloadLogStartCursor);
+			  if (!v || v.ok !== true) {
 		    const err = v && v.err ? String(v.err) : 'unknown error';
 		    pre.insertAdjacentText('afterbegin', 'ERROR: ' + err + '\n\n');
 		    workloadLogLoadingOlder = false;
 		    return;
-		  }
-		  const txt = (v.text != null) ? String(v.text) : '';
-		  const newStart = (v.start_offset != null) ? Number(v.start_offset) : workloadLogStartOffset;
-		  if (txt.length > 0) {
+			  }
+			  const txt = (v.text != null) ? String(v.text) : '';
+			  const newStart = (v.start_offset != null) ? Number(v.start_offset) : workloadLogStartOffset;
+			  const newStartCursor = (v.start_cursor != null) ? v.start_cursor : workloadLogStartCursor;
+			  if (txt.length > 0) {
 		    // English note: prepend is stateless; this is best-effort because boundary SGR state
 		    // cannot be re-applied to already-rendered newer content.
 		    pre.insertAdjacentHTML('afterbegin', ansiSgrToHtmlChunkStateless(txt));
-		  }
-		  workloadLogStartOffset = newStart;
-		  setWorkloadLogHeader();
+			  }
+			  workloadLogStartOffset = newStart;
+			  workloadLogStartCursor = newStartCursor;
+			  if (v.end_cursor != null) {
+			    workloadLogEndCursor = workloadLogEndCursor || v.end_cursor;
+			  }
+			  setWorkloadLogHeader();
 
 		  const afterHeight = pre.scrollHeight;
 		  pre.scrollTop = (afterHeight - beforeHeight) + pre.scrollTop;
 		  workloadLogLoadingOlder = false;
 		}
 
-		function openWorkloadLog(instanceKey, kind, name) {
-		  workloadLogSelection = { instanceKey: String(instanceKey || ''), kind: String(kind || ''), name: String(name || '') };
-		  workloadLogStartOffset = 0;
-		  workloadLogEndOffset = 0;
-		  workloadLogLoadingOlder = false;
-		  setWorkloadLogHeader();
+			function openWorkloadLog(instanceKey, kind, name) {
+			  workloadLogSelection = { instanceKey: String(instanceKey || ''), kind: String(kind || ''), name: String(name || '') };
+			  workloadLogStartOffset = 0;
+			  workloadLogEndOffset = 0;
+			  workloadLogStartCursor = null;
+			  workloadLogEndCursor = null;
+			  workloadLogLoadingOlder = false;
+			  setWorkloadLogHeader();
 		  const pre = document.getElementById('workload_log_out');
 		  if (pre) { pre.textContent = 'Selected. Click Tail to start.'; }
 		  startWorkloadLogTail();
@@ -10337,7 +10623,7 @@ struct WorkloadLogHttpReq {
     kind: WorkloadKind,
     name: String,
     direction: LogReadDirection,
-    cursor: Option<u64>,
+    cursor: Option<WorkloadLogCursor>,
     #[serde(skip_serializing_if = "Option::is_none")]
     max_bytes: Option<u64>,
 }
@@ -10355,6 +10641,8 @@ async fn handle_workload_log(
             file_size: None,
             start_offset: None,
             end_offset: None,
+            start_cursor: None,
+            end_cursor: None,
             text: None,
         };
         return Ok(response_json(StatusCode::BAD_REQUEST, &resp));
@@ -10371,6 +10659,8 @@ async fn handle_workload_log(
             file_size: None,
             start_offset: None,
             end_offset: None,
+            start_cursor: None,
+            end_cursor: None,
             text: None,
         };
         return Ok(response_json(StatusCode::BAD_REQUEST, &resp));
@@ -10415,6 +10705,8 @@ async fn handle_workload_log(
                 file_size: None,
                 start_offset: None,
                 end_offset: None,
+                start_cursor: None,
+                end_cursor: None,
                 text: None,
             };
             Ok(response_json(StatusCode::BAD_GATEWAY, &resp))
@@ -14846,4 +15138,94 @@ mod tests {
             Some("workload__Deployment__demo.2026-06-20.log")
         );
     }
+
+    #[test]
+    fn read_workload_log_forward_cursor_rolls_into_next_shard() {
+        let td = tempfile::tempdir().unwrap();
+        let log_dir = td.path().to_path_buf();
+        std::fs::write(
+            log_dir.join("workload__Deployment__demo.2026-06-19.log"),
+            "old\n",
+        )
+        .unwrap();
+        std::fs::write(
+            log_dir.join("workload__Deployment__demo.2026-06-20.log"),
+            "new\n",
+        )
+        .unwrap();
+        let handler = ReadWorkloadLogChunkHandler { log_dir };
+        let req = ReadWorkloadLogReq {
+            kind: WorkloadKind::Deployment,
+            name: "demo".to_string(),
+            direction: LogReadDirection::Forward,
+            cursor: Some(WorkloadLogCursor {
+                shard: "2026-06-19".to_string(),
+                offset: 4,
+            }),
+            max_bytes: Some(65536),
+        };
+        let raw = handler.handle("n1".into(), &serde_json::to_vec(&req).unwrap()).unwrap();
+        let resp: ReadWorkloadLogResp = serde_json::from_slice(&raw).unwrap();
+        assert!(resp.ok, "{resp:?}");
+        assert_eq!(resp.text.as_deref(), Some("new\n"));
+        assert_eq!(
+            resp.start_cursor,
+            Some(WorkloadLogCursor {
+                shard: "2026-06-20".to_string(),
+                offset: 0,
+            })
+        );
+        assert_eq!(
+            resp.end_cursor,
+            Some(WorkloadLogCursor {
+                shard: "2026-06-20".to_string(),
+                offset: 4,
+            })
+        );
+    }
+
+    #[test]
+    fn read_workload_log_backward_cursor_rolls_into_previous_shard() {
+        let td = tempfile::tempdir().unwrap();
+        let log_dir = td.path().to_path_buf();
+        std::fs::write(
+            log_dir.join("workload__Deployment__demo.2026-06-19.log"),
+            "old\n",
+        )
+        .unwrap();
+        std::fs::write(
+            log_dir.join("workload__Deployment__demo.2026-06-20.log"),
+            "new\n",
+        )
+        .unwrap();
+        let handler = ReadWorkloadLogChunkHandler { log_dir };
+        let req = ReadWorkloadLogReq {
+            kind: WorkloadKind::Deployment,
+            name: "demo".to_string(),
+            direction: LogReadDirection::Backward,
+            cursor: Some(WorkloadLogCursor {
+                shard: "2026-06-20".to_string(),
+                offset: 0,
+            }),
+            max_bytes: Some(65536),
+        };
+        let raw = handler.handle("n1".into(), &serde_json::to_vec(&req).unwrap()).unwrap();
+        let resp: ReadWorkloadLogResp = serde_json::from_slice(&raw).unwrap();
+        assert!(resp.ok, "{resp:?}");
+        assert_eq!(resp.text.as_deref(), Some("old\n"));
+        assert_eq!(
+            resp.start_cursor,
+            Some(WorkloadLogCursor {
+                shard: "2026-06-19".to_string(),
+                offset: 0,
+            })
+        );
+        assert_eq!(
+            resp.end_cursor,
+            Some(WorkloadLogCursor {
+                shard: "2026-06-19".to_string(),
+                offset: 4,
+            })
+        );
+    }
 }

From ea49f593624981dde54f22d23e7535fba82249a4 Mon Sep 17 00:00:00 2001
From: ActivePeter <1020401660@qq.com>
Date: Wed, 24 Jun 2026 19:23:09 +0800
Subject: [PATCH 13/13] test

---
 deployment/deployconf.yaml                    |  54 ++--
 deployment/tests/test_gen_k8s_daemonset.py    |  11 +-
 deployment/utils/deployconf_config_utils.py   |  13 +-
 examples/external_put_get_del.py              |   6 +-
 examples/fluxon_quick_start/start.py          |  55 ++--
 examples/rpc_call.py                          |   6 +-
 examples/start_kv_and_fs_svc.py               |  16 +-
 examples/start_master_owner.py                |  10 +-
 examples/start_mpmc_demo.py                   |   9 +-
 ...15\347\275\256\346\200\273\350\247\210.md" |  16 +-
 ...74\345\207\272\351\223\276\350\267\257.md" |  14 +-
 ...04\345\222\214\346\246\202\345\277\265.md" |   4 +-
 ...15\345\212\241\345\271\263\351\235\242.md" |  10 +-
 ...7 - 3 - KV-RPC\346\216\245\345\217\243.md" |  47 ++--
 ...0\267 - 4 - MQ\346\216\245\345\217\243.md" |  24 +-
 ...0\267 - 5 - FS\346\216\245\345\217\243.md" |  26 +-
 .../User - 1 - Architecture and Concepts.md   |   8 +-
 .../User - 3 - KV and RPC Interface.md        |  37 +--
 .../user_doc/User - 4 - MQ Interface.md       |   6 +-
 .../user_doc/User - 5 - FS Interface.md       |   3 +-
 fluxon_py/_api_ext_chan/mpmc.py               |   8 +-
 fluxon_py/config.py                           |  16 +-
 fluxon_py/kvclient/fluxon.py                  |  17 ++
 fluxon_py/kvclient/kvclient_interface.py      |   3 +
 fluxon_py/kvclient/mooncake.py                |   6 +
 fluxon_py/logging.py                          |  14 +-
 .../tests/fluxon_fs_transfer_tikv_support.py  |  18 +-
 .../test_mpmc_simple_bench.py                 |  98 +++----
 .../test_mpmc_simple_bench2.py                |   4 +-
 .../tests/test_backend_fallback_close.py      |   3 +
 ...est_backend_relay_deployconf.template.yaml |  12 +-
 fluxon_py/tests/test_backend_relay_docker.py  |  65 ++---
 fluxon_py/tests/test_config.py                |  16 +-
 fluxon_py/tests/test_config.yaml              |   3 +-
 fluxon_py/tests/test_fluxon_fs_patcher.py     |   9 +-
 .../tests/test_fluxon_fs_remote_mount.py      |  12 +-
 fluxon_py/tests/test_lib.py                   |  14 +-
 .../tests/test_mq/test_example_ctrl_c_exit.py |  36 ++-
 .../kvcli_example_client_config1.yaml         |   2 +-
 .../kvcli_example_client_config2.yaml         |   2 +-
 .../fluxon_kv/src/client_seg_pool/mod.rs      |  97 +++----
 fluxon_rs/fluxon_kv/src/config.rs             | 117 +++-----
 .../external_client_test.rs                   |   9 +-
 .../fluxon_kv/src/external_client_api/mod.rs  |  99 +++----
 fluxon_rs/fluxon_kv/src/kv_test.rs            |  94 ++-----
 fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs    |   6 +-
 fluxon_rs/fluxon_kv/src/lib.rs                | 256 ++++++------------
 .../fluxon_kv/src/memholder/memholder_test.rs |   8 +-
 fluxon_rs/fluxon_pyo3/src/lib.rs              |  30 +-
 fluxon_test_stack/benchmark_full_matrix.yaml  |   2 +-
 fluxon_test_stack/ci_test_list.yaml           |   2 +-
 fluxon_test_stack/deployconf_testbed.yml      |  35 +--
 fluxon_test_stack/test_runner.py              | 236 +++++-----------
 .../test_runner_runtime_backend.py            |  24 +-
 .../test_test_runner_testbed_contract.py      |  26 +-
 setup_and_pack/utils/repo_config_utils.py     |  26 +-
 56 files changed, 649 insertions(+), 1151 deletions(-)

diff --git a/deployment/deployconf.yaml b/deployment/deployconf.yaml
index b0c67b2..3000ffe 100644
--- a/deployment/deployconf.yaml
+++ b/deployment/deployconf.yaml
@@ -81,13 +81,9 @@ global_envs:
   #   printf "[global]\nindex-url = https://pypi.tuna.tsinghua.edu.cn/simple\n" > ~/.pip/pip.conf;
   FLUXON_CLUSTER_NAME: "fluxon-example-cluster"
   FLUXON_SHARED_MEM: "${HOSTWORKDIR}/shm1"
-  FLUXON_SHARED_FILE: "${HOSTWORKDIR}/shm1_files"
   FLUXON_SHARED_MEM2: "${HOSTWORKDIR}/shm2"
-  FLUXON_SHARED_FILE2: "${HOSTWORKDIR}/shm2_files"
   FLUXON_SHARED_MEM_RELAY: "${HOSTWORKDIR}/shm3"
-  FLUXON_SHARED_FILE_RELAY: "${HOSTWORKDIR}/shm3_files"
   FLUXON_SHARED_MEM_RELAY2: "${HOSTWORKDIR}/shm4"
-  FLUXON_SHARED_FILE_RELAY2: "${HOSTWORKDIR}/shm4_files"
   # Enable pprof by setting seconds > 0; empty means disabled.
   FLUXON_PPROF_DURATION_SECONDS: ""
 
@@ -328,8 +324,7 @@ service:
           etcd_addresses:
           - "${ETCD_FULL_ADDRESS}"
           cluster_name: "${FLUXON_CLUSTER_NAME}"
-          shared_memory_path: "${FLUXON_SHARED_MEM}"
-          shared_file_path: "${FLUXON_SHARED_FILE}"
+          share_mem_path: "${FLUXON_SHARED_MEM}"
           # redis_compat:
           #   listen_addr: "0.0.0.0:16379"
           sub_cluster: "producer_side"
@@ -375,8 +370,7 @@ service:
           etcd_addresses:
           - "${ETCD_FULL_ADDRESS}"
           cluster_name: "${FLUXON_CLUSTER_NAME}"
-          shared_memory_path: "${FLUXON_SHARED_MEM2}"
-          shared_file_path: "${FLUXON_SHARED_FILE2}"
+          share_mem_path: "${FLUXON_SHARED_MEM2}"
           sub_cluster: "consumer_side"
       YAML
       # export UCX_LOG_LEVEL=info
@@ -397,15 +391,14 @@ service:
 
       cd "${FLUXON_SRC_ROOT}/examples"
       WORKDIR="./fluxon_work/fluxon_fs_master_work"
-      mkdir -p "${WORKDIR}" "${FLUXON_SHARED_MEM}" "${FLUXON_SHARED_FILE}"
+      mkdir -p "${WORKDIR}" "${FLUXON_SHARED_MEM}"
 
       cat > "all_config.yaml" <<YAML
       kvclient:
         instance_key: "fluxon_fs_master"
         fluxonkv_spec:
           cluster_name: "${FLUXON_CLUSTER_NAME}"
-          shared_memory_path: "${FLUXON_SHARED_MEM}"
-          shared_file_path: "${FLUXON_SHARED_FILE}"
+          share_mem_path: "${FLUXON_SHARED_MEM}"
       fluxon_fs:
         master:
           instance_key: "fluxon_fs_master"
@@ -459,15 +452,14 @@ service:
 
       cd "${FLUXON_SRC_ROOT}/examples"
       WORKDIR="./fluxon_work/fluxon_fs_writer_work"
-      mkdir -p "${WORKDIR}" "${HOSTWORKDIR}/fluxon_fs_export_root" "${HOSTWORKDIR}/fluxon_fs_local_shared" "${FLUXON_SHARED_MEM}" "${FLUXON_SHARED_FILE}"
+      mkdir -p "${WORKDIR}" "${HOSTWORKDIR}/fluxon_fs_export_root" "${HOSTWORKDIR}/fluxon_fs_local_shared" "${FLUXON_SHARED_MEM}"
 
       cat > "all_config.yaml" <<YAML
       kvclient:
         instance_key: "fluxon_fs_writer"
         fluxonkv_spec:
           cluster_name: "${FLUXON_CLUSTER_NAME}"
-          shared_memory_path: "${FLUXON_SHARED_MEM}"
-          shared_file_path: "${FLUXON_SHARED_FILE}"
+          share_mem_path: "${FLUXON_SHARED_MEM}"
       fluxon_fs:
         cache:
           stale_window_ms: 5000
@@ -512,15 +504,14 @@ service:
 
       cd "${FLUXON_SRC_ROOT}/examples"
       WORKDIR="./fluxon_work/fluxon_fs_reader_work"
-      mkdir -p "${WORKDIR}" "${HOSTWORKDIR}/fluxon_fs_local_shared" "${FLUXON_SHARED_MEM}" "${FLUXON_SHARED_FILE}"
+      mkdir -p "${WORKDIR}" "${HOSTWORKDIR}/fluxon_fs_local_shared" "${FLUXON_SHARED_MEM}"
 
       cat > "all_config.yaml" <<YAML
       kvclient:
         instance_key: "fluxon_fs_reader"
         fluxonkv_spec:
           cluster_name: "${FLUXON_CLUSTER_NAME}"
-          shared_memory_path: "${FLUXON_SHARED_MEM}"
-          shared_file_path: "${FLUXON_SHARED_FILE}"
+          share_mem_path: "${FLUXON_SHARED_MEM}"
       fluxon_fs:
         master:
           instance_key: "fluxon_fs_master"
@@ -584,8 +575,7 @@ service:
           etcd_addresses:
           - "${ETCD_FULL_ADDRESS}"
           cluster_name: "${FLUXON_CLUSTER_NAME}"
-          shared_memory_path: "${FLUXON_SHARED_MEM_RELAY}"
-          shared_file_path: "${FLUXON_SHARED_FILE_RELAY}"
+          share_mem_path: "${FLUXON_SHARED_MEM_RELAY}"
           p2p_listen_port: 31001
           sub_cluster: "relay"
       YAML
@@ -622,8 +612,7 @@ service:
           etcd_addresses:
           - "${ETCD_FULL_ADDRESS}"
           cluster_name: "${FLUXON_CLUSTER_NAME}"
-          shared_memory_path: "${FLUXON_SHARED_MEM_RELAY2}"
-          shared_file_path: "${FLUXON_SHARED_FILE_RELAY2}"
+          share_mem_path: "${FLUXON_SHARED_MEM_RELAY2}"
           p2p_listen_port: 31002
           sub_cluster: "relay"
       YAML
@@ -653,8 +642,7 @@ service:
         instance_key: mpmc_demo_producer_base
         fluxonkv_spec:
           cluster_name: "${FLUXON_CLUSTER_NAME}"
-          shared_memory_path: "${FLUXON_SHARED_MEM}"
-          shared_file_path: "${FLUXON_SHARED_FILE}"
+          share_mem_path: "${FLUXON_SHARED_MEM}"
       mpmc_demo:
         key: demo_mpmc
         capacity: 20
@@ -726,8 +714,7 @@ service:
         instance_key: mpmc_demo_consumer_base
         fluxonkv_spec:
           cluster_name: "${FLUXON_CLUSTER_NAME}"
-          shared_memory_path: "${FLUXON_SHARED_MEM2}"
-          shared_file_path: "${FLUXON_SHARED_FILE2}"
+          share_mem_path: "${FLUXON_SHARED_MEM2}"
       mpmc_demo:
         key: demo_mpmc
         capacity: 20
@@ -812,8 +799,7 @@ service:
         kvexternal:
           fluxonkv_spec:
             cluster_name: "${FLUXON_CLUSTER_NAME}"
-            shared_memory_path: "${FLUXON_SHARED_MEM}"
-            shared_file_path: "${FLUXON_SHARED_FILE}"
+            share_mem_path: "${FLUXON_SHARED_MEM}"
         db_path: ./xfer_panel.sqlite3
         bootstrap_admin:
           username: admin
@@ -859,8 +845,7 @@ service:
         kvexternal:
           fluxonkv_spec:
             cluster_name: "${FLUXON_CLUSTER_NAME}"
-            shared_memory_path: "${FLUXON_SHARED_MEM2}"
-            shared_file_path: "${FLUXON_SHARED_FILE2}"
+            share_mem_path: "${FLUXON_SHARED_MEM2}"
         http:
           listen_addr: 0.0.0.0
           port: ${XFER_WEBPANEL__PORT}
@@ -902,9 +887,7 @@ service:
       ETCD = os.environ['ETCD_FULL_ADDRESS']
       CLUSTER_NAME = os.environ['FLUXON_CLUSTER_NAME']
       SHARED_MEM = os.environ['FLUXON_SHARED_MEM']
-      SHARED_FILE = os.environ['FLUXON_SHARED_FILE']
       SHARED_MEM2 = os.environ['FLUXON_SHARED_MEM2']
-      SHARED_FILE2 = os.environ['FLUXON_SHARED_FILE2']
       # Addresses from injected env tokens (no hardcoding)
       METADATA_IP = os.environ.get('MOONCAKE_METADATA__NODE_ID__IP')
       MASTER_IP = os.environ.get('MASTER__NODE_ID__IP')
@@ -939,8 +922,7 @@ service:
           'contribute_to_cluster_pool_size': {'dram': 0, 'vram': {}},
           'fluxonkv_spec': {
               'cluster_name': CLUSTER_NAME,
-              'shared_memory_path': SHARED_MEM,
-              'shared_file_path': SHARED_FILE,
+              'share_mem_path': SHARED_MEM,
           },
               # 如果需要切 mooncake，可以在这里启用 mooncake_spec
               # 'mooncake_spec': {
@@ -967,7 +949,7 @@ service:
                   'kv': {'instance_key': 'bench2', 'fluxonkv_spec': {
                        'etcd_addresses': [ETCD],
                        'cluster_name': CLUSTER_NAME,
-                       'shared_memory_path': SHARED_MEM2,
+                       'share_mem_path': SHARED_MEM2,
                    }},
                   'mq_role': 'consumer',
                   # 'mq': {'weight': 1.0},
@@ -976,7 +958,7 @@ service:
               #     'kv': {'instance_key': 'bench3', 'fluxonkv_spec': {
               #         'etcd_addresses': [ETCD],
               #         'cluster_name': CLUSTER_NAME,
-              #         'shared_memory_path': SHARED_MEM2,
+              #         'share_mem_path': SHARED_MEM2,
               #     }},
               #     'mq_role': 'consumer',
               #     # 'mq': {'weight': 1.0},
@@ -989,7 +971,7 @@ service:
               #     'kv': {'instance_key': 'bench5', 'fluxonkv_spec': {
               #         'etcd_addresses': [ETCD],
               #         'cluster_name': CLUSTER_NAME,
-              #         'shared_memory_path': SHARED_MEM2,
+              #         'share_mem_path': SHARED_MEM2,
               #     }},
               #     'mq_role': 'consumer',
               # }
diff --git a/deployment/tests/test_gen_k8s_daemonset.py b/deployment/tests/test_gen_k8s_daemonset.py
index 2cd769e..35fae5a 100644
--- a/deployment/tests/test_gen_k8s_daemonset.py
+++ b/deployment/tests/test_gen_k8s_daemonset.py
@@ -190,7 +190,6 @@ def test_ops_entrypoints_use_direct_scripts() -> None:
                   FLUXON_PIP_CONF_CMD: "true"
                   FLUXON_RELEASE_WHEEL_FETCH_CMD: "true"
                   FLUXON_SHARED_MEM: "${HOSTWORKDIR}/shm1"
-                  FLUXON_SHARED_FILE: "${HOSTWORKDIR}/shm1_files"
                   ETCD_FULL_ADDRESS: "127.0.0.1:33579"
                   FLUXON_CLUSTER_NAME: "fluxon_testbed"
                   FLUXON_OPS_CONTROLLER_INSTANCE_KEY: "ops_controller_node-a"
@@ -201,15 +200,14 @@ def test_ops_entrypoints_use_direct_scripts() -> None:
                   ops_agent:
                     entrypoint: |
                       WORKDIR="${HOSTWORKDIR}/ops_agent/${NODE_ID}"
-                      mkdir -p "${WORKDIR}" "${FLUXON_SHARED_MEM}" "${FLUXON_SHARED_FILE}"
+                      mkdir -p "${WORKDIR}" "${FLUXON_SHARED_MEM}"
                       cat > "${WORKDIR}/ops_agent.yaml" <<YAML
                       kv_client:
                         instance_key: "fluxon_ops_${NODE_ID}"
                         pprof_duration_seconds: 60
                         fluxonkv_spec:
                           cluster_name: "${FLUXON_CLUSTER_NAME}"
-                          shared_memory_path: "${FLUXON_SHARED_MEM}"
-                          shared_file_path: "${FLUXON_SHARED_FILE}"
+                          share_mem_path: "${FLUXON_SHARED_MEM}"
                       controller_instance_key: "${FLUXON_OPS_CONTROLLER_INSTANCE_KEY}"
                       hostworkdir: "${HOSTWORKDIR}"
                       YAML
@@ -219,7 +217,7 @@ def test_ops_entrypoints_use_direct_scripts() -> None:
                   ops_controller:
                     entrypoint: |
                       WORKDIR="${HOSTWORKDIR}/ops_controller"
-                      mkdir -p "${WORKDIR}" "${FLUXON_SHARED_MEM}" "${FLUXON_SHARED_FILE}"
+                      mkdir -p "${WORKDIR}" "${FLUXON_SHARED_MEM}"
                       cat > "${WORKDIR}/ops_controller.yaml" <<YAML
                       ops_controller:
                         kv_client:
@@ -227,8 +225,7 @@ def test_ops_entrypoints_use_direct_scripts() -> None:
                           pprof_duration_seconds: 60
                           fluxonkv_spec:
                             cluster_name: "${FLUXON_CLUSTER_NAME}"
-                            shared_memory_path: "${FLUXON_SHARED_MEM}"
-                            shared_file_path: "${FLUXON_SHARED_FILE}"
+                            share_mem_path: "${FLUXON_SHARED_MEM}"
                             p2p_listen_port: 12102
                         panel:
                           max_body_bytes: 1073741824
diff --git a/deployment/utils/deployconf_config_utils.py b/deployment/utils/deployconf_config_utils.py
index 4244526..b312c6d 100644
--- a/deployment/utils/deployconf_config_utils.py
+++ b/deployment/utils/deployconf_config_utils.py
@@ -18,8 +18,7 @@
     "load_deployconf_prometheus_base_url",
     "load_deployconf_prom_remote_write_url",
     "load_deployconf_fluxon_cluster_name",
-    "load_deployconf_fluxon_shared_memory_path",
-    "load_deployconf_fluxon_shared_file_path",
+    "load_deployconf_fluxon_share_mem_path",
     "load_deployconf_service_ip_port",
 ]
 
@@ -140,7 +139,7 @@ def load_deployconf_fluxon_cluster_name(*, config_path: Path) -> str:
     return raw.strip()
 
 
-def load_deployconf_fluxon_shared_memory_path(*, config_path: Path) -> str:
+def load_deployconf_fluxon_share_mem_path(*, config_path: Path) -> str:
     global_envs = load_deployconf_resolved_global_envs(config_path=config_path)
     raw = global_envs.get("FLUXON_SHARED_MEM")
     if not isinstance(raw, str) or not raw.strip():
@@ -148,14 +147,6 @@ def load_deployconf_fluxon_shared_memory_path(*, config_path: Path) -> str:
     return raw.strip()
 
 
-def load_deployconf_fluxon_shared_file_path(*, config_path: Path) -> str:
-    global_envs = load_deployconf_resolved_global_envs(config_path=config_path)
-    raw = global_envs.get("FLUXON_SHARED_FILE")
-    if not isinstance(raw, str) or not raw.strip():
-        raise ValueError("deployconf.global_envs.FLUXON_SHARED_FILE must resolve to a non-empty string")
-    return raw.strip()
-
-
 def load_deployconf_service_ip_port(*, config_path: Path, service_name: str) -> Tuple[str, int]:
     cfg = load_deployconf_mapping(config_path=config_path)
     cluster_nodes = cfg.get("cluster_nodes")
diff --git a/examples/external_put_get_del.py b/examples/external_put_get_del.py
index c1ee8c3..834425d 100644
--- a/examples/external_put_get_del.py
+++ b/examples/external_put_get_del.py
@@ -4,8 +4,7 @@
 
 INSTANCE_KEY = "demo_kv_external"
 CLUSTER_NAME = "demo-kv-cluster"
-SHARED_MEMORY_PATH = "/dev/shm/fluxon_kv_demo"
-SHARED_FILE_PATH = "/tmp/fluxon_kv_demo/shared"
+SHARE_MEM_PATH = "/dev/shm/fluxon_kv_demo"
 
 
 def main() -> None:
@@ -14,8 +13,7 @@ def main() -> None:
             "instance_key": INSTANCE_KEY,
             "fluxonkv_spec": {
                 "cluster_name": CLUSTER_NAME,
-                "shared_memory_path": SHARED_MEMORY_PATH,
-                "shared_file_path": SHARED_FILE_PATH,
+                "share_mem_path": SHARE_MEM_PATH,
             },
             "test_spec_config": {
                 "disable_observability": True,
diff --git a/examples/fluxon_quick_start/start.py b/examples/fluxon_quick_start/start.py
index 1ee0acf..32a1639 100644
--- a/examples/fluxon_quick_start/start.py
+++ b/examples/fluxon_quick_start/start.py
@@ -473,10 +473,9 @@ def _load_config_from_b64(config_b64: str) -> Dict[str, Any]:
 
 def _resolve_fluxonkv_spec_paths(*, spec: Dict[str, Any], workdir: Path) -> Dict[str, Any]:
     resolved = dict(spec)
-    for field_name in ("shared_memory_path", "shared_file_path"):
-        raw_path = resolved.get(field_name)
-        if isinstance(raw_path, str) and raw_path and not Path(raw_path).is_absolute():
-            resolved[field_name] = str((workdir / raw_path).resolve())
+    raw_path = resolved.get("share_mem_path")
+    if isinstance(raw_path, str) and raw_path and not Path(raw_path).is_absolute():
+        resolved["share_mem_path"] = str((workdir / raw_path).resolve())
     return resolved
 
 
@@ -535,7 +534,6 @@ def _owner_large_file_paths(workdir: Path) -> List[str]:
 def _gen_kv_config(etcd_ep: str, cluster: str, master_port: int, kv_http_port: int,
                     panel_port: int, greptime_http_port: int, workdir: Path) -> Dict[str, Any]:
     shm = str(workdir / "sharemem")
-    shared_file_path = str(workdir / "sharefile")
     log_dir = str(workdir / "log" / "master")
     master_cfg: Dict[str, Any] = {
         "etcd_endpoints": [etcd_ep],
@@ -555,8 +553,7 @@ def _gen_kv_config(etcd_ep: str, cluster: str, master_port: int, kv_http_port: i
             "fluxonkv_spec": {
                 "etcd_addresses": [etcd_ep],
                 "cluster_name": cluster,
-                "shared_memory_path": shm,
-                "shared_file_path": shared_file_path,
+                "share_mem_path": shm,
                 "sub_cluster": "default",
                 "large_file_paths": _owner_large_file_paths(workdir),
             },
@@ -570,8 +567,7 @@ def _gen_kv_config(etcd_ep: str, cluster: str, master_port: int, kv_http_port: i
             "instance_key": "qs_http_accessor",
             "fluxonkv_spec": {
                 "cluster_name": cluster,
-                "shared_memory_path": shm,
-                "shared_file_path": shared_file_path,
+                "share_mem_path": shm,
             },
         },
     }
@@ -581,7 +577,6 @@ def _gen_kv_config(etcd_ep: str, cluster: str, master_port: int, kv_http_port: i
 def _gen_mq_config(etcd_ep: str, cluster: str, master_port: int, greptime_http_port: int,
                     workdir: Path, panel_port: int = 0) -> Dict[str, Any]:
     shm = str(workdir / "sharemem")
-    shared_file_path = str(workdir / "sharefile")
     log_dir = str(workdir / "log" / "master")
     master_cfg: Dict[str, Any] = {
         "etcd_endpoints": [etcd_ep],
@@ -601,8 +596,7 @@ def _gen_mq_config(etcd_ep: str, cluster: str, master_port: int, greptime_http_p
             "fluxonkv_spec": {
                 "etcd_addresses": [etcd_ep],
                 "cluster_name": cluster,
-                "shared_memory_path": shm,
-                "shared_file_path": shared_file_path,
+                "share_mem_path": shm,
                 "sub_cluster": "default",
                 "large_file_paths": _owner_large_file_paths(workdir),
             },
@@ -611,8 +605,7 @@ def _gen_mq_config(etcd_ep: str, cluster: str, master_port: int, greptime_http_p
             "instance_key": "qs_mq_external",
             "fluxonkv_spec": {
                 "cluster_name": cluster,
-                "shared_memory_path": shm,
-                "shared_file_path": shared_file_path,
+                "share_mem_path": shm,
             },
         },
         "mpmc_demo": {
@@ -636,7 +629,6 @@ def _gen_mq_config(etcd_ep: str, cluster: str, master_port: int, greptime_http_p
 def _gen_fs_config(etcd_ep: str, cluster: str, master_port: int, panel_port: int,
                     greptime_http_port: int, workdir: Path) -> Dict[str, Any]:
     shm = str(workdir / "sharemem")
-    shared_file_path = str(workdir / "sharefile")
     log_dir = str(workdir / "log" / "master")
     remote_root_dir = str(workdir / "fs_remote_root")
     access_db_path = str(workdir / "fs_master" / "access.db")
@@ -660,8 +652,7 @@ def _gen_fs_config(etcd_ep: str, cluster: str, master_port: int, panel_port: int
             "fluxonkv_spec": {
                 "etcd_addresses": [etcd_ep],
                 "cluster_name": cluster,
-                "shared_memory_path": shm,
-                "shared_file_path": shared_file_path,
+                "share_mem_path": shm,
                 "sub_cluster": "default",
                 "large_file_paths": _owner_large_file_paths(workdir),
             },
@@ -671,8 +662,7 @@ def _gen_fs_config(etcd_ep: str, cluster: str, master_port: int, panel_port: int
                 "instance_key": "qs_fs_master",
                 "fluxonkv_spec": {
                     "cluster_name": cluster,
-                    "shared_memory_path": shm,
-                    "shared_file_path": shared_file_path,
+                    "share_mem_path": shm,
                 },
             },
             "fluxon_fs": {
@@ -718,8 +708,7 @@ def _gen_fs_config(etcd_ep: str, cluster: str, master_port: int, panel_port: int
                 "instance_key": "qs_fs_agent",
                 "fluxonkv_spec": {
                     "cluster_name": cluster,
-                    "shared_memory_path": shm,
-                    "shared_file_path": shared_file_path,
+                    "share_mem_path": shm,
                 },
             },
             "fluxon_fs": {
@@ -987,19 +976,19 @@ def _wait_for_process_tcp_ready_best_effort(
     return False
 
 
-def _kvclient_shared_json_target(shared_file_path: Path, cluster_name: str) -> Path:
-    return shared_file_path / cluster_name / "shared.json"
+def _kvclient_shared_json_target(share_mem_path: Path, cluster_name: str) -> Path:
+    return share_mem_path / cluster_name / "shared.json"
 
 
-def _clear_stale_shared_json(shared_file_path: Path, cluster_name: str) -> None:
-    target = _kvclient_shared_json_target(shared_file_path, cluster_name)
+def _clear_stale_shared_json(share_mem_path: Path, cluster_name: str) -> None:
+    target = _kvclient_shared_json_target(share_mem_path, cluster_name)
     if target.exists():
         print(f"[quick_start] removing stale shared.json: {target}")
         target.unlink()
 
 
 def _wait_for_shared_json(
-    shared_file_path: Path,
+    share_mem_path: Path,
     cluster_name: str,
     timeout: int = 180,
     *,
@@ -1008,7 +997,7 @@ def _wait_for_shared_json(
     log_path: Optional[Path] = None,
 ) -> None:
     """Block until shared.json appears (owner kvclient ready)."""
-    target = _kvclient_shared_json_target(shared_file_path, cluster_name)
+    target = _kvclient_shared_json_target(share_mem_path, cluster_name)
     target_dir = target.parent
     deadline = time.time() + timeout
     elapsed = 0
@@ -1043,7 +1032,7 @@ def _start_cluster_infra(
     etcd_log_path = workdir / "log" / "etcd.log"
     master_log_path = workdir / "log" / "master.log"
     kvclient_log_path = workdir / "log" / "kvclient.log"
-    shared_file_path = _kvclient_shared_file_path_from_cfg(cfg)
+    share_mem_path = _kvclient_share_mem_path_from_cfg(cfg)
     cluster_name = _kvclient_cluster_name_from_cfg(cfg)
     log_dir = workdir / "log"
 
@@ -1109,10 +1098,10 @@ def _start_cluster_infra(
         )
 
     print("[quick_start] starting kvclient...")
-    _clear_stale_shared_json(shared_file_path, cluster_name)
+    _clear_stale_shared_json(share_mem_path, cluster_name)
     kvclient_proc = _start_kvclient(cfg["kvclient"], workdir)
     _wait_for_shared_json(
-        shared_file_path,
+        share_mem_path,
         cluster_name,
         proc=kvclient_proc,
         label="kvclient",
@@ -1120,16 +1109,16 @@ def _start_cluster_infra(
     )
 
 
-def _kvclient_shared_file_path_from_cfg(cfg: Dict[str, Any]) -> Path:
+def _kvclient_share_mem_path_from_cfg(cfg: Dict[str, Any]) -> Path:
     kvclient_cfg = cfg.get("kvclient")
     if not isinstance(kvclient_cfg, dict):
         raise ValueError("missing kvclient config")
     spec = kvclient_cfg.get("fluxonkv_spec")
     if not isinstance(spec, dict):
         raise ValueError("missing kvclient.fluxonkv_spec config")
-    raw_path = spec.get("shared_file_path")
+    raw_path = spec.get("share_mem_path")
     if not isinstance(raw_path, str) or not raw_path:
-        raise ValueError("kvclient.fluxonkv_spec.shared_file_path must be a non-empty string")
+        raise ValueError("kvclient.fluxonkv_spec.share_mem_path must be a non-empty string")
     return Path(raw_path)
 
 
diff --git a/examples/rpc_call.py b/examples/rpc_call.py
index 250f2fa..4afd331 100644
--- a/examples/rpc_call.py
+++ b/examples/rpc_call.py
@@ -8,8 +8,7 @@
 RPC_SERVER_INSTANCE_KEY = "demo_rpc_server"
 RPC_CLIENT_INSTANCE_KEY = "demo_rpc_client"
 CLUSTER_NAME = "demo-kv-cluster"
-SHARED_MEMORY_PATH = "/dev/shm/fluxon_kv_demo"
-SHARED_FILE_PATH = "/tmp/fluxon_kv_demo/shared"
+SHARE_MEM_PATH = "/dev/shm/fluxon_kv_demo"
 
 
 def main() -> None:
@@ -43,8 +42,7 @@ def _build_config(*, instance_key: str) -> FluxonKvClientConfig:
             "instance_key": instance_key,
             "fluxonkv_spec": {
                 "cluster_name": CLUSTER_NAME,
-                "shared_memory_path": SHARED_MEMORY_PATH,
-                "shared_file_path": SHARED_FILE_PATH,
+                "share_mem_path": SHARE_MEM_PATH,
             },
             "test_spec_config": {
                 "disable_observability": True,
diff --git a/examples/start_kv_and_fs_svc.py b/examples/start_kv_and_fs_svc.py
index 9cec14f..84f65a8 100644
--- a/examples/start_kv_and_fs_svc.py
+++ b/examples/start_kv_and_fs_svc.py
@@ -16,8 +16,7 @@
 GREPTIME_HTTP_PORT = 34030
 GREPTIME_BASE_URL = f"http://127.0.0.1:{GREPTIME_HTTP_PORT}"
 CLUSTER_NAME = "demo-fs-cluster"
-SHARED_MEMORY_PATH = Path("/dev/shm/fluxon_fs_demo").resolve()
-SHARED_FILE_PATH = Path("/tmp/fluxon_fs_demo/shared").resolve()
+SHARE_MEM_PATH = Path("/dev/shm/fluxon_fs_demo").resolve()
 WORKDIR = Path("/tmp/fluxon_fs_demo/runtime").resolve()
 REMOTE_ROOT_DIR = Path("/tmp/fluxon_fs_demo/remote_root").resolve()
 KV_MASTER_PORT = 34100
@@ -46,7 +45,6 @@ def main() -> None:
     args = parse_args()
     WORKDIR.mkdir(parents=True, exist_ok=True)
     REMOTE_ROOT_DIR.mkdir(parents=True, exist_ok=True)
-    SHARED_FILE_PATH.mkdir(parents=True, exist_ok=True)
 
     log_dir = (WORKDIR / "log").resolve()
     log_dir.mkdir(parents=True, exist_ok=True)
@@ -117,8 +115,7 @@ def main() -> None:
     )
 
     print(f"[fluxon_fs] cluster name: {CLUSTER_NAME}")
-    print(f"[fluxon_fs] shared memory path: {SHARED_MEMORY_PATH}")
-    print(f"[fluxon_fs] shared file path: {SHARED_FILE_PATH}")
+    print(f"[fluxon_fs] share_mem_path: {SHARE_MEM_PATH}")
     print(f"[fluxon_fs] remote root dir: {REMOTE_ROOT_DIR}")
     print(f"[fluxon_fs] export name: {EXPORT_NAME}")
     print(f"[fluxon_fs] owner instance key: {OWNER_INSTANCE_KEY}")
@@ -199,8 +196,7 @@ def build_owner_config() -> dict:
         "fluxonkv_spec": {
             "etcd_addresses": [ETCD_ENDPOINT],
             "cluster_name": CLUSTER_NAME,
-            "shared_memory_path": str(SHARED_MEMORY_PATH),
-            "shared_file_path": str(SHARED_FILE_PATH),
+            "share_mem_path": str(SHARE_MEM_PATH),
             "sub_cluster": "default",
             "large_file_paths": build_owner_large_file_paths(),
         },
@@ -213,8 +209,7 @@ def build_fs_master_config() -> dict:
             "instance_key": FS_MASTER_INSTANCE_KEY,
             "fluxonkv_spec": {
                 "cluster_name": CLUSTER_NAME,
-                "shared_memory_path": str(SHARED_MEMORY_PATH),
-                "shared_file_path": str(SHARED_FILE_PATH),
+                "share_mem_path": str(SHARE_MEM_PATH),
             },
         },
         "fluxon_fs": {
@@ -273,8 +268,7 @@ def build_fs_agent_config() -> dict:
             "instance_key": FS_AGENT_INSTANCE_KEY,
             "fluxonkv_spec": {
                 "cluster_name": CLUSTER_NAME,
-                "shared_memory_path": str(SHARED_MEMORY_PATH),
-                "shared_file_path": str(SHARED_FILE_PATH),
+                "share_mem_path": str(SHARE_MEM_PATH),
             },
         },
         "fluxon_fs": {
diff --git a/examples/start_master_owner.py b/examples/start_master_owner.py
index 078450b..7bfb770 100644
--- a/examples/start_master_owner.py
+++ b/examples/start_master_owner.py
@@ -14,8 +14,7 @@
 GREPTIME_HTTP_PORT = 34030
 GREPTIME_BASE_URL = f"http://127.0.0.1:{GREPTIME_HTTP_PORT}"
 CLUSTER_NAME = "demo-kv-cluster"
-SHARED_MEMORY_PATH = Path("/dev/shm/fluxon_kv_demo").resolve()
-SHARED_FILE_PATH = Path("/tmp/fluxon_kv_demo/shared").resolve()
+SHARE_MEM_PATH = Path("/dev/shm/fluxon_kv_demo").resolve()
 WORKDIR = Path("/tmp/fluxon_kv_demo/runtime").resolve()
 MASTER_PORT = 31000
 MASTER_INSTANCE_KEY = "demo_kv_master"
@@ -29,7 +28,6 @@ def build_owner_large_file_paths() -> list[str]:
 
 def main() -> None:
     args = parse_args()
-    SHARED_FILE_PATH.mkdir(parents=True, exist_ok=True)
     log_dir = (WORKDIR / "log").resolve()
 
     if args.with_master:
@@ -64,8 +62,7 @@ def main() -> None:
         )
     )
 
-    print(f"[fluxon_kv] shared memory path: {SHARED_MEMORY_PATH}")
-    print(f"[fluxon_kv] shared file path: {SHARED_FILE_PATH}")
+    print(f"[fluxon_kv] share_mem_path: {SHARE_MEM_PATH}")
     print(f"[fluxon_kv] etcd endpoint: {ETCD_ENDPOINT}")
     print(f"[fluxon_kv] greptime base url: {GREPTIME_BASE_URL}")
     print(f"[fluxon_kv] start master in this script: {args.with_master}")
@@ -128,8 +125,7 @@ def build_owner_config() -> dict:
         "fluxonkv_spec": {
             "etcd_addresses": [ETCD_ENDPOINT],
             "cluster_name": CLUSTER_NAME,
-            "shared_memory_path": str(SHARED_MEMORY_PATH),
-            "shared_file_path": str(SHARED_FILE_PATH),
+            "share_mem_path": str(SHARE_MEM_PATH),
             "sub_cluster": "default",
             "large_file_paths": build_owner_large_file_paths(),
         },
diff --git a/examples/start_mpmc_demo.py b/examples/start_mpmc_demo.py
index 2988674..5ad9f64 100644
--- a/examples/start_mpmc_demo.py
+++ b/examples/start_mpmc_demo.py
@@ -17,8 +17,7 @@
 
 # These constants are the only user-facing knobs in the minimal example.
 CLUSTER_NAME = "demo-kv-cluster"
-SHARED_MEMORY_PATH = "/dev/shm/fluxon_kv_demo"
-SHARED_FILE_PATH = "/tmp/fluxon_kv_demo/shared"
+SHARE_MEM_PATH = "/dev/shm/fluxon_kv_demo"
 CHANNEL_KEY = "demo_mq_channel_doc"
 CHANNEL_CAPACITY = 128
 CHANNEL_TTL_SECONDS = 300
@@ -53,8 +52,7 @@ def _build_store_config(*, role: str) -> FluxonKvClientConfig:
             "instance_key": f"demo_mq_{role}",
             "fluxonkv_spec": {
                 "cluster_name": CLUSTER_NAME,
-                "shared_memory_path": SHARED_MEMORY_PATH,
-                "shared_file_path": SHARED_FILE_PATH,
+                "share_mem_path": SHARE_MEM_PATH,
             },
         }
     )
@@ -198,9 +196,6 @@ def main() -> None:
     parser.add_argument("--role", choices=["producer", "consumer"], required=True)
     args = parser.parse_args()
 
-    # The minimal example keeps shared file authority explicit and local.
-    Path(SHARED_FILE_PATH).mkdir(parents=True, exist_ok=True)
-
     # init_logger() reads FLUXON_LOG and sets the user-process console log level.
     logger = init_logger(f"mpmc_demo_{args.role}")
     shutdown_requested = threading.Event()
diff --git "a/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md" "b/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
index 50e2b38..a4c5865 100644
--- "a/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
+++ "b/fluxon_doc_cn/design/fluxon_0_\351\205\215\347\275\256\346\200\273\350\247\210.md"
@@ -107,7 +107,6 @@ cluster_nodes:
 global_envs:
   FLUXON_CLUSTER_NAME: "fluxon-example-cluster"
   FLUXON_SHARED_MEM: "${HOSTWORKDIR}/shm1"
-  FLUXON_SHARED_FILE: "${HOSTWORKDIR}/shm1_files"
   ETCD_FULL_ADDRESS: "${${ETCD__NODE_ID}__IP}:${ETCD__PORT}"
   FLUXON_PROMETHEUS_BASE_URL: "http://${${GREPTIME__NODE_ID}__IP}:${GREPTIME__PORT}/v1/prometheus"
   MONITOR_GREPTIMEDB_WRITE_URL: "http://${${GREPTIME__NODE_ID}__IP}:${GREPTIME__PORT}/v1/prometheus/write"
@@ -268,12 +267,8 @@ contribute_to_cluster_pool_size:
 fluxonkv_spec:
   cluster_name: demo-kv-cluster
 
-  # 本机共享内存 authority；运行时会拼成 cluster_name 作用域路径
-  shared_memory_path: /dev/shm/fluxon
-
-  # 本机共享文件 authority；shared.json、profile、peer metadata 等在这条根下
-  # 运行时也会拼成 cluster_name 作用域路径
-  shared_file_path: /var/lib/fluxon/shared
+  # 共享 bundle 根目录；运行时会拼成 cluster_name 作用域路径
+  share_mem_path: /dev/shm/fluxon
 
   # owner 必须自己连接 etcd；输入要求 raw host:port
   etcd_addresses:
@@ -303,9 +298,8 @@ instance_key: my-external-1
 fluxonkv_spec:
   cluster_name: demo-kv-cluster
 
-  # external 只保留 attach owner 所需的本机共享锚点
-  shared_memory_path: /dev/shm/fluxon
-  shared_file_path: /var/lib/fluxon/shared
+  # external 只保留 attach owner 所需的共享 bundle 根目录
+  share_mem_path: /dev/shm/fluxon
 
   # 可选
   p2p_listen_port: 31002
@@ -324,7 +318,7 @@ fluxonkv_spec:
 - `contribute_to_cluster_pool_size` 里的容量都按 16 MiB 对齐；`dram = 0` 但 `vram` 非 0 会被拒绝，避免半 owner 半 external 的模糊状态。
 - owner 模式要求 `contribute_to_cluster_pool_size.dram > 0`，并且必须显式提供 `etcd_addresses`、`sub_cluster`、`large_file_paths`。
 - zero-contribution `external` 模式禁止再写 owner 专属字段；运行时会从 owner `shared.json` 补齐这部分信息。
-- `shared_memory_path` / `shared_file_path` 会拼成 `cluster_name` 作用域路径。
+- `share_mem_path` 会拼成 `cluster_name` 作用域路径；`mmap.file`、`shared.json` 和 peer metadata 都位于这个 cluster-scoped 目录下。
 - `test_spec_config.side_transfer_role = worker` 不是第三套 YAML，而是 zero-contribution client 的子分支；它强制 `TransferEngineType::P2p`，并关闭 transfer RPC fast path。
 - `test_spec_config.side_transfer_worker_count` 只允许出现在 owner 配置里，用来控制 owner 拉起的 worker 数量。
 
diff --git "a/fluxon_doc_cn/design/log_1_\346\234\254\345\234\260\346\226\207\344\273\266\346\227\245\345\277\227\344\270\216Greptime_OTLP\345\257\274\345\207\272\351\223\276\350\267\257.md" "b/fluxon_doc_cn/design/log_1_\346\234\254\345\234\260\346\226\207\344\273\266\346\227\245\345\277\227\344\270\216Greptime_OTLP\345\257\274\345\207\272\351\223\276\350\267\257.md"
index fd81c45..555672b 100644
--- "a/fluxon_doc_cn/design/log_1_\346\234\254\345\234\260\346\226\207\344\273\266\346\227\245\345\277\227\344\270\216Greptime_OTLP\345\257\274\345\207\272\351\223\276\350\267\257.md"
+++ "b/fluxon_doc_cn/design/log_1_\346\234\254\345\234\260\346\226\207\344\273\266\346\227\245\345\277\227\344\270\216Greptime_OTLP\345\257\274\345\207\272\351\223\276\350\267\257.md"
@@ -17,7 +17,7 @@
 3. Rust / Python 之间哪些 contract 已经对齐，哪些还没有。
 4. 当前实现里哪些地方已经收口，哪些地方仍是未完全收口点。
 
-KV 里的 `external` 与 side worker 都只消费 owner 感知结果。当前稳定 contract 是：它们显式配置 `shared_memory_path` / `shared_file_path` 作为 attach owner 的共享 bundle 锚点，`large_file_paths` 则从 owner 发布的 `shared.json` 继承；日志和 cache 从启动起就直接落到 owner 派生出来的大文件目录，不再要求 zero-contribution 侧另配一份本地 large root。
+KV 里的 `external` 与 side worker 都只消费 owner 感知结果。当前稳定 contract 是：它们显式配置单一 `share_mem_path` 作为 attach owner 的共享 bundle 根目录，`mmap.file`、`shared.json` 和 peer metadata 都在运行时拼接出的 cluster-scoped 目录下；`large_file_paths` 则从 owner 发布的 `shared.json` 继承，日志和 cache 从启动起就直接落到 owner 派生出来的大文件目录。
 
 ## 1. 目录边界
 目录边界只管物理隔离，不管统一 root。统一的是命名、元数据、归档窗口和清理语义。
@@ -112,9 +112,9 @@ ${HOSTWORKDIR}/
 - 当前优先级不是先把 testbed 做到完美支持，而是先把 ops 长时服务日志 contract 讲清楚并收口；testbed 继续按“服务级日志”和“case artifact”分开讨论。
 
 ### 1.4 FS
-- `shared_file_path` 与 `export.remote_root_dir_abs` 分开使用。
-- 前者负责共享 attachment 边界。
-- 后者负责业务数据边界。
+- `share_mem_path` 与 `export.remote_root_dir_abs` 分开使用。
+- 前者负责 KV attachment 所需的共享 bundle 边界。
+- 后者负责 FS 业务数据边界。
 
 这里的目标很明确：目录可以不同，语义必须一致。`log`、`cache`、`shared attachment`、`workload data` 不能混在同一个边界里。
 
@@ -191,9 +191,9 @@ Greptime 侧的 retention / TTL 也按同一日期窗口收口，保证本地与
 ## 6. 当前还没有完全收口的点
 这一节只写未完全收口点，避免把“当前事实”和“目标态”混在一起。
 
-### 6.1 KV 目录边界还没有完全收口到单一 `share_path`
-- 预期 KV 最终收口为单一 `share_path`，统一承载 `mmap.file`、`shared.json` 和 side transfer metadata。
-- 当前 Rust 实现仍保留 `shared_memory_path` 与 `shared_file_path` 两条配置，并分别用于 `mmap.file` 与 `shared.json` / `peer metadata` 的就绪探测和发布。
+### 6.1 KV 共享 bundle 已收口到单一 `share_mem_path`
+- 当前 KV public contract 只保留 `share_mem_path`。
+- 运行时在 `share_mem_path` 下拼接 `cluster_name`，统一承载 `mmap.file`、`shared.json`、peer metadata 和 side transfer metadata。
 
 ### 6.2 side worker stdio 仍未收口到统一按天分片
 - zero-contribution bootstrap 已经在启动前继承 owner 的 `large_file_paths`，因此 KV runtime logger 不再依赖 attach 后热切换文件路径。
diff --git "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 1 - \346\236\266\346\236\204\345\222\214\346\246\202\345\277\265.md" "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 1 - \346\236\266\346\236\204\345\222\214\346\246\202\345\277\265.md"
index f85811d..bbe5c27 100644
--- "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 1 - \346\236\266\346\236\204\345\222\214\346\246\202\345\277\265.md"	
+++ "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 1 - \346\236\266\346\236\204\345\222\214\346\246\202\345\277\265.md"	
@@ -60,9 +60,7 @@
 
 **`prometheus_base_url`** — 面板的 metrics 数据源地址（Prometheus-compatible HTTP API）。面板只查询不采集，不可达时指标显示 N/A。
 
-**`shared_memory_path`** — 共享内存目录，同机进程通过它附着到同一内存池；这是 mmap / data plane 的本机 authority。
-
-**`shared_file_path`** — 共享文件目录，`shared.json` 与 peer metadata 等本机共享文件位于这里；这是 file / metadata attachment 的本机 authority。
+**`share_mem_path`** — 共享 bundle 根目录。运行时会在其下拼接 `cluster_name`，同一个 cluster-scoped 目录同时承载 `mmap.file`、`shared.json` 和 peer metadata。
 
 **`log_dir`** — master 自己的日志目录 authority。master 运行时会在这个目录下继续派生 cluster 级日志和 profile 子目录。
 
diff --git "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 2 - \346\234\215\345\212\241\345\271\263\351\235\242.md" "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 2 - \346\234\215\345\212\241\345\271\263\351\235\242.md"
index 5daa633..2ffa6e5 100644
--- "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 2 - \346\234\215\345\212\241\345\271\263\351\235\242.md"	
+++ "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 2 - \346\234\215\345\212\241\345\271\263\351\235\242.md"	
@@ -199,8 +199,7 @@ ETCD_ENDPOINT = "127.0.0.1:2379"
 GREPTIME_HTTP_PORT = 34030
 GREPTIME_BASE_URL = f"http://127.0.0.1:{GREPTIME_HTTP_PORT}"
 CLUSTER_NAME = "demo-kv-cluster"
-SHARED_MEMORY_PATH = Path("/dev/shm/fluxon_kv_demo").resolve()
-SHARED_FILE_PATH = Path("/tmp/fluxon_kv_demo/shared").resolve()
+SHARE_MEM_PATH = Path("/dev/shm/fluxon_kv_demo").resolve()
 WORKDIR = Path("/tmp/fluxon_kv_demo/runtime").resolve()
 MASTER_PORT = 31000
 MASTER_INSTANCE_KEY = "demo_kv_master"
@@ -210,7 +209,6 @@ OWNER_DRAM_BYTES = 1073741824
 
 def main() -> None:
     args = parse_args()
-    SHARED_FILE_PATH.mkdir(parents=True, exist_ok=True)
     log_dir = (WORKDIR / "log").resolve()
 
     if args.with_master:
@@ -245,8 +243,7 @@ def main() -> None:
         )
     )
 
-    print(f"[fluxon_kv] shared memory path: {SHARED_MEMORY_PATH}")
-    print(f"[fluxon_kv] shared file path: {SHARED_FILE_PATH}")
+    print(f"[fluxon_kv] share_mem_path: {SHARE_MEM_PATH}")
     print(f"[fluxon_kv] etcd endpoint: {ETCD_ENDPOINT}")
     print(f"[fluxon_kv] greptime base url: {GREPTIME_BASE_URL}")
     print(f"[fluxon_kv] start master in this script: {args.with_master}")
@@ -309,8 +306,7 @@ def build_owner_config() -> dict:
         "fluxonkv_spec": {
             "etcd_addresses": [ETCD_ENDPOINT],
             "cluster_name": CLUSTER_NAME,
-            "shared_memory_path": str(SHARED_MEMORY_PATH),
-            "shared_file_path": str(SHARED_FILE_PATH),
+            "share_mem_path": str(SHARE_MEM_PATH),
             "sub_cluster": "default",
             "large_file_paths": [str((WORKDIR / "large" / "owner").resolve())],
         },
diff --git "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 3 - KV-RPC\346\216\245\345\217\243.md" "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 3 - KV-RPC\346\216\245\345\217\243.md"
index 55d4cd1..9a8c8e1 100644
--- "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 3 - KV-RPC\346\216\245\345\217\243.md"	
+++ "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 3 - KV-RPC\346\216\245\345\217\243.md"	
@@ -52,8 +52,7 @@ ETCD_ENDPOINT = "127.0.0.1:2379"
 GREPTIME_HTTP_PORT = 34030
 GREPTIME_BASE_URL = f"http://127.0.0.1:{GREPTIME_HTTP_PORT}"
 CLUSTER_NAME = "demo-kv-cluster"
-SHARED_MEMORY_PATH = Path("/dev/shm/fluxon_kv_demo").resolve()
-SHARED_FILE_PATH = Path("/tmp/fluxon_kv_demo/shared").resolve()
+SHARE_MEM_PATH = Path("/dev/shm/fluxon_kv_demo").resolve()
 WORKDIR = Path("/tmp/fluxon_kv_demo/runtime").resolve()
 MASTER_PORT = 31000
 MASTER_UI_PORT = 18080
@@ -64,7 +63,6 @@ OWNER_DRAM_BYTES = 1073741824
 
 def main() -> None:
     args = parse_args()
-    SHARED_FILE_PATH.mkdir(parents=True, exist_ok=True)
     log_dir = (WORKDIR / "log").resolve()
 
     if args.with_master:
@@ -99,8 +97,7 @@ def main() -> None:
         )
     )
 
-    print(f"[fluxon_kv] shared memory path: {SHARED_MEMORY_PATH}")
-    print(f"[fluxon_kv] shared file path: {SHARED_FILE_PATH}")
+    print(f"[fluxon_kv] share_mem_path: {SHARE_MEM_PATH}")
     print(f"[fluxon_kv] etcd endpoint: {ETCD_ENDPOINT}")
     print(f"[fluxon_kv] greptime base url: {GREPTIME_BASE_URL}")
     print(f"[fluxon_kv] start master in this script: {args.with_master}")
@@ -170,8 +167,7 @@ def build_owner_config() -> dict:
         "fluxonkv_spec": {
             "etcd_addresses": [ETCD_ENDPOINT],
             "cluster_name": CLUSTER_NAME,
-            "shared_memory_path": str(SHARED_MEMORY_PATH),
-            "shared_file_path": str(SHARED_FILE_PATH),
+            "share_mem_path": str(SHARE_MEM_PATH),
             "sub_cluster": "default",
             "large_file_paths": [str((WORKDIR / "large" / "owner").resolve())],
         },
@@ -238,6 +234,7 @@ api.close() -> Result[OkNone, ApiError]
 - `FluxonKvClientConfig`：配置对象，优先直接从 Python dict 创建，也支持从 YAML 文件加载。
 - `new_store(config: FluxonKvClientConfig) -> Result[KvClient, ApiError]`：创建 KV client 实例。
 - `KvClient`：统一入口，同时提供 KV 读写与节点间调用。
+- `KvClient.third_party_logs_dir() -> Result[str, ApiError]`：返回 Fluxon 分配给第三方 Python 组件的日志根目录。组件应在这个根目录下继续派生自己的子目录，例如 `mq/`。
 - `MemHolder`：`get_blocking(...)` 成功后的读取结果持有者，`access()` 取得 `FlatDict`。
 - `PutOptionalArgs`：`put_blocking(...)` 的可选参数对象，当前常用字段是 `lease_id`。
 - `test_spec_config.disable_observability`：最小 external client 示例里显式设为 `True`，避免把 OTLP / observe 后台任务引入“只验证 KV/RPC 基本链路”的示例生命周期。
@@ -265,8 +262,7 @@ from fluxon_py import FluxonKvClientConfig, new_store
 
 INSTANCE_KEY = "demo_kv_external"
 CLUSTER_NAME = "demo-kv-cluster"
-SHARED_MEMORY_PATH = "/dev/shm/fluxon_kv_demo"
-SHARED_FILE_PATH = "/tmp/fluxon_kv_demo/shared"
+SHARE_MEM_PATH = "/dev/shm/fluxon_kv_demo"
 
 
 def main() -> None:
@@ -275,8 +271,7 @@ def main() -> None:
             "instance_key": INSTANCE_KEY,
             "fluxonkv_spec": {
                 "cluster_name": CLUSTER_NAME,
-                "shared_memory_path": SHARED_MEMORY_PATH,
-                "shared_file_path": SHARED_FILE_PATH,
+                "share_mem_path": SHARE_MEM_PATH,
             },
             "test_spec_config": {
                 "disable_observability": True,
@@ -333,7 +328,9 @@ FLUXON_LOG=DEBUG python3 examples/external_put_get_del.py
 - `FLUXON_LOG`：控制当前 Python 业务进程 console logger 的输出门限
 - Fluxon Python 侧 logger 会读取 `FLUXON_LOG`；合法值是 `DEBUG`、`INFO`、`WARNING`、`ERROR`、`CRITICAL`，默认 `INFO`
 - `log_dir`：`master` 本地日志 authority
-- `shared_file_path`：本机共享文件 authority，`shared.json`、日志、profile 等文件位于这里
+- `share_mem_path`：KV 共享 bundle 根目录，只承载 `mmap.file`、`shared.json` 和 peer metadata
+- `large_file_paths`：owner 侧大文件根目录，日志、profile、cache 等运行时资产都从这里派生
+- `store.third_party_logs_dir().unwrap(...)`：返回 `{large_file_paths[0]}/{cluster_name}_cluster_third_party_logs`。第三方 Python 组件应只在这个根目录下派生自己的子目录，这样目录使用更收束，Fluxon 观测平面也能统一感知和采集这些文件日志。
 
 如果服务平面的 `master.monitoring.otlp_log_api` 已经配置，后台服务日志还会继续采集到 Greptime 的 `fluxon_logs` 表。
 
@@ -412,8 +409,7 @@ from fluxon_py import FluxonKvClientConfig, new_store
 RPC_SERVER_INSTANCE_KEY = "demo_rpc_server"
 RPC_CLIENT_INSTANCE_KEY = "demo_rpc_client"
 CLUSTER_NAME = "demo-kv-cluster"
-SHARED_MEMORY_PATH = "/dev/shm/fluxon_kv_demo"
-SHARED_FILE_PATH = "/tmp/fluxon_kv_demo/shared"
+SHARE_MEM_PATH = "/dev/shm/fluxon_kv_demo"
 
 
 def main() -> None:
@@ -447,8 +443,7 @@ def _build_config(*, instance_key: str) -> FluxonKvClientConfig:
             "instance_key": instance_key,
             "fluxonkv_spec": {
                 "cluster_name": CLUSTER_NAME,
-                "shared_memory_path": SHARED_MEMORY_PATH,
-                "shared_file_path": SHARED_FILE_PATH,
+                "share_mem_path": SHARE_MEM_PATH,
             },
             "test_spec_config": {
                 "disable_observability": True,
@@ -549,8 +544,7 @@ cfg = FluxonKvClientConfig(
         "instance_key": "my-kv-client-1",
         "fluxonkv_spec": {
             "cluster_name": "demo-kv-cluster",
-            "shared_memory_path": "/dev/shm/fluxon",
-            "shared_file_path": "/var/lib/fluxon/shared",
+            "share_mem_path": "/dev/shm/fluxon",
         },
     }
 )
@@ -575,10 +569,8 @@ instance_key: my-kv-client-1
 fluxonkv_spec:
   # 目标集群名；必须和 master / owner 保持一致
   cluster_name: demo-kv-cluster
-  # 本机共享内存 authority；external 靠它附着到同机 owner 的内存池
-  shared_memory_path: /dev/shm/fluxon
-  # 本机共享文件 authority；shared.json、日志、profile 等文件位于这里
-  shared_file_path: /var/lib/fluxon/shared
+  # 共享 bundle 根目录；运行时会在其下拼接 cluster_name
+  share_mem_path: /dev/shm/fluxon
   # 可选：覆盖当前 client 的 P2P 监听端口
   p2p_listen_port: 31001
 ```
@@ -602,20 +594,17 @@ fluxonkv_spec:
     - 127.0.0.1:2379
   # 目标集群名；必须和 master / external 保持一致
   cluster_name: demo-kv-cluster
-  # 本机共享内存 authority；external 进程会附着到这里
-  shared_memory_path: /dev/shm/fluxon
-  # 本机共享文件 authority；shared.json、日志、profile 等文件位于这里
-  shared_file_path: /var/lib/fluxon/shared
+  # 共享 bundle 根目录；运行时会在其下拼接 cluster_name
+  share_mem_path: /dev/shm/fluxon
   # owner 自己的 P2P 监听端口
   p2p_listen_port: 31000
   # owner 所属子集群标签
   sub_cluster: default
 ```
 
-这里需要把两个本机 authority 分清楚：
+这里需要把共享 bundle 和大文件根目录分清楚：
 
-- `shared_memory_path`：共享内存 / mmap authority，同机进程靠它附着到同一块内存池
-- `shared_file_path`：共享文件 authority，只承载 `shared.json` 和 peer metadata 等共享文件
+- `share_mem_path`：共享 bundle 根目录；运行时拼接 `cluster_name` 后，同时承载 `mmap.file`、`shared.json` 和 peer metadata
 - `large_file_paths`：owner 独占的大文件 authority，日志、profile、cache 等运行时资产都从这里派生
 - `FLUXON_LOG`：用户 Python 进程 console log 的门限，不写时默认 `INFO`
 
diff --git "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 4 - MQ\346\216\245\345\217\243.md" "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 4 - MQ\346\216\245\345\217\243.md"
index 4501abb..a788b74 100644
--- "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 4 - MQ\346\216\245\345\217\243.md"	
+++ "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 4 - MQ\346\216\245\345\217\243.md"	
@@ -86,8 +86,7 @@ ETCD_ENDPOINT = "127.0.0.1:2379"
 GREPTIME_HTTP_PORT = 34030
 GREPTIME_BASE_URL = f"http://127.0.0.1:{GREPTIME_HTTP_PORT}"
 CLUSTER_NAME = "demo-kv-cluster"
-SHARED_MEMORY_PATH = Path("/dev/shm/fluxon_kv_demo").resolve()
-SHARED_FILE_PATH = Path("/tmp/fluxon_kv_demo/shared").resolve()
+SHARE_MEM_PATH = Path("/dev/shm/fluxon_kv_demo").resolve()
 WORKDIR = Path("/tmp/fluxon_kv_demo/runtime").resolve()
 MASTER_PORT = 31000
 MASTER_INSTANCE_KEY = "demo_kv_master"
@@ -97,7 +96,6 @@ OWNER_DRAM_BYTES = 1073741824
 
 def main() -> None:
     args = parse_args()
-    SHARED_FILE_PATH.mkdir(parents=True, exist_ok=True)
     log_dir = (WORKDIR / "log").resolve()
 
     if args.with_master:
@@ -132,8 +130,7 @@ def main() -> None:
         )
     )
 
-    print(f"[fluxon_kv] shared memory path: {SHARED_MEMORY_PATH}")
-    print(f"[fluxon_kv] shared file path: {SHARED_FILE_PATH}")
+    print(f"[fluxon_kv] share_mem_path: {SHARE_MEM_PATH}")
     print(f"[fluxon_kv] etcd endpoint: {ETCD_ENDPOINT}")
     print(f"[fluxon_kv] greptime base url: {GREPTIME_BASE_URL}")
     print(f"[fluxon_kv] start master in this script: {args.with_master}")
@@ -196,8 +193,7 @@ def build_owner_config() -> dict:
         "fluxonkv_spec": {
             "etcd_addresses": [ETCD_ENDPOINT],
             "cluster_name": CLUSTER_NAME,
-            "shared_memory_path": str(SHARED_MEMORY_PATH),
-            "shared_file_path": str(SHARED_FILE_PATH),
+            "share_mem_path": str(SHARE_MEM_PATH),
             "sub_cluster": "default",
             "large_file_paths": [str((WORKDIR / "large" / "owner").resolve())],
         },
@@ -300,8 +296,7 @@ from fluxon_py.runtime import register_ctrlc_callback
 
 # These constants are the only user-facing knobs in the minimal example.
 CLUSTER_NAME = "demo-kv-cluster"
-SHARED_MEMORY_PATH = "/dev/shm/fluxon_kv_demo"
-SHARED_FILE_PATH = "/tmp/fluxon_kv_demo/shared"
+SHARE_MEM_PATH = "/dev/shm/fluxon_kv_demo"
 CHANNEL_KEY = "demo_mq_channel_doc"
 CHANNEL_CAPACITY = 128
 CHANNEL_TTL_SECONDS = 300
@@ -336,8 +331,7 @@ def _build_store_config(*, role: str) -> FluxonKvClientConfig:
             "instance_key": f"demo_mq_{role}",
             "fluxonkv_spec": {
                 "cluster_name": CLUSTER_NAME,
-                "shared_memory_path": SHARED_MEMORY_PATH,
-                "shared_file_path": SHARED_FILE_PATH,
+                "share_mem_path": SHARE_MEM_PATH,
             },
         }
     )
@@ -481,9 +475,7 @@ def main() -> None:
     parser.add_argument("--role", choices=["producer", "consumer"], required=True)
     args = parser.parse_args()
 
-    # The minimal example keeps shared file authority explicit and local.
-    Path(SHARED_FILE_PATH).mkdir(parents=True, exist_ok=True)
-
+    # The minimal example keeps share_mem_path explicit and local.
     # init_logger() reads FLUXON_LOG and sets the user-process console log level.
     logger = init_logger(f"mpmc_demo_{args.role}")
     shutdown_requested = threading.Event()
@@ -543,7 +535,7 @@ FLUXON_LOG=DEBUG python3 examples/start_mpmc_demo.py --role consumer
 
 ### 关键接口常见错误处理
 
-- `new_or_bind_with_unique_key(...)` 失败：直接把 `unwrap_error()` 打出来，先检查 cluster、shared memory/shared file 路径、`unique_id`、`chan_role` 是否和对端一致
+- `new_or_bind_with_unique_key(...)` 失败：直接把 `unwrap_error()` 打出来，先检查 `cluster_name`、`share_mem_path`、`unique_id`、`chan_role` 是否和对端一致
 - `producer.put_data(...)` 返回 `ProducerClosedError`：按正常关闭路径处理，直接退出主循环
 - `consumer.get_data(...)` 返回 `ChannelClosedError`：按正常关闭路径处理，直接退出主循环
 
@@ -553,7 +545,7 @@ FLUXON_LOG=DEBUG python3 examples/start_mpmc_demo.py --role consumer
 
 - MQ Python 部分：由 `init_logger(...)` 初始化，直接输出到当前终端，不默认落盘，门限由 `FLUXON_LOG` 控制
 - MQ Rust / KV 后台部分：和 KV 一起走服务平面的后台日志链路；`master` 本地日志目录由 `master_cfg["log_dir"]` 指定
-- `shared_file_path`：本机共享文件 authority，只承载 `shared.json` 等共享文件
+- `share_mem_path`：KV 共享 bundle 根目录，只承载 `mmap.file`、`shared.json` 和 peer metadata；后端日志、profile、cache 从 owner 的 `large_file_paths` 派生
 
 如果服务平面的 `master.monitoring.otlp_log_api` 已经配置，MQ Rust / KV 后台部分的日志还会继续采集到 Greptime 的 `fluxon_logs` 表。
 
diff --git "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 5 - FS\346\216\245\345\217\243.md" "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 5 - FS\346\216\245\345\217\243.md"
index 9f67aaf..cf9ab79 100644
--- "a/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 5 - FS\346\216\245\345\217\243.md"	
+++ "b/fluxon_doc_cn/user_doc/\347\224\250\346\210\267 - 5 - FS\346\216\245\345\217\243.md"	
@@ -104,8 +104,7 @@ ETCD_ENDPOINT = "127.0.0.1:2379"
 GREPTIME_HTTP_PORT = 34030
 GREPTIME_BASE_URL = f"http://127.0.0.1:{GREPTIME_HTTP_PORT}"
 CLUSTER_NAME = "demo-fs-cluster"
-SHARED_MEMORY_PATH = Path("/dev/shm/fluxon_fs_demo").resolve()
-SHARED_FILE_PATH = Path("/tmp/fluxon_fs_demo/shared").resolve()
+SHARE_MEM_PATH = Path("/dev/shm/fluxon_fs_demo").resolve()
 WORKDIR = Path("/tmp/fluxon_fs_demo/runtime").resolve()
 REMOTE_ROOT_DIR = Path("/tmp/fluxon_fs_demo/remote_root").resolve()
 KV_MASTER_PORT = 34100
@@ -130,8 +129,6 @@ def main() -> None:
     args = parse_args()
     WORKDIR.mkdir(parents=True, exist_ok=True)
     REMOTE_ROOT_DIR.mkdir(parents=True, exist_ok=True)
-    SHARED_FILE_PATH.mkdir(parents=True, exist_ok=True)
-
     log_dir = (WORKDIR / "log").resolve()
     log_dir.mkdir(parents=True, exist_ok=True)
 
@@ -201,8 +198,7 @@ def main() -> None:
     )
 
     print(f"[fluxon_fs] cluster name: {CLUSTER_NAME}")
-    print(f"[fluxon_fs] shared memory path: {SHARED_MEMORY_PATH}")
-    print(f"[fluxon_fs] shared file path: {SHARED_FILE_PATH}")
+    print(f"[fluxon_fs] share_mem_path: {SHARE_MEM_PATH}")
     print(f"[fluxon_fs] remote root dir: {REMOTE_ROOT_DIR}")
     print(f"[fluxon_fs] export name: {EXPORT_NAME}")
     print(f"[fluxon_fs] owner instance key: {OWNER_INSTANCE_KEY}")
@@ -283,8 +279,7 @@ def build_owner_config() -> dict:
         "fluxonkv_spec": {
             "etcd_addresses": [ETCD_ENDPOINT],
             "cluster_name": CLUSTER_NAME,
-            "shared_memory_path": str(SHARED_MEMORY_PATH),
-            "shared_file_path": str(SHARED_FILE_PATH),
+            "share_mem_path": str(SHARE_MEM_PATH),
             "sub_cluster": "default",
             "large_file_paths": [str((WORKDIR / "large" / "owner").resolve())],
         },
@@ -297,8 +292,7 @@ def build_fs_master_config() -> dict:
             "instance_key": FS_MASTER_INSTANCE_KEY,
             "fluxonkv_spec": {
                 "cluster_name": CLUSTER_NAME,
-                "shared_memory_path": str(SHARED_MEMORY_PATH),
-                "shared_file_path": str(SHARED_FILE_PATH),
+                "share_mem_path": str(SHARE_MEM_PATH),
             },
         },
         "fluxon_fs": {
@@ -357,8 +351,7 @@ def build_fs_agent_config() -> dict:
             "instance_key": FS_AGENT_INSTANCE_KEY,
             "fluxonkv_spec": {
                 "cluster_name": CLUSTER_NAME,
-                "shared_memory_path": str(SHARED_MEMORY_PATH),
-                "shared_file_path": str(SHARED_FILE_PATH),
+                "share_mem_path": str(SHARE_MEM_PATH),
             },
         },
         "fluxon_fs": {
@@ -403,8 +396,7 @@ python3 examples/start_kv_and_fs_svc.py --without-master
 脚本会持续运行，并打印：
 
 - `cluster name`
-- `shared memory path`
-- `shared file path`
+- `share_mem_path`
 - `remote root dir`
 - `export name`
 - `owner instance key`
@@ -447,8 +439,7 @@ python3 examples/start_kv_and_fs_svc.py --without-master
 这条最小成功路径默认对应本页的本地完整示例，也就是不带 `--without-master` 的启动方式。`--without-master` 用于把当前机器接到已经存在的 KV / FS 集群；如果继续运行 `start_fluxon_fs_writer.py` / `start_fluxon_fs_reader.py`，配置里的这些对象必须和现有集群一致：
 
 - `cluster_name`
-- `shared_memory_path`
-- `shared_file_path`
+- `share_mem_path`
 - `fluxon_fs.master.instance_key`
 - `export_name`
 - `remote_root_dir_abs`
@@ -728,8 +719,7 @@ FLUXON_LOG=DEBUG python3 examples/start_fluxon_fs_reader.py -c <reader-config.ya
 
 - `start_kv_and_fs_svc.py` 是否还在运行
 - `CLUSTER_NAME`
-- `SHARED_MEMORY_PATH`
-- `SHARED_FILE_PATH`
+- `SHARE_MEM_PATH`
 
 ### `fluxon_fs cache config is not loaded yet`
 
diff --git a/fluxon_doc_en/user_doc/User - 1 - Architecture and Concepts.md b/fluxon_doc_en/user_doc/User - 1 - Architecture and Concepts.md
index 9c64b7f..3dc06a6 100644
--- a/fluxon_doc_en/user_doc/User - 1 - Architecture and Concepts.md	
+++ b/fluxon_doc_en/user_doc/User - 1 - Architecture and Concepts.md	
@@ -74,13 +74,9 @@ Cross-machine transport:
 - Metrics source queried by the panel
 - The panel only reads; it does not scrape by itself
 
-`shared_memory_path`
+`share_mem_path`
 
-- Shared-memory authority for local attachment to the same pool
-
-`shared_file_path`
-
-- Shared-file authority for `shared.json`, peer metadata, and other local shared files
+- Shared bundle root. The runtime appends `cluster_name` to this path, and the resulting cluster-scoped directory holds `mmap.file`, `shared.json`, and peer metadata.
 
 `log_dir`
 
diff --git a/fluxon_doc_en/user_doc/User - 3 - KV and RPC Interface.md b/fluxon_doc_en/user_doc/User - 3 - KV and RPC Interface.md
index ab3932a..b3f003d 100644
--- a/fluxon_doc_en/user_doc/User - 3 - KV and RPC Interface.md	
+++ b/fluxon_doc_en/user_doc/User - 3 - KV and RPC Interface.md	
@@ -47,8 +47,7 @@ ETCD_ENDPOINT = "127.0.0.1:2379"
 GREPTIME_HTTP_PORT = 34030
 GREPTIME_BASE_URL = f"http://127.0.0.1:{GREPTIME_HTTP_PORT}"
 CLUSTER_NAME = "demo-kv-cluster"
-SHARED_MEMORY_PATH = Path("/dev/shm/fluxon_kv_demo").resolve()
-SHARED_FILE_PATH = Path("/tmp/fluxon_kv_demo/shared").resolve()
+SHARE_MEM_PATH = Path("/dev/shm/fluxon_kv_demo").resolve()
 WORKDIR = Path("/tmp/fluxon_kv_demo/runtime").resolve()
 MASTER_PORT = 31000
 MASTER_UI_PORT = 18080
@@ -59,7 +58,6 @@ OWNER_DRAM_BYTES = 1073741824
 
 def main() -> None:
     args = parse_args()
-    SHARED_FILE_PATH.mkdir(parents=True, exist_ok=True)
     log_dir = (WORKDIR / "log").resolve()
 
     if args.with_master:
@@ -84,8 +82,7 @@ def main() -> None:
         children.append(ManagedSubprocess(label="master", proc=master_proc))
     children.append(ManagedSubprocess(label="owner", proc=owner_proc))
 
-    print(f"[fluxon_kv] shared memory path: {SHARED_MEMORY_PATH}")
-    print(f"[fluxon_kv] shared file path: {SHARED_FILE_PATH}")
+    print(f"[fluxon_kv] share_mem_path: {SHARE_MEM_PATH}")
     print(f"[fluxon_kv] etcd endpoint: {ETCD_ENDPOINT}")
     print(f"[fluxon_kv] greptime base url: {GREPTIME_BASE_URL}")
     print(f"[fluxon_kv] start master in this script: {args.with_master}")
@@ -145,8 +142,7 @@ def build_owner_config() -> dict:
         "fluxonkv_spec": {
             "etcd_addresses": [ETCD_ENDPOINT],
             "cluster_name": CLUSTER_NAME,
-            "shared_memory_path": str(SHARED_MEMORY_PATH),
-            "shared_file_path": str(SHARED_FILE_PATH),
+            "share_mem_path": str(SHARE_MEM_PATH),
             "sub_cluster": "default",
             "large_file_paths": [str((WORKDIR / "large" / "owner").resolve())],
         },
@@ -187,6 +183,7 @@ close()
 - `FluxonKvClientConfig`: config object, usually built from a Python dict
 - `new_store(config: FluxonKvClientConfig) -> Result[KvClient, ApiError]`: create one KV client
 - `KvClient`: single entrypoint for both KV and RPC
+- `KvClient.third_party_logs_dir() -> Result[str, ApiError]`: return the Fluxon-assigned log root for third-party Python components. Components should derive their own subdirectories under this root, for example `mq/`.
 - `MemHolder`: successful result holder from `get_blocking(...)`
 - `PutOptionalArgs`: optional write controls, most commonly `lease_id`
 
@@ -213,8 +210,7 @@ from fluxon_py import FluxonKvClientConfig, new_store
 
 INSTANCE_KEY = "demo_kv_external"
 CLUSTER_NAME = "demo-kv-cluster"
-SHARED_MEMORY_PATH = "/dev/shm/fluxon_kv_demo"
-SHARED_FILE_PATH = "/tmp/fluxon_kv_demo/shared"
+SHARE_MEM_PATH = "/dev/shm/fluxon_kv_demo"
 
 
 def main() -> None:
@@ -223,8 +219,7 @@ def main() -> None:
             "instance_key": INSTANCE_KEY,
             "fluxonkv_spec": {
                 "cluster_name": CLUSTER_NAME,
-                "shared_memory_path": SHARED_MEMORY_PATH,
-                "shared_file_path": SHARED_FILE_PATH,
+                "share_mem_path": SHARE_MEM_PATH,
             },
             "test_spec_config": {
                 "disable_observability": True,
@@ -266,6 +261,7 @@ Useful calls:
 - `get_size(key)`: query payload size without reading the whole object
 - `is_exist(key)`: existence check
 - `remove(key)`: delete a key
+- `third_party_logs_dir()`: return `{large_file_paths[0]}/{cluster_name}_cluster_third_party_logs` as a `Result[str, ApiError]`
 
 To increase user-process logs:
 
@@ -273,6 +269,8 @@ To increase user-process logs:
 FLUXON_LOG=DEBUG python3 examples/external_put_get_del.py
 ```
 
+Third-party Python components should write their file logs under the root returned by `store.third_party_logs_dir().unwrap(...)`, each in its own component subdirectory such as `mq/`. This keeps log directory usage bounded and lets the Fluxon observability plane discover and collect those file logs through one owner-derived root.
+
 ### Minimal Node-to-Node RPC Example
 
 `examples/rpc_call.py`:
@@ -288,8 +286,7 @@ from fluxon_py import FluxonKvClientConfig, new_store
 RPC_SERVER_INSTANCE_KEY = "demo_rpc_server"
 RPC_CLIENT_INSTANCE_KEY = "demo_rpc_client"
 CLUSTER_NAME = "demo-kv-cluster"
-SHARED_MEMORY_PATH = "/dev/shm/fluxon_kv_demo"
-SHARED_FILE_PATH = "/tmp/fluxon_kv_demo/shared"
+SHARE_MEM_PATH = "/dev/shm/fluxon_kv_demo"
 
 
 def _build_config(*, instance_key: str) -> FluxonKvClientConfig:
@@ -298,8 +295,7 @@ def _build_config(*, instance_key: str) -> FluxonKvClientConfig:
             "instance_key": instance_key,
             "fluxonkv_spec": {
                 "cluster_name": CLUSTER_NAME,
-                "shared_memory_path": SHARED_MEMORY_PATH,
-                "shared_file_path": SHARED_FILE_PATH,
+                "share_mem_path": SHARE_MEM_PATH,
             },
             "test_spec_config": {
                 "disable_observability": True,
@@ -359,8 +355,7 @@ instance_key: my-kv-client-1
 
 fluxonkv_spec:
   cluster_name: demo-kv-cluster
-  shared_memory_path: /dev/shm/fluxon
-  shared_file_path: /var/lib/fluxon/shared
+  share_mem_path: /dev/shm/fluxon
   p2p_listen_port: 31001
 ```
 
@@ -377,16 +372,14 @@ fluxonkv_spec:
   etcd_addresses:
     - 127.0.0.1:2379
   cluster_name: demo-kv-cluster
-  shared_memory_path: /dev/shm/fluxon
-  shared_file_path: /var/lib/fluxon/shared
+  share_mem_path: /dev/shm/fluxon
   p2p_listen_port: 31000
   sub_cluster: default
 ```
 
-Keep these authorities separate:
+Keep these roots separate:
 
-- `shared_memory_path`: shared-memory / mmap authority
-- `shared_file_path`: shared-file authority for `shared.json` and peer metadata files
+- `share_mem_path`: shared bundle root. The runtime appends `cluster_name` to this path, and the resulting cluster-scoped directory holds `mmap.file`, `shared.json`, and peer metadata.
 - `large_file_paths`: owner-only large-file authority for logs, profiles, caches, and other derived runtime assets
 - `FLUXON_LOG`: console log threshold for the user process
 
diff --git a/fluxon_doc_en/user_doc/User - 4 - MQ Interface.md b/fluxon_doc_en/user_doc/User - 4 - MQ Interface.md
index dcfe33c..8f59529 100644
--- a/fluxon_doc_en/user_doc/User - 4 - MQ Interface.md	
+++ b/fluxon_doc_en/user_doc/User - 4 - MQ Interface.md	
@@ -116,7 +116,7 @@ Parameter constraints:
 
 ### Common Error Handling
 
-- `new_or_bind_with_unique_key(...)` fails: first check cluster name, shared memory / shared file paths, `unique_id`, and that both ends use matching roles
+- `new_or_bind_with_unique_key(...)` fails: first check `cluster_name`, `share_mem_path`, `unique_id`, and that both ends use matching roles
 - `producer.put_data(...)` returns `ProducerClosedError`: treat it as a normal shutdown signal and exit the main loop
 - `consumer.get_data(...)` returns `ChannelClosedError`: treat it as a normal shutdown signal and exit the main loop
 
@@ -124,8 +124,8 @@ Parameter constraints:
 
 - Python-side MQ logs come from `init_logger(...)` and go to the current terminal by default; the threshold is controlled by `FLUXON_LOG`
 - Rust / KV background logs follow the shared service-plane pipeline, and the master's local log authority is `master_cfg["log_dir"]`
-- `shared_file_path` remains the local shared-file authority for `shared.json` and related files
-- `large_file_paths` remains the owner-only large-file authority for backend logs, profiles, caches, and other derived runtime assets
+- `share_mem_path` is the shared bundle root for `mmap.file`, `shared.json`, and peer metadata
+- `large_file_paths` is the owner-only large-file authority for backend logs, profiles, caches, and other derived runtime assets
 
 If `master.monitoring.otlp_log_api` is configured, backend logs continue to flow into the Greptime `fluxon_logs` table.
 
diff --git a/fluxon_doc_en/user_doc/User - 5 - FS Interface.md b/fluxon_doc_en/user_doc/User - 5 - FS Interface.md
index fdf2242..dcf3cd2 100644
--- a/fluxon_doc_en/user_doc/User - 5 - FS Interface.md	
+++ b/fluxon_doc_en/user_doc/User - 5 - FS Interface.md	
@@ -287,8 +287,7 @@ Usually means the external client did not attach to the local owner. Check:
 
 - whether `start_kv_and_fs_svc.py` is still running
 - `CLUSTER_NAME`
-- `SHARED_MEMORY_PATH`
-- `SHARED_FILE_PATH`
+- `SHARE_MEM_PATH`
 
 ### `fluxon_fs cache config is not loaded yet`
 
diff --git a/fluxon_py/_api_ext_chan/mpmc.py b/fluxon_py/_api_ext_chan/mpmc.py
index 8ad4683..4ddbc1e 100644
--- a/fluxon_py/_api_ext_chan/mpmc.py
+++ b/fluxon_py/_api_ext_chan/mpmc.py
@@ -243,12 +243,12 @@ def stable_delete_ready_keys_for_member(
 
 def _local_member_id_cache_path(kv_api: KvClient, mpmc_id: str, role: ChanRole) -> str:
     cfg = kv_api.config()
-    shared_memory_path = cfg.fluxonkv_spec_shared_memory_path
-    if not isinstance(shared_memory_path, str) or not shared_memory_path.strip():
-        raise ValueError("fluxonkv_spec.shared_memory_path must be a non-empty string for local member-id cache")
+    share_mem_path = cfg.fluxonkv_spec_share_mem_path
+    if not isinstance(share_mem_path, str) or not share_mem_path.strip():
+        raise ValueError("fluxonkv_spec.share_mem_path must be a non-empty string for local member-id cache")
     cluster_name = kv_api.get_cluster_name()
     role_name = role.value
-    cache_dir = os.path.join(shared_memory_path, cluster_name, "mq_member_id_cache")
+    cache_dir = os.path.join(share_mem_path, cluster_name, "mq_member_id_cache")
     os.makedirs(cache_dir, exist_ok=True)
     return os.path.join(cache_dir, f"mpmc_{mpmc_id}_{role_name}.json")
 
diff --git a/fluxon_py/config.py b/fluxon_py/config.py
index e591d65..5861f64 100644
--- a/fluxon_py/config.py
+++ b/fluxon_py/config.py
@@ -108,8 +108,7 @@ def _yaml_template():
 fluxonkv_spec:                        # fluxon kv specific config (dict(optional))
   etcd_addresses:                     # Etcd address list ((None|['{str}:{int}']))
   cluster_name:                       # Cluster name (str)
-  shared_memory_path:                 # Shared memory path (str)
-  shared_file_path:                   # Shared file path for shared.json/logs/profiles (str)
+  share_mem_path:                     # Shared bundle path for mmap.file/shared.json/peer metadata (str)
   large_file_paths:                   # Owner-mode ordered large-file roots (['{str}'](optional))
   p2p_listen_port:                    # P2P QUIC listen port override (int(optional))
   redis_compat:                       # Enable Redis protocol shim (dict(optional))
@@ -350,12 +349,9 @@ def _validate_fluxonkv_contract(cfg: Dict[str, Any]) -> None:
 
     is_zero_contribution = _is_zero_contribution_fluxonkv_config(cfg)
 
-    shared_memory_path = spec.get("shared_memory_path")
-    if not isinstance(shared_memory_path, str) or not shared_memory_path.strip():
-        raise ValueError("fluxonkv_spec.shared_memory_path must be a non-empty string")
-    shared_file_path = spec.get("shared_file_path")
-    if not isinstance(shared_file_path, str) or not shared_file_path.strip():
-        raise ValueError("fluxonkv_spec.shared_file_path must be a non-empty string")
+    share_mem_path = spec.get("share_mem_path")
+    if not isinstance(share_mem_path, str) or not share_mem_path.strip():
+        raise ValueError("fluxonkv_spec.share_mem_path must be a non-empty string")
 
     if "rdma_device_names" in cfg:
         raise ValueError("rdma_device_names has been removed from Fluxon KV config")
@@ -530,10 +526,10 @@ def fluxonkv_spec_cluster_name(self):
         return self.config_dict["fluxonkv_spec"]["cluster_name"]
     
     @property
-    def fluxonkv_spec_shared_memory_path(self):
+    def fluxonkv_spec_share_mem_path(self):
         if "fluxonkv_spec" not in self.config_dict:
             return None
-        return self.config_dict["fluxonkv_spec"]["shared_memory_path"]
+        return self.config_dict["fluxonkv_spec"]["share_mem_path"]
     
     @property
     def fluxonkv_spec_transfer_engine(self):
diff --git a/fluxon_py/kvclient/fluxon.py b/fluxon_py/kvclient/fluxon.py
index 3578405..1325e3d 100644
--- a/fluxon_py/kvclient/fluxon.py
+++ b/fluxon_py/kvclient/fluxon.py
@@ -821,6 +821,23 @@ def get_etcd_config(self) -> List[str]:
             out.append(addr)
         return out
 
+    def third_party_logs_dir(self) -> Result[str, ApiError]:
+        if self._client is None:
+            return Result.new_error(GeneralError(message="Store not initialized"))
+        try:
+            res = self._client.third_party_logs_dir()
+            if not res.is_ok():
+                return Result.new_error(res.unwrap_error())
+            logs_dir = res.unwrap()
+            if not isinstance(logs_dir, str) or not logs_dir:
+                return Result.new_error(
+                    GeneralError(message=f"third_party_logs_dir must be non-empty str; got {logs_dir!r}")
+                )
+            return Result.new_ok(logs_dir)
+        except ApiError as e:
+            return Result.new_error(e)
+        except Exception as e:
+            return Result.new_error(GeneralError(message=f"third_party_logs_dir failed: {e}"))
 
     def ensure_zero_contribution_for_channel(self) -> None:
         self._config.ensure_zero_contribution_for_channel()
diff --git a/fluxon_py/kvclient/kvclient_interface.py b/fluxon_py/kvclient/kvclient_interface.py
index 3170628..f50db0f 100644
--- a/fluxon_py/kvclient/kvclient_interface.py
+++ b/fluxon_py/kvclient/kvclient_interface.py
@@ -207,6 +207,9 @@ def get_cluster_name(self) -> str:
     def get_etcd_config(self) -> List[str]:
         """Return etcd endpoint list as raw host:port strings (no scheme)."""
 
+    @abstractmethod
+    def third_party_logs_dir(self) -> Result[str, ApiError]:
+        """Return the owner-derived log root for third-party Python components."""
 
     @abstractmethod
     def ensure_zero_contribution_for_channel(self) -> None:
diff --git a/fluxon_py/kvclient/mooncake.py b/fluxon_py/kvclient/mooncake.py
index becd08d..4457cc3 100644
--- a/fluxon_py/kvclient/mooncake.py
+++ b/fluxon_py/kvclient/mooncake.py
@@ -836,6 +836,12 @@ def get_etcd_config(self) -> List[str]:
                 raise InvalidConfigurationError(message=f"etcd endpoint must be raw host:port (no scheme), got: {addr!r}")
         return endpoints
 
+    def third_party_logs_dir(self) -> Result[str, ApiError]:
+        return Result.new_error(
+            GeneralError(
+                message="third_party_logs_dir is only supported by the Fluxon backend"
+            )
+        )
 
     def ensure_zero_contribution_for_channel(self) -> None:
         self._config.ensure_zero_contribution_for_channel()
diff --git a/fluxon_py/logging.py b/fluxon_py/logging.py
index 33fb2ae..bf67c3d 100755
--- a/fluxon_py/logging.py
+++ b/fluxon_py/logging.py
@@ -94,11 +94,7 @@ def init_logger(name: str = "fluxon") -> Logger:
 def init_mq_file_logger(name: str = "fluxon_mq") -> Logger:
     """Initialize an MQ-specific logger with an optional file handler.
 
-    Path rule aligned with Rust:
-        shared_file_path/{cluster_name}_cluster_mq_logs/
-
-    shared_file_path and cluster_name are provided by fluxon_pyo3.KvClient.logs_dir(),
-    to avoid scattering files under the shared-memory root directory.
+    Path rule aligned with Rust: third_party_logs_dir() is derived from owner large_file_paths.
 
     If fluxon_pyo3 is unavailable, falls back to console-only logging.
     """
@@ -112,20 +108,22 @@ def init_mq_file_logger(name: str = "fluxon_mq") -> Logger:
     ch.setFormatter(CustomFormatter())
     logger.addHandler(ch)
 
-    # If fluxon_pyo3 is available, try using KvClient.logs_dir() as file log directory.
+    # Keep third-party file logs under one Fluxon-owned root so observability can discover them.
     log_dir = None
     try:
         from .tool import import_fluxon_pyo3_local
 
         fp = import_fluxon_pyo3_local()
         client = fp.KvClient()
-        log_dir = client.logs_dir()
+        third_party_log_dir = client.third_party_logs_dir().unwrap("third_party_logs_dir failed")
+        if isinstance(third_party_log_dir, str) and third_party_log_dir:
+            log_dir = os.path.join(third_party_log_dir, "mq")
     except ImportError as exc:
         logger.warning("init_mq_file_logger: fluxon_pyo3 not available; MQ file logs disabled: %s", exc)
         log_dir = None
     except Exception as exc:  # noqa: BLE001
         # Keep usable in cases like invalid config or client init failure; use console-only logging.
-        logger.warning("init_mq_file_logger: KvClient/logs_dir failed: %s", exc)
+        logger.warning("init_mq_file_logger: KvClient/third_party_logs_dir failed: %s", exc)
         log_dir = None
 
     if isinstance(log_dir, str) and log_dir:
diff --git a/fluxon_py/tests/fluxon_fs_transfer_tikv_support.py b/fluxon_py/tests/fluxon_fs_transfer_tikv_support.py
index d120cc7..7e38d04 100644
--- a/fluxon_py/tests/fluxon_fs_transfer_tikv_support.py
+++ b/fluxon_py/tests/fluxon_fs_transfer_tikv_support.py
@@ -1546,10 +1546,8 @@ def __init__(
         self._kv_master_port = _pick_free_port()
         self._ui_base_url = f"http://127.0.0.1:{self._ui_port}"
         self._fs_s3_base_url = f"{self._ui_base_url}/fs_s3"
-        self._shared_memory_root = self._work_root / "sm"
-        self._shared_file_root = self._work_root / "sf"
-        self._shared_memory_root.mkdir(parents=True, exist_ok=True)
-        self._shared_file_root.mkdir(parents=True, exist_ok=True)
+        self._share_mem_root = self._work_root / "sm"
+        self._share_mem_root.mkdir(parents=True, exist_ok=True)
         self._etcd: EtcdHarness | None = None
         self._tikv: TiKvHarness | None = None
         self._monitor: DummyMonitoringHarness | None = None
@@ -1573,8 +1571,8 @@ def store_config(self) -> FluxonFsTransferStateStoreConfig:
             raise RuntimeError("store_config is unavailable before harness init")
         return self._store_config
 
-    def _cluster_scoped_shared_file_dir(self) -> Path:
-        return self._shared_file_root / self._cluster_name
+    def _cluster_scoped_share_mem_dir(self) -> Path:
+        return self._share_mem_root / self._cluster_name
 
     def _monitoring_block(self) -> dict[str, Any]:
         if self._monitor is None:
@@ -1595,8 +1593,7 @@ def _owner_kvclient_config(self) -> dict[str, Any]:
             "fluxonkv_spec": {
                 "etcd_addresses": [self._etcd.endpoint],
                 "cluster_name": self._cluster_name,
-                "shared_memory_path": str(self._shared_memory_root),
-                "shared_file_path": str(self._shared_file_root),
+                "share_mem_path": str(self._share_mem_root),
                 "sub_cluster": "transfer_owner",
                 "large_file_paths": [str(self._work_root / "large" / "owner")],
             },
@@ -1610,8 +1607,7 @@ def _external_kvclient_config(self, *, instance_key: str) -> dict[str, Any]:
             "instance_key": instance_key,
             "fluxonkv_spec": {
                 "cluster_name": self._cluster_name,
-                "shared_memory_path": str(self._shared_memory_root),
-                "shared_file_path": str(self._shared_file_root),
+                "share_mem_path": str(self._share_mem_root),
             },
             "test_spec_config": {
                 "disable_observability": True,
@@ -1752,7 +1748,7 @@ def _prepare_configs(self) -> None:
                 },
             },
         )
-        self._owner_shared_json_path = self._cluster_scoped_shared_file_dir() / "shared.json"
+        self._owner_shared_json_path = self._cluster_scoped_share_mem_dir() / "shared.json"
 
     def _start_logged_process(
         self,
diff --git a/fluxon_py/tests/test_api_chan_mpmc/test_mpmc_simple_bench.py b/fluxon_py/tests/test_api_chan_mpmc/test_mpmc_simple_bench.py
index 5f45336..a29c46f 100644
--- a/fluxon_py/tests/test_api_chan_mpmc/test_mpmc_simple_bench.py
+++ b/fluxon_py/tests/test_api_chan_mpmc/test_mpmc_simple_bench.py
@@ -69,7 +69,6 @@ def _find_project_root(start: Path) -> Path:
     MOONCAKE_MASTER_SERVER_ADDRESS,
     MOONCAKE_METADATA_SERVER,
     load_test_fluxon_cluster_name,
-    load_test_fluxon_share_file_path,
     load_test_fluxon_share_mem_path,
     new_test_consumer,
     new_test_producer,
@@ -103,7 +102,7 @@ def _find_project_root(start: Path) -> Path:
 WORKER_EXIT_TIMEOUT_SECONDS = 60.0
 STOP_KEY_PREFIX = "/test_mpmc_simple_bench/stop/"
 SUMMARY_KEY_PREFIX = "/test_mpmc_simple_bench/summary/"
-SharedBundle = tuple[str, str]
+SharedBundle = str
 PayloadFieldValue = bytes | DLPackBytesView
 PayloadFields = dict[str, PayloadFieldValue]
 SINGLE_FIELD_PAYLOAD_KEY = "payload"
@@ -159,8 +158,7 @@ def _build_parser() -> argparse.ArgumentParser:
     main_parser.add_argument("--batch-size", type=int, required=False, default=DEFAULT_BATCH_SIZE)
     main_parser.add_argument("--prefetch-num", type=int, required=False, default=DEFAULT_PREFETCH_NUM)
     main_parser.add_argument("--channel-capacity", type=int, required=False, default=DEFAULT_CHANNEL_CAPACITY)
-    main_parser.add_argument("--shared-memory-paths", type=str, required=False)
-    main_parser.add_argument("--shared-file-paths", type=str, required=False)
+    main_parser.add_argument("--share-mem-paths", type=str, required=False)
     producer_parser = subparsers.add_parser("run_producer", help="Run one producer worker")
     producer_parser.add_argument("--backend-type", required=True, type=str)
     producer_parser.add_argument("--ip", required=True, type=str)
@@ -170,8 +168,7 @@ def _build_parser() -> argparse.ArgumentParser:
     producer_parser.add_argument("--payload-bytes", required=True, type=int)
     producer_parser.add_argument("--payload-kind", required=True, type=str, choices=PAYLOAD_KIND_CHOICES)
     producer_parser.add_argument("--channel-capacity", required=True, type=int)
-    producer_parser.add_argument("--shared-memory-path", required=False, type=str)
-    producer_parser.add_argument("--shared-file-path", required=False, type=str)
+    producer_parser.add_argument("--share-mem-path", required=False, type=str)
     producer_parser.add_argument("--stop-key", required=True, type=str)
 
     consumer_parser = subparsers.add_parser("run_consumer", help="Run one consumer worker")
@@ -185,8 +182,7 @@ def _build_parser() -> argparse.ArgumentParser:
     consumer_parser.add_argument("--payload-kind", required=True, type=str, choices=PAYLOAD_KIND_CHOICES)
     consumer_parser.add_argument("--prefetch-num", required=True, type=int)
     consumer_parser.add_argument("--channel-capacity", required=True, type=int)
-    consumer_parser.add_argument("--shared-memory-path", required=False, type=str)
-    consumer_parser.add_argument("--shared-file-path", required=False, type=str)
+    consumer_parser.add_argument("--share-mem-path", required=False, type=str)
     consumer_parser.add_argument("--stop-key", required=True, type=str)
     consumer_parser.add_argument("--summary-key", required=True, type=str)
     return parser
@@ -209,8 +205,7 @@ def _run_main(args: argparse.Namespace) -> None:
     _validate_main_args(args)
     consumer_counts = _parse_consumer_counts(args.consumer_counts)
     shared_bundles = _parse_shared_bundles(
-        shared_memory_paths_raw=args.shared_memory_paths,
-        shared_file_paths_raw=args.shared_file_paths,
+        share_mem_paths_raw=args.share_mem_paths,
     )
     for consumer_count in consumer_counts:
         _run_one_case(
@@ -272,8 +267,7 @@ def _run_one_case(
     bootstrap_store = _new_channel_store(
         role_key=f"{bench_id}_bootstrap",
         backend_type=KV_SVC_TYPE,
-        shared_memory_path=bootstrap_bundle[0],
-        shared_file_path=bootstrap_bundle[1],
+        share_mem_path=bootstrap_bundle,
     )
     bootstrap_producer = None
     worker_processes: list[subprocess.Popen[str]] = []
@@ -305,8 +299,7 @@ def _run_one_case(
                     payload_bytes=payload_bytes,
                     payload_kind=payload_kind,
                     channel_capacity=channel_capacity,
-                    shared_memory_path=producer_bundle[0],
-                    shared_file_path=producer_bundle[1],
+                    share_mem_path=producer_bundle,
                     stop_key=stop_key,
                 )
             )
@@ -338,10 +331,8 @@ def _run_one_case(
                         str(prefetch_num),
                         "--channel-capacity",
                         str(channel_capacity),
-                        "--shared-memory-path",
-                        consumer_bundle[0],
-                        "--shared-file-path",
-                        consumer_bundle[1],
+                        "--share-mem-path",
+                        consumer_bundle,
                         "--stop-key",
                         stop_key,
                         "--summary-key",
@@ -418,8 +409,7 @@ def _run_producer(args: argparse.Namespace) -> None:
     store = _new_channel_store(
         role_key=f"{args.bench_id}_producer_{args.producer_id}",
         backend_type=args.backend_type,
-        shared_memory_path=args.shared_memory_path,
-        shared_file_path=args.shared_file_path,
+        share_mem_path=args.share_mem_path,
     )
     producer = None
     restore_signal_listener = None
@@ -500,8 +490,7 @@ def _run_consumer(args: argparse.Namespace) -> None:
     store = _new_channel_store(
         role_key=f"{args.bench_id}_consumer_{args.consumer_id}",
         backend_type=args.backend_type,
-        shared_memory_path=args.shared_memory_path,
-        shared_file_path=args.shared_file_path,
+        share_mem_path=args.share_mem_path,
     )
     consumer = None
     restore_signal_listener = None
@@ -669,8 +658,7 @@ def _validate_main_args(args: argparse.Namespace) -> None:
     _validate_non_negative_int("prefetch_num", args.prefetch_num)
     _validate_positive_int("channel_capacity", args.channel_capacity)
     _parse_shared_bundles(
-        shared_memory_paths_raw=args.shared_memory_paths,
-        shared_file_paths_raw=args.shared_file_paths,
+        share_mem_paths_raw=args.share_mem_paths,
     )
     _validate_sample_window(
         total_duration_seconds=int(args.duration_seconds),
@@ -732,14 +720,12 @@ def _new_channel_store(
     *,
     role_key: str,
     backend_type: str,
-    shared_memory_path: str | None,
-    shared_file_path: str | None,
+    share_mem_path: str | None,
 ):
     config = _new_store_config(
         instance_key=role_key,
         backend_type=backend_type,
-        shared_memory_path=shared_memory_path,
-        shared_file_path=shared_file_path,
+        share_mem_path=share_mem_path,
     )
     result = new_store(config)
     if not result.is_ok():
@@ -751,8 +737,7 @@ def _new_store_config(
     *,
     instance_key: str,
     backend_type: str,
-    shared_memory_path: str | None,
-    shared_file_path: str | None,
+    share_mem_path: str | None,
 ) -> FluxonKvClientConfig:
     if backend_type == KvClientType.MOONCAKE.value:
         return FluxonKvClientConfig(
@@ -772,14 +757,12 @@ def _new_store_config(
         )
 
     if backend_type == KvClientType.FLUXON.value:
-        resolved_shared_memory_path, resolved_shared_file_path = _resolve_fluxon_shared_bundle(
-            shared_memory_path=shared_memory_path,
-            shared_file_path=shared_file_path,
+        resolved_share_mem_path = _resolve_fluxon_shared_bundle(
+            share_mem_path=share_mem_path,
         )
         fluxon_spec: dict[str, Any] = {
             "cluster_name": load_test_fluxon_cluster_name(),
-            "shared_memory_path": resolved_shared_memory_path,
-            "shared_file_path": resolved_shared_file_path,
+            "share_mem_path": resolved_share_mem_path,
         }
         return FluxonKvClientConfig(
             {
@@ -813,8 +796,7 @@ def _spawn_producer(
     payload_bytes: int,
     payload_kind: PayloadKind,
     channel_capacity: int,
-    shared_memory_path: str,
-    shared_file_path: str,
+    share_mem_path: str,
     stop_key: str,
 ) -> subprocess.Popen[str]:
     return _spawn_worker(
@@ -838,10 +820,8 @@ def _spawn_producer(
             payload_kind.value,
             "--channel-capacity",
             str(channel_capacity),
-            "--shared-memory-path",
-            shared_memory_path,
-            "--shared-file-path",
-            shared_file_path,
+            "--share-mem-path",
+            share_mem_path,
             "--stop-key",
             stop_key,
         ]
@@ -850,21 +830,11 @@ def _spawn_producer(
 
 def _parse_shared_bundles(
     *,
-    shared_memory_paths_raw: str | None,
-    shared_file_paths_raw: str | None,
+    share_mem_paths_raw: str | None,
 ) -> tuple[SharedBundle, ...]:
-    if shared_memory_paths_raw is None and shared_file_paths_raw is None:
-        return ((load_test_fluxon_share_mem_path(), load_test_fluxon_share_file_path()),)
-    if shared_memory_paths_raw is None or shared_file_paths_raw is None:
-        raise ValueError("shared-memory-paths and shared-file-paths must be set together")
-    shared_memory_paths = _parse_csv_paths(raw=shared_memory_paths_raw, arg_name="shared-memory-paths")
-    shared_file_paths = _parse_csv_paths(raw=shared_file_paths_raw, arg_name="shared-file-paths")
-    if len(shared_memory_paths) != len(shared_file_paths):
-        raise ValueError(
-            "shared-memory-paths and shared-file-paths length mismatch: "
-            f"{len(shared_memory_paths)} != {len(shared_file_paths)}"
-        )
-    return tuple(zip(shared_memory_paths, shared_file_paths, strict=True))
+    if share_mem_paths_raw is None:
+        return (load_test_fluxon_share_mem_path(),)
+    return _parse_csv_paths(raw=share_mem_paths_raw, arg_name="share-mem-paths")
 
 
 def _parse_csv_paths(*, raw: str, arg_name: str) -> tuple[str, ...]:
@@ -887,18 +857,14 @@ def _select_shared_bundle(shared_bundles: tuple[SharedBundle, ...], worker_idx:
 
 def _resolve_fluxon_shared_bundle(
     *,
-    shared_memory_path: str | None,
-    shared_file_path: str | None,
+    share_mem_path: str | None,
 ) -> SharedBundle:
-    if shared_memory_path is None or shared_file_path is None:
-        raise ValueError(
-            "fluxon backend requires explicit shared_memory_path/shared_file_path for each worker"
-        )
-    resolved_shared_memory_path = str(shared_memory_path).strip()
-    resolved_shared_file_path = str(shared_file_path).strip()
-    if resolved_shared_memory_path == "" or resolved_shared_file_path == "":
-        raise ValueError("shared_memory_path/shared_file_path must be non-empty strings")
-    return (resolved_shared_memory_path, resolved_shared_file_path)
+    if share_mem_path is None:
+        raise ValueError("fluxon backend requires explicit share_mem_path for each worker")
+    resolved_share_mem_path = str(share_mem_path).strip()
+    if resolved_share_mem_path == "":
+        raise ValueError("share_mem_path must be a non-empty string")
+    return resolved_share_mem_path
 
 
 def _terminate_processes(processes: list[subprocess.Popen[str]]) -> None:
diff --git a/fluxon_py/tests/test_api_chan_mpmc/test_mpmc_simple_bench2.py b/fluxon_py/tests/test_api_chan_mpmc/test_mpmc_simple_bench2.py
index eabac11..bc9cfa0 100644
--- a/fluxon_py/tests/test_api_chan_mpmc/test_mpmc_simple_bench2.py
+++ b/fluxon_py/tests/test_api_chan_mpmc/test_mpmc_simple_bench2.py
@@ -67,7 +67,6 @@ def _find_project_root(start: Path) -> Path:
     MOONCAKE_MASTER_SERVER_ADDRESS,
     MOONCAKE_METADATA_SERVER,
     load_test_fluxon_cluster_name,
-    load_test_fluxon_share_file_path,
     load_test_fluxon_share_mem_path,
     new_test_consumer,
     new_test_producer,
@@ -898,8 +897,7 @@ def _new_store_config(*, instance_key: str, backend_type: str) -> FluxonKvClient
     if backend_type == KvClientType.FLUXON.value:
         fluxon_spec: dict[str, Any] = {
             "cluster_name": load_test_fluxon_cluster_name(),
-            "shared_memory_path": load_test_fluxon_share_mem_path(),
-            "shared_file_path": load_test_fluxon_share_file_path(),
+            "share_mem_path": load_test_fluxon_share_mem_path(),
         }
         return FluxonKvClientConfig(
             {
diff --git a/fluxon_py/tests/test_backend_fallback_close.py b/fluxon_py/tests/test_backend_fallback_close.py
index a33da71..74ad26d 100644
--- a/fluxon_py/tests/test_backend_fallback_close.py
+++ b/fluxon_py/tests/test_backend_fallback_close.py
@@ -93,6 +93,9 @@ def get_cluster_name(self):
     def get_etcd_config(self):
         return []
 
+    def third_party_logs_dir(self):
+        return Result.new_ok("/tmp/fluxon_third_party_logs")
+
     def ensure_zero_contribution_for_channel(self):
         return None
 
diff --git a/fluxon_py/tests/test_backend_relay_deployconf.template.yaml b/fluxon_py/tests/test_backend_relay_deployconf.template.yaml
index 74f4943..d965923 100644
--- a/fluxon_py/tests/test_backend_relay_deployconf.template.yaml
+++ b/fluxon_py/tests/test_backend_relay_deployconf.template.yaml
@@ -85,8 +85,7 @@ service:
           etcd_addresses:
             - "__ETCD_CONTAINER_NAME__:2379"
           cluster_name: "__CLUSTER_NAME__"
-          shared_memory_path: "__OWNER1_SHM__"
-          shared_file_path: "__OWNER1_SHARED_FILE__"
+          share_mem_path: "__OWNER1_SHM__"
           sub_cluster: "owner1"
           large_file_paths: ["__OWNER1_LARGE_ROOT__"]
           p2p_listen_port: 31011
@@ -116,8 +115,7 @@ service:
           etcd_addresses:
             - "__ETCD_CONTAINER_NAME__:2379"
           cluster_name: "__CLUSTER_NAME__"
-          shared_memory_path: "__OWNER2_SHM__"
-          shared_file_path: "__OWNER2_SHARED_FILE__"
+          share_mem_path: "__OWNER2_SHM__"
           sub_cluster: "owner2"
           large_file_paths: ["__OWNER2_LARGE_ROOT__"]
           p2p_listen_port: 31012
@@ -147,8 +145,7 @@ service:
           etcd_addresses:
             - "__ETCD_CONTAINER_NAME__:2379"
           cluster_name: "__CLUSTER_NAME__"
-          shared_memory_path: "__OWNER3_SHM__"
-          shared_file_path: "__OWNER3_SHARED_FILE__"
+          share_mem_path: "__OWNER3_SHM__"
           sub_cluster: "owner3"
           large_file_paths: ["__OWNER3_LARGE_ROOT__"]
           p2p_listen_port: 31013
@@ -178,8 +175,7 @@ service:
           etcd_addresses:
             - "__ETCD_CONTAINER_NAME__:2379"
           cluster_name: "__CLUSTER_NAME__"
-          shared_memory_path: "__OWNER4_SHM__"
-          shared_file_path: "__OWNER4_SHARED_FILE__"
+          share_mem_path: "__OWNER4_SHM__"
           sub_cluster: "owner4"
           large_file_paths: ["__OWNER4_LARGE_ROOT__"]
           p2p_listen_port: 31014
diff --git a/fluxon_py/tests/test_backend_relay_docker.py b/fluxon_py/tests/test_backend_relay_docker.py
index 1699b0c..d51bcbb 100644
--- a/fluxon_py/tests/test_backend_relay_docker.py
+++ b/fluxon_py/tests/test_backend_relay_docker.py
@@ -42,21 +42,21 @@ def main() -> None:
             raise RuntimeError("mode is required")
         mode = sys.argv[1]
         if mode == "wait-store":
-            if len(sys.argv) != 6:
-                raise RuntimeError("wait-store requires: cluster_name shared_memory_path shared_file_path timeout_seconds")
-            _wait_store(sys.argv[2], sys.argv[3], sys.argv[4], float(sys.argv[5]))
+            if len(sys.argv) != 5:
+                raise RuntimeError("wait-store requires: cluster_name share_mem_path timeout_seconds")
+            _wait_store(sys.argv[2], sys.argv[3], float(sys.argv[4]))
             print("wait-store ok")
             return
         if mode == "put":
-            if len(sys.argv) != 7:
-                raise RuntimeError("put requires: cluster_name shared_memory_path shared_file_path key payload_base64")
-            _put(sys.argv[2], sys.argv[3], sys.argv[4], sys.argv[5], sys.argv[6])
+            if len(sys.argv) != 6:
+                raise RuntimeError("put requires: cluster_name share_mem_path key payload_base64")
+            _put(sys.argv[2], sys.argv[3], sys.argv[4], sys.argv[5])
             print("put ok")
             return
         if mode == "get":
-            if len(sys.argv) != 8:
-                raise RuntimeError("get requires: cluster_name shared_memory_path shared_file_path key expected_base64 timeout_seconds")
-            _get(sys.argv[2], sys.argv[3], sys.argv[4], sys.argv[5], sys.argv[6], float(sys.argv[7]))
+            if len(sys.argv) != 7:
+                raise RuntimeError("get requires: cluster_name share_mem_path key expected_base64 timeout_seconds")
+            _get(sys.argv[2], sys.argv[3], sys.argv[4], sys.argv[5], float(sys.argv[6]))
             print("get ok")
             return
         raise RuntimeError(f"unknown mode: {mode}")
@@ -64,14 +64,13 @@ def main() -> None:
 
     def _wait_store(
         cluster_name: str,
-        shared_memory_path: str,
-        shared_file_path: str,
+        share_mem_path: str,
         timeout_seconds: float,
     ) -> None:
         deadline = time.time() + timeout_seconds
         last_error = ""
         while time.time() < deadline:
-            result = new_store(_new_config(cluster_name, shared_memory_path, shared_file_path))
+            result = new_store(_new_config(cluster_name, share_mem_path))
             if result.is_ok():
                 store = result.unwrap()
                 _close_store(store)
@@ -83,13 +82,12 @@ def _wait_store(
 
     def _put(
         cluster_name: str,
-        shared_memory_path: str,
-        shared_file_path: str,
+        share_mem_path: str,
         key: str,
         payload_base64: str,
     ) -> None:
         payload = base64.b64decode(payload_base64.encode("ascii"))
-        store = _open_store(cluster_name, shared_memory_path, shared_file_path)
+        store = _open_store(cluster_name, share_mem_path)
         try:
             put_result = store.put(key, {"payload": payload})
             if not put_result.is_ok():
@@ -104,15 +102,14 @@ def _put(
 
     def _get(
         cluster_name: str,
-        shared_memory_path: str,
-        shared_file_path: str,
+        share_mem_path: str,
         key: str,
         expected_base64: str,
         timeout_seconds: float,
     ) -> None:
         expected = base64.b64decode(expected_base64.encode("ascii"))
         deadline = time.time() + timeout_seconds
-        store = _open_store(cluster_name, shared_memory_path, shared_file_path)
+        store = _open_store(cluster_name, share_mem_path)
         try:
             last_error = ""
             while time.time() < deadline:
@@ -139,8 +136,7 @@ def _get(
 
     def _new_config(
         cluster_name: str,
-        shared_memory_path: str,
-        shared_file_path: str,
+        share_mem_path: str,
     ) -> FluxonKvClientConfig:
         return FluxonKvClientConfig(
             {
@@ -148,15 +144,14 @@ def _new_config(
                 "contribute_to_cluster_pool_size": {"dram": 0, "vram": {}},
                 "fluxonkv_spec": {
                     "cluster_name": cluster_name,
-                    "shared_memory_path": shared_memory_path,
-                    "shared_file_path": shared_file_path,
+                    "share_mem_path": share_mem_path,
                 },
             }
         )
 
 
-    def _open_store(cluster_name: str, shared_memory_path: str, shared_file_path: str):
-        result = new_store(_new_config(cluster_name, shared_memory_path, shared_file_path))
+    def _open_store(cluster_name: str, share_mem_path: str):
+        result = new_store(_new_config(cluster_name, share_mem_path))
         if not result.is_ok():
             raise RuntimeError(f"new_store failed: {result.unwrap_error()}")
         return result.unwrap()
@@ -306,8 +301,7 @@ def _relay_wait_for_store(
     container_name: str,
     helper_path: str,
     cluster_name: str,
-    shared_memory_path: str,
-    shared_file_path: str,
+    share_mem_path: str,
 ) -> None:
     _relay_run(
         [
@@ -318,8 +312,7 @@ def _relay_wait_for_store(
             helper_path,
             "wait-store",
             cluster_name,
-            shared_memory_path,
-            shared_file_path,
+            share_mem_path,
             str(RELAY_DOCKER_WAIT_TIMEOUT_SECONDS),
         ],
         timeout_seconds=RELAY_DOCKER_WAIT_TIMEOUT_SECONDS + 30,
@@ -442,10 +435,6 @@ def test_relay_docker_connectivity() -> int:
             owner_name: f"{container_runtime_root}/shm/{owner_name}"
             for owner_name in ("owner1", "owner2", "owner3", "owner4")
         }
-        owner_shared_file_paths = {
-            owner_name: f"{container_runtime_root}/sharefile/{owner_name}"
-            for owner_name in ("owner1", "owner2", "owner3", "owner4")
-        }
         owner_large_root_paths = {
             owner_name: f"{container_runtime_root}/large/{owner_name}"
             for owner_name in ("owner1", "owner2", "owner3", "owner4")
@@ -475,10 +464,6 @@ def test_relay_docker_connectivity() -> int:
                 "__OWNER2_SHM__": owner_shm_paths["owner2"],
                 "__OWNER3_SHM__": owner_shm_paths["owner3"],
                 "__OWNER4_SHM__": owner_shm_paths["owner4"],
-                "__OWNER1_SHARED_FILE__": owner_shared_file_paths["owner1"],
-                "__OWNER2_SHARED_FILE__": owner_shared_file_paths["owner2"],
-                "__OWNER3_SHARED_FILE__": owner_shared_file_paths["owner3"],
-                "__OWNER4_SHARED_FILE__": owner_shared_file_paths["owner4"],
                 "__OWNER1_LARGE_ROOT__": owner_large_root_paths["owner1"],
                 "__OWNER2_LARGE_ROOT__": owner_large_root_paths["owner2"],
                 "__OWNER3_LARGE_ROOT__": owner_large_root_paths["owner3"],
@@ -522,15 +507,13 @@ def test_relay_docker_connectivity() -> int:
             container_name=container_names["owner1"],
             helper_path=helper_container_path,
             cluster_name=cluster_name,
-            shared_memory_path=owner_shm_paths["owner1"],
-            shared_file_path=owner_shared_file_paths["owner1"],
+            share_mem_path=owner_shm_paths["owner1"],
         )
         _relay_wait_for_store(
             container_name=container_names["owner4"],
             helper_path=helper_container_path,
             cluster_name=cluster_name,
-            shared_memory_path=owner_shm_paths["owner4"],
-            shared_file_path=owner_shared_file_paths["owner4"],
+            share_mem_path=owner_shm_paths["owner4"],
         )
 
         key = f"/relay_docker/{run_suffix}/payload"
@@ -546,7 +529,6 @@ def test_relay_docker_connectivity() -> int:
                 "get",
                 cluster_name,
                 owner_shm_paths["owner4"],
-                owner_shared_file_paths["owner4"],
                 key,
                 payload_base64,
                 str(RELAY_DOCKER_GET_TIMEOUT_SECONDS),
@@ -566,7 +548,6 @@ def test_relay_docker_connectivity() -> int:
                 "put",
                 cluster_name,
                 owner_shm_paths["owner1"],
-                owner_shared_file_paths["owner1"],
                 key,
                 payload_base64,
             ],
diff --git a/fluxon_py/tests/test_config.py b/fluxon_py/tests/test_config.py
index dc1e6dc..6de5180 100644
--- a/fluxon_py/tests/test_config.py
+++ b/fluxon_py/tests/test_config.py
@@ -152,8 +152,7 @@ def _owner_fluxonkv_base_config(
     *,
     instance_key: str = "test_instance",
     cluster_name: str = "test_cluster",
-    shared_memory_path: str = "/tmp/kvcache_shared_memory/test",
-    shared_file_path: str = "/tmp/kvcache_shared_files/test",
+    share_mem_path: str = "/tmp/kvcache_shared_memory/test",
     sub_cluster: str = "rack-a",
     tag: str = "test",
 ) -> dict:
@@ -163,8 +162,7 @@ def _owner_fluxonkv_base_config(
         "fluxonkv_spec": {
             "etcd_addresses": ["localhost:2379"],
             "cluster_name": cluster_name,
-            "shared_memory_path": shared_memory_path,
-            "shared_file_path": shared_file_path,
+            "share_mem_path": share_mem_path,
             "sub_cluster": sub_cluster,
             "large_file_paths": _owner_large_file_paths(tag),
         },
@@ -320,8 +318,7 @@ def test_fluxonkv_external_forbids_large_file_paths():
             "contribute_to_cluster_pool_size": {"dram": 0, "vram": {}},
             "fluxonkv_spec": {
                 "cluster_name": "test_cluster",
-                "shared_memory_path": "/tmp/kvcache_shared_memory/test",
-                "shared_file_path": "/tmp/kvcache_shared_files/test",
+                "share_mem_path": "/tmp/kvcache_shared_memory/test",
                 "large_file_paths": _owner_large_file_paths("external_forbidden"),
             },
         }
@@ -364,9 +361,9 @@ def test_fluxon_client_config_yaml_shape():
         config = FluxonKvClientConfig(copy.deepcopy(base))
         yaml_text = config.to_fluxon_kv_client_config_yaml_str()
         loaded = yaml.safe_load(yaml_text)
-        assert loaded["fluxonkv_spec"]["shared_memory_path"] == base["fluxonkv_spec"]["shared_memory_path"]
+        assert loaded["fluxonkv_spec"]["share_mem_path"] == base["fluxonkv_spec"]["share_mem_path"]
         assert loaded["fluxonkv_spec"]["sub_cluster"] == base["fluxonkv_spec"]["sub_cluster"]
-        assert "shared_memory_path" not in loaded
+        assert "share_mem_path" not in loaded
         assert "rdma_device_names" not in loaded
         assert "transfer_engine" not in loaded["fluxonkv_spec"]
         print("✅ PASS: test_fluxon_client_config_yaml_shape")
@@ -384,8 +381,7 @@ def test_fluxonkv_protocol_field():
             },
             "fluxonkv_spec": {
                 "cluster_name": "test_cluster",
-                "shared_memory_path": "/tmp/kvcache_shared_memory/test_side_worker",
-                "shared_file_path": "/tmp/kvcache_shared_files/test_side_worker",
+                "share_mem_path": "/tmp/kvcache_shared_memory/test_side_worker",
             },
             "test_spec_config": {
                 "enable_side_transfer": True,
diff --git a/fluxon_py/tests/test_config.yaml b/fluxon_py/tests/test_config.yaml
index d47332c..8520ec2 100644
--- a/fluxon_py/tests/test_config.yaml
+++ b/fluxon_py/tests/test_config.yaml
@@ -1,5 +1,4 @@
 kv_svc_type: fluxon
 etcd_address: 127.0.0.1:2379
 cluster_name: fluxon-example-cluster
-shared_memory_path: /tmp/fluxon-example-cluster/shm
-shared_file_path: /tmp/fluxon-example-cluster/share
+share_mem_path: /tmp/fluxon-example-cluster/shm
diff --git a/fluxon_py/tests/test_fluxon_fs_patcher.py b/fluxon_py/tests/test_fluxon_fs_patcher.py
index 943c5d3..3b02a08 100644
--- a/fluxon_py/tests/test_fluxon_fs_patcher.py
+++ b/fluxon_py/tests/test_fluxon_fs_patcher.py
@@ -23,7 +23,6 @@ def main() -> None:
 from fluxon_py.api_error import KeyNotFoundError  # noqa: E402
 from fluxon_py.tests.test_lib import (  # noqa: E402
     load_test_fluxon_cluster_name,
-    load_test_fluxon_share_file_path,
     load_test_fluxon_share_mem_path,
 )
 
@@ -36,24 +35,22 @@ def _new_test_dir(tag: str) -> Path:
     return p
 
 
-def _load_ci_cluster() -> tuple[str, str, str]:
+def _load_ci_cluster() -> tuple[str, str]:
     return (
         load_test_fluxon_cluster_name(),
         load_test_fluxon_share_mem_path(),
-        load_test_fluxon_share_file_path(),
     )
 
 
 def _new_fluxon_external_store(*, instance_key: str):
-    cluster_name, share_mem_path, share_file_path = _load_ci_cluster()
+    cluster_name, share_mem_path = _load_ci_cluster()
     cfg = FluxonKvClientConfig(
         {
             "instance_key": instance_key,
             "contribute_to_cluster_pool_size": {"dram": 0, "vram": {}},
             "fluxonkv_spec": {
                 "cluster_name": cluster_name,
-                "shared_memory_path": share_mem_path,
-                "shared_file_path": share_file_path,
+                "share_mem_path": share_mem_path,
             },
         }
     )
diff --git a/fluxon_py/tests/test_fluxon_fs_remote_mount.py b/fluxon_py/tests/test_fluxon_fs_remote_mount.py
index a2b9ed9..9283073 100644
--- a/fluxon_py/tests/test_fluxon_fs_remote_mount.py
+++ b/fluxon_py/tests/test_fluxon_fs_remote_mount.py
@@ -19,7 +19,6 @@ def main() -> None:
 from fluxon_py.kvclient import new_store  # noqa: E402
 from fluxon_py.tests.test_lib import (  # noqa: E402
     load_test_fluxon_cluster_name,
-    load_test_fluxon_share_file_path,
     load_test_fluxon_share_mem_path,
 )
 
@@ -32,11 +31,10 @@ def _new_test_dir(tag: str) -> Path:
     return p
 
 
-def _load_ci_cluster() -> tuple[str, str, str]:
+def _load_ci_cluster() -> tuple[str, str]:
     return (
         load_test_fluxon_cluster_name(),
         load_test_fluxon_share_mem_path(),
-        load_test_fluxon_share_file_path(),
     )
 
 
@@ -45,7 +43,6 @@ def _new_fluxon_external_store_with_cluster(
     instance_key: str,
     cluster_name: str,
     share_mem_path: str,
-    share_file_path: str,
 ):
     cfg = FluxonKvClientConfig(
         {
@@ -53,8 +50,7 @@ def _new_fluxon_external_store_with_cluster(
             "contribute_to_cluster_pool_size": {"dram": 0, "vram": {}},
             "fluxonkv_spec": {
                 "cluster_name": cluster_name,
-                "shared_memory_path": share_mem_path,
-                "shared_file_path": share_file_path,
+                "share_mem_path": share_mem_path,
             },
         }
     )
@@ -79,7 +75,7 @@ def setUpClass(cls) -> None:
         cls._remote_root = (cls._tmp / "remote_root").resolve()
         cls._remote_root.mkdir(parents=True, exist_ok=False)
 
-        cls._cluster_name, cls._share_mem_path, cls._share_file_path = _load_ci_cluster()
+        cls._cluster_name, cls._share_mem_path = _load_ci_cluster()
 
         # Keep the mountpoint under a writable temp directory to avoid relying on root paths.
         # The engine will create the mountpoint if it does not exist.
@@ -91,13 +87,11 @@ def setUpClass(cls) -> None:
             instance_key=f"test_fluxon_fs_agent_{os.getpid()}",
             cluster_name=cls._cluster_name,
             share_mem_path=cls._share_mem_path,
-            share_file_path=cls._share_file_path,
         )
         cls._client_store = _new_fluxon_external_store_with_cluster(
             instance_key=f"test_fluxon_fs_client_{os.getpid()}",
             cluster_name=cls._cluster_name,
             share_mem_path=cls._share_mem_path,
-            share_file_path=cls._share_file_path,
         )
 
         agent_key_res = cls._agent_store.instance_key()
diff --git a/fluxon_py/tests/test_lib.py b/fluxon_py/tests/test_lib.py
index a246e24..9be7003 100644
--- a/fluxon_py/tests/test_lib.py
+++ b/fluxon_py/tests/test_lib.py
@@ -35,8 +35,7 @@
     load_test_config_mapping,
     load_test_etcd_address_from_test_config,
     load_test_fluxon_cluster_name_from_test_config,
-    load_test_fluxon_shared_file_path_from_test_config,
-    load_test_fluxon_shared_memory_path_from_test_config,
+    load_test_fluxon_share_mem_path_from_test_config,
     load_test_kv_svc_type_from_test_config,
 )
 
@@ -85,12 +84,7 @@ def load_test_fluxon_cluster_name(*, config_path: Optional[Path] = None) -> str:
 
 def load_test_fluxon_share_mem_path(*, config_path: Optional[Path] = None) -> str:
     """Load required Fluxon shared-memory path from test_config.yaml."""
-    return load_test_fluxon_shared_memory_path_from_test_config(config_path=config_path)
-
-
-def load_test_fluxon_share_file_path(*, config_path: Optional[Path] = None) -> str:
-    """Load required Fluxon shared-file path from test_config.yaml."""
-    return load_test_fluxon_shared_file_path_from_test_config(config_path=config_path)
+    return load_test_fluxon_share_mem_path_from_test_config(config_path=config_path)
 
 
 def load_test_chan_config(*, config_path: Optional[Path] = None) -> Dict[str, int]:
@@ -283,12 +277,10 @@ def new_shared_stores(
             # Strictly require fluxon-specific fields from the shared test/example deployconf.
             cluster_name = load_test_fluxon_cluster_name()
             share_mem = load_test_fluxon_share_mem_path()
-            share_file = load_test_fluxon_share_file_path()
             spec = {
                 "fluxonkv_spec": {
                     "cluster_name": cluster_name,
-                    "shared_memory_path": share_mem,
-                    "shared_file_path": share_file,
+                    "share_mem_path": share_mem,
                 }
             }
 
diff --git a/fluxon_py/tests/test_mq/test_example_ctrl_c_exit.py b/fluxon_py/tests/test_mq/test_example_ctrl_c_exit.py
index 6257f4f..c1b3193 100644
--- a/fluxon_py/tests/test_mq/test_example_ctrl_c_exit.py
+++ b/fluxon_py/tests/test_mq/test_example_ctrl_c_exit.py
@@ -97,10 +97,9 @@ def _build_store_config(*, config_path: Path, workdir: Path) -> FluxonKvClientCo
     producer_cfg = dict(loaded["mpmc_demo"]["producer"])
     kvexternal_cfg["instance_key"] = str(producer_cfg["instance_key"])
     spec = dict(kvexternal_cfg["fluxonkv_spec"])
-    for field_name in ("shared_memory_path", "shared_file_path"):
-        raw_path = spec.get(field_name)
-        if isinstance(raw_path, str) and raw_path and not Path(raw_path).is_absolute():
-            spec[field_name] = str((workdir / raw_path).resolve())
+    raw_path = spec.get("share_mem_path")
+    if isinstance(raw_path, str) and raw_path and not Path(raw_path).is_absolute():
+        spec["share_mem_path"] = str((workdir / raw_path).resolve())
     kvexternal_cfg["fluxonkv_spec"] = spec
     return FluxonKvClientConfig(kvexternal_cfg)
 
@@ -223,10 +222,9 @@ def _build_store_config(*, config_path: Path, workdir: Path) -> FluxonKvClientCo
     consumer_cfg = dict(loaded["mpmc_demo"]["consumer"])
     kvexternal_cfg["instance_key"] = str(consumer_cfg["instance_key"])
     spec = dict(kvexternal_cfg["fluxonkv_spec"])
-    for field_name in ("shared_memory_path", "shared_file_path"):
-        raw_path = spec.get(field_name)
-        if isinstance(raw_path, str) and raw_path and not Path(raw_path).is_absolute():
-            spec[field_name] = str((workdir / raw_path).resolve())
+    raw_path = spec.get("share_mem_path")
+    if isinstance(raw_path, str) and raw_path and not Path(raw_path).is_absolute():
+        spec["share_mem_path"] = str((workdir / raw_path).resolve())
     kvexternal_cfg["fluxonkv_spec"] = spec
     return FluxonKvClientConfig(kvexternal_cfg)
 
@@ -462,7 +460,7 @@ def _build_example_config(
     unique_suffix: str,
     cluster_name: str,
     etcd_endpoint: str,
-    shared_memory_path: str,
+    share_mem_path: str,
     greptime_http_port: int,
     master_port: int,
 ) -> dict[str, Any]:
@@ -474,7 +472,7 @@ def _build_example_config(
             "cluster_name": cluster_name,
             "instance_key": f"example_ctrlc_master_{unique_suffix}",
             "port": master_port,
-            "log_dir": str((Path(shared_memory_path).parent / "log" / "master").resolve()),
+            "log_dir": str((Path(share_mem_path).parent / "log" / "master").resolve()),
             "monitoring": _monitoring_block(greptime_http_port=greptime_http_port),
         },
         "kvclient": {
@@ -483,10 +481,9 @@ def _build_example_config(
             "fluxonkv_spec": {
                 "etcd_addresses": [etcd_endpoint],
                 "cluster_name": cluster_name,
-                "shared_memory_path": shared_memory_path,
-                "shared_file_path": str((Path(shared_memory_path).parent / "sharefile").resolve()),
+                "share_mem_path": share_mem_path,
                 "sub_cluster": "demo",
-                "large_file_paths": [str((Path(shared_memory_path).parent / "large" / "owner").resolve())],
+                "large_file_paths": [str((Path(share_mem_path).parent / "large" / "owner").resolve())],
             },
         },
         "kvexternal": {
@@ -494,8 +491,7 @@ def _build_example_config(
             "contribute_to_cluster_pool_size": {"dram": 0, "vram": {}},
             "fluxonkv_spec": {
                 "cluster_name": cluster_name,
-                "shared_memory_path": shared_memory_path,
-                "shared_file_path": str((Path(shared_memory_path).parent / "sharefile").resolve()),
+                "share_mem_path": share_mem_path,
             },
         },
         "mpmc_demo": {
@@ -525,8 +521,8 @@ def _write_runtime_subconfig(*, path: Path, config: dict[str, Any], key: str) ->
     )
 
 
-def _kvclient_shared_json_target(*, shared_file_path: Path, cluster_name: str) -> Path:
-    return shared_file_path / cluster_name / "shared.json"
+def _kvclient_shared_json_target(*, share_mem_path: Path, cluster_name: str) -> Path:
+    return share_mem_path / cluster_name / "shared.json"
 
 
 def _start_local_stack(*, temp_root: Path, config_path: Path) -> list[tuple[subprocess.Popen[str], Path]]:
@@ -591,13 +587,13 @@ def _start_local_stack(*, temp_root: Path, config_path: Path) -> list[tuple[subp
 
     unique_suffix = uuid.uuid4().hex[:12]
     cluster_name = f"example_ctrlc_cluster_{unique_suffix}"
-    shared_memory_path = str((temp_root / "sharemem").resolve())
+    share_mem_path = str((temp_root / "sharemem").resolve())
     master_port = _pick_free_port()
     config = _build_example_config(
         unique_suffix=unique_suffix,
         cluster_name=cluster_name,
         etcd_endpoint=etcd_endpoint,
-        shared_memory_path=shared_memory_path,
+        share_mem_path=share_mem_path,
         greptime_http_port=greptime_http_port,
         master_port=master_port,
     )
@@ -638,7 +634,7 @@ def _start_local_stack(*, temp_root: Path, config_path: Path) -> list[tuple[subp
         env=env,
     )
     kvclient_shared_json = _kvclient_shared_json_target(
-        shared_file_path=Path(str(config["kvclient"]["fluxonkv_spec"]["shared_file_path"])).resolve(),
+        share_mem_path=Path(str(config["kvclient"]["fluxonkv_spec"]["share_mem_path"])).resolve(),
         cluster_name=cluster_name,
     )
     _wait_for_path(
diff --git a/fluxon_rs/fluxon_kv/examples/kvcli_example_client_config1.yaml b/fluxon_rs/fluxon_kv/examples/kvcli_example_client_config1.yaml
index 7781f8b..8119a14 100644
--- a/fluxon_rs/fluxon_kv/examples/kvcli_example_client_config1.yaml
+++ b/fluxon_rs/fluxon_kv/examples/kvcli_example_client_config1.yaml
@@ -9,7 +9,7 @@ fluxonkv_spec:
   etcd_addresses:
   - "127.0.0.1:2379"
   cluster_name: "cluster_001"
-  shared_memory_path: "/tmp/kvcache_shared_memory/client_node_001"
+  share_mem_path: "/tmp/kvcache_shared_memory/client_node_001"
 
 # Optional: Additional configurations can be added here
 # custom_field: "value"
diff --git a/fluxon_rs/fluxon_kv/examples/kvcli_example_client_config2.yaml b/fluxon_rs/fluxon_kv/examples/kvcli_example_client_config2.yaml
index e2e9464..9d72fe7 100644
--- a/fluxon_rs/fluxon_kv/examples/kvcli_example_client_config2.yaml
+++ b/fluxon_rs/fluxon_kv/examples/kvcli_example_client_config2.yaml
@@ -9,7 +9,7 @@ fluxonkv_spec:
   etcd_addresses:
   - "127.0.0.1:2379"
   cluster_name: "cluster_001"
-  shared_memory_path: "/tmp/kvcache_shared_memory/client_node_002"
+  share_mem_path: "/tmp/kvcache_shared_memory/client_node_002"
 
 # Optional: Additional configurations can be added here
 # custom_field: "value"
diff --git a/fluxon_rs/fluxon_kv/src/client_seg_pool/mod.rs b/fluxon_rs/fluxon_kv/src/client_seg_pool/mod.rs
index c31ef73..1aa6954 100644
--- a/fluxon_rs/fluxon_kv/src/client_seg_pool/mod.rs
+++ b/fluxon_rs/fluxon_kv/src/client_seg_pool/mod.rs
@@ -44,8 +44,7 @@ define_module!(
 #[derive(Clone, Debug)]
 pub struct ClientSegPoolNewArg {
     pub contribute_size: ContributeToClusterPoolSize,
-    pub shared_memory_path: String,
-    pub shared_file_path: String,
+    pub share_mem_path: String,
     pub large_file_paths: crate::config::LargeFilePaths,
     pub cluster_name: String,
     pub etcd_addresses: Vec<String>,
@@ -63,8 +62,7 @@ pub struct SharedJsonMeta {
     pub sub_cluster: Option<String>,
     pub cluster_name: String,
     pub etcd_addresses: Vec<String>,
-    pub shared_memory_path: String,
-    pub shared_file_path: String,
+    pub share_mem_path: String,
     pub large_file_paths: crate::config::LargeFilePaths,
     pub protocol_version: String,
     pub write_ts: Option<i64>,
@@ -201,10 +199,8 @@ impl Deref for ClientCpuMemReadGuard {
 pub struct ClientSegPoolInner {
     cpu_allocated_mem: std::sync::Arc<ARwLock<Option<ClientMappedMem>>>,
     view: std::sync::OnceLock<ClientSegPoolView>,
-    /// Directory path for shared-memory backed files (mmap.file).
-    shared_memory_path: String,
-    /// Directory path for regular files (shared.json, side-transfer metadata).
-    shared_file_path: String,
+    /// Directory path for the local shared bundle (mmap.file, shared.json, peer metadata).
+    share_mem_path: String,
     /// Ordered large-file roots; concrete subdirectories are derived by fixed relative layout.
     large_file_paths: crate::config::LargeFilePaths,
     side_transfer_worker: bool,
@@ -237,15 +233,15 @@ impl ClientSegPoolInner {
 }
 
 impl ClientSegPool {
-    pub fn side_transfer_peers_dir(shared_file_path: &str) -> std::path::PathBuf {
-        std::path::Path::new(shared_file_path).join(SIDE_TRANSFER_PEERS_DIRNAME)
+    pub fn side_transfer_peers_dir(share_mem_path: &str) -> std::path::PathBuf {
+        std::path::Path::new(share_mem_path).join(SIDE_TRANSFER_PEERS_DIRNAME)
     }
 
     pub fn side_transfer_peer_file_path(
-        shared_file_path: &str,
+        share_mem_path: &str,
         side_id: &str,
     ) -> std::path::PathBuf {
-        Self::side_transfer_peers_dir(shared_file_path).join(format!("{side_id}.json"))
+        Self::side_transfer_peers_dir(share_mem_path).join(format!("{side_id}.json"))
     }
 
     pub fn attach_view(&self, view: ClientSegPoolView) {
@@ -259,13 +255,12 @@ impl ClientSegPool {
 
     pub async fn construct(arg: ClientSegPoolNewArg) -> Result<Self, KvError> {
         tracing::info!(
-            "Constructing ClientSegPool in Client mode with shared_memory_path: {}",
-            arg.shared_memory_path
+            "Constructing ClientSegPool in Client mode with share_mem_path: {}",
+            arg.share_mem_path
         );
 
         let contribute_size = arg.contribute_size;
-        let shared_memory_path = arg.shared_memory_path;
-        let shared_file_path = arg.shared_file_path;
+        let share_mem_path = arg.share_mem_path;
         let large_file_paths = arg.large_file_paths;
         let cluster_name = arg.cluster_name;
         let etcd_addresses = arg.etcd_addresses;
@@ -283,7 +278,7 @@ impl ClientSegPool {
         if let Some(existing_meta) = attach_existing_meta {
             tracing::info!(
                 "Attaching existing shared memory for side-transfer worker: path={}, len={}",
-                shared_memory_path,
+                share_mem_path,
                 existing_meta.segment_len
             );
 
@@ -293,7 +288,7 @@ impl ClientSegPool {
             use std::ptr;
 
             let map_len = existing_meta.segment_len as usize;
-            let mmap_file_path = Path::new(&shared_memory_path).join("mmap.file");
+            let mmap_file_path = Path::new(&share_mem_path).join("mmap.file");
             let file = OpenOptions::new()
                 .read(true)
                 .write(true)
@@ -359,8 +354,7 @@ impl ClientSegPool {
                     layout_validated: AtomicBool::new(false),
                 }))),
                 view: std::sync::OnceLock::new(),
-                shared_memory_path: shared_memory_path.clone(),
-                shared_file_path: shared_file_path.clone(),
+                share_mem_path: share_mem_path.clone(),
                 large_file_paths: large_file_paths.clone(),
                 side_transfer_worker,
                 attach_owner_ref,
@@ -376,8 +370,7 @@ impl ClientSegPool {
             let inner = ClientSegPoolInner {
                 cpu_allocated_mem: std::sync::Arc::new(ARwLock::new(None)),
                 view: std::sync::OnceLock::new(),
-                shared_memory_path: shared_memory_path.clone(),
-                shared_file_path: shared_file_path.clone(),
+                share_mem_path: share_mem_path.clone(),
                 large_file_paths: large_file_paths.clone(),
                 side_transfer_worker,
                 attach_owner_ref,
@@ -401,29 +394,20 @@ impl ClientSegPool {
 
         let map_len = contribute_size.dram as usize;
 
-        if shared_memory_path.is_empty() {
+        if share_mem_path.is_empty() {
             return Err(KvError::SharedMem(
                 crate::rpcresp_kvresult_convert::msg_and_error::SharedMemError::MappingFailed {
                     path: String::new(),
                     len: map_len as u64,
-                    detail: "shared_memory_path is empty; explicit configuration required"
-                        .to_string(),
-                },
-            ));
-        }
-        if shared_file_path.is_empty() {
-            return Err(KvError::SharedMem(
-                crate::rpcresp_kvresult_convert::msg_and_error::SharedMemError::MetaDataLoadError {
-                    path: String::new(),
-                    detail: "shared_file_path is empty; explicit configuration required"
+                    detail: "share_mem_path is empty; explicit configuration required"
                         .to_string(),
                 },
             ));
         }
 
-        let base_path = &shared_memory_path;
+        let base_path = &share_mem_path;
         tracing::info!(
-            "Using shared_memory_path: {} for memory-mapped file",
+            "Using share_mem_path: {} for memory-mapped file",
             base_path
         );
         std::fs::create_dir_all(base_path).map_err(|e| {
@@ -540,8 +524,7 @@ impl ClientSegPool {
                 layout_validated: AtomicBool::new(false),
             }))),
             view: std::sync::OnceLock::new(),
-            shared_memory_path: base_path.to_string(),
-            shared_file_path: shared_file_path.clone(),
+            share_mem_path: base_path.to_string(),
             large_file_paths,
             side_transfer_worker,
             attach_owner_ref,
@@ -557,8 +540,8 @@ impl ClientSegPool {
         &self.0
     }
 
-    pub fn shared_file_path(&self) -> &str {
-        &self.inner().shared_file_path
+    pub fn share_mem_path(&self) -> &str {
+        &self.inner().share_mem_path
     }
 
     pub fn large_file_paths(&self) -> &crate::config::LargeFilePaths {
@@ -909,7 +892,7 @@ impl ClientSegPool {
                 },
             )
         })?;
-        let peers_dir = Self::side_transfer_peers_dir(&inner.shared_file_path);
+        let peers_dir = Self::side_transfer_peers_dir(&inner.share_mem_path);
         std::fs::create_dir_all(&peers_dir).map_err(|e| {
             KvError::SharedMem(
                 crate::rpcresp_kvresult_convert::msg_and_error::SharedMemError::MetaDataLoadError {
@@ -919,7 +902,7 @@ impl ClientSegPool {
             )
         })?;
 
-        let peer_path = Self::side_transfer_peer_file_path(&inner.shared_file_path, &self_info.id);
+        let peer_path = Self::side_transfer_peer_file_path(&inner.share_mem_path, &self_info.id);
         let tmp_path = peer_path.with_file_name(format!(
             "{}.tmp.{}.{}",
             self_info.id,
@@ -962,7 +945,7 @@ impl ClientSegPool {
             return Ok(());
         }
         let self_id = inner.view().cluster_manager().get_self_info().id;
-        let peer_path = Self::side_transfer_peer_file_path(&inner.shared_file_path, &self_id);
+        let peer_path = Self::side_transfer_peer_file_path(&inner.share_mem_path, &self_id);
         match std::fs::remove_file(&peer_path) {
             Ok(()) => Ok(()),
             Err(e) if e.kind() == std::io::ErrorKind::NotFound => Ok(()),
@@ -1123,35 +1106,24 @@ impl ClientSegPool {
         self.wait_required_transfer_rpc_fast_path_ready().await?;
 
         use std::path::Path;
-        let shared_json_path = Path::new(&inner.shared_file_path).join("shared.json");
+        let shared_json_path = Path::new(&inner.share_mem_path).join("shared.json");
         if let Some(parent) = shared_json_path.parent() {
             std::fs::create_dir_all(parent).map_err(|e| {
                 KvError::SharedMem(
                     crate::rpcresp_kvresult_convert::msg_and_error::SharedMemError::MetaDataLoadError {
                         path: parent.to_string_lossy().to_string(),
-                        detail: format!("Failed to create shared_file_path: {}", e),
+                        detail: format!("Failed to create share_mem_path: {}", e),
                     },
                 )
             })?;
         }
 
-        let shared_memory_canonical = std::fs::canonicalize(&inner.shared_memory_path)
-            .map_err(|e| {
-                KvError::SharedMem(
-                    crate::rpcresp_kvresult_convert::msg_and_error::SharedMemError::MetaDataLoadError {
-                        path: inner.shared_memory_path.clone(),
-                        detail: format!("Failed to canonicalize shared_memory_path: {}", e),
-                    },
-                )
-            })?
-            .to_string_lossy()
-            .into_owned();
-        let shared_file_canonical = std::fs::canonicalize(&inner.shared_file_path)
+        let share_mem_canonical = std::fs::canonicalize(&inner.share_mem_path)
             .map_err(|e| {
                 KvError::SharedMem(
                     crate::rpcresp_kvresult_convert::msg_and_error::SharedMemError::MetaDataLoadError {
-                        path: inner.shared_file_path.clone(),
-                        detail: format!("Failed to canonicalize shared_file_path: {}", e),
+                        path: inner.share_mem_path.clone(),
+                        detail: format!("Failed to canonicalize share_mem_path: {}", e),
                     },
                 )
             })?
@@ -1171,8 +1143,7 @@ impl ClientSegPool {
 
             cluster_name: inner.cluster_name.clone(),
             etcd_addresses: inner.etcd_addresses.clone(),
-            shared_memory_path: shared_memory_canonical,
-            shared_file_path: shared_file_canonical,
+            share_mem_path: share_mem_canonical,
             large_file_paths: inner.large_file_paths.clone(),
 
             protocol_version,
@@ -1239,8 +1210,8 @@ impl ClientSegPool {
             ));
         }
 
-        let shared_json_path = std::path::Path::new(&inner.shared_file_path).join("shared.json");
-        let mmap_file_path = std::path::Path::new(&inner.shared_memory_path).join("mmap.file");
+        let shared_json_path = std::path::Path::new(&inner.share_mem_path).join("shared.json");
+        let mmap_file_path = std::path::Path::new(&inner.share_mem_path).join("mmap.file");
 
         if !mmap_file_path.exists() {
             return Err(KvError::SharedMem(
@@ -1356,7 +1327,7 @@ async fn handle_resolve_side_transfer_lane_request(
 ) -> MsgPack<ResolveSideTransferLaneResp> {
     let self_info = view.cluster_manager().get_self_info();
     let peers_dir =
-        ClientSegPool::side_transfer_peers_dir(&view.client_seg_pool().inner().shared_file_path);
+        ClientSegPool::side_transfer_peers_dir(&view.client_seg_pool().inner().share_mem_path);
     tracing::info!(
         "handle_resolve_side_transfer_lane_request: owner={} lane_idx={} peers_dir={}",
         self_info.id,
diff --git a/fluxon_rs/fluxon_kv/src/config.rs b/fluxon_rs/fluxon_kv/src/config.rs
index fad6082..f9c7691 100644
--- a/fluxon_rs/fluxon_kv/src/config.rs
+++ b/fluxon_rs/fluxon_kv/src/config.rs
@@ -577,8 +577,7 @@ pub struct FluxonKvSpecYaml {
     #[serde(skip_serializing_if = "Option::is_none")]
     pub etcd_addresses: Option<YamlNullable<Vec<String>>>,
     pub cluster_name: String,
-    pub shared_memory_path: String,
-    pub shared_file_path: String,
+    pub share_mem_path: String,
     #[serde(skip_serializing_if = "Option::is_none")]
     pub large_file_paths: Option<LargeFilePathsYaml>,
     #[serde(skip_serializing_if = "Option::is_none")]
@@ -688,6 +687,11 @@ impl LargeFilePaths {
         self.resolve_preferred_root_subdir(&relative_dir, "kv logs")
     }
 
+    pub fn third_party_logs_dir(&self, cluster_name: &str) -> KvResult<PathBuf> {
+        let relative_dir = PathBuf::from(format!("{cluster_name}_cluster_third_party_logs"));
+        self.resolve_preferred_root_subdir(&relative_dir, "third-party logs")
+    }
+
     pub fn kv_profiles_dir(&self, cluster_name: &str) -> KvResult<PathBuf> {
         let relative_dir = PathBuf::from(format!("{cluster_name}_cluster_kv_profiles"));
         self.resolve_preferred_root_subdir(&relative_dir, "kv profiles")
@@ -729,8 +733,7 @@ pub struct ClientConfig {
     pub pprof_duration_seconds: Option<u64>,
     pub redis_compat_listen_addr: Option<std::net::SocketAddr>,
     pub fluxonkv_spec: FluxonKvSpec,
-    pub shared_memory_path: String, // Mandatory shared memory path
-    pub shared_file_path: String,   // Mandatory shared file path
+    pub share_mem_path: String, // Mandatory shared bundle path
     pub large_file_paths: LargeFilePaths, // Mandatory large-file roots for logs and caches
     pub test_spec_config: TestSpecConfig,
 }
@@ -1151,16 +1154,10 @@ impl ClientConfigYaml {
             }
         }
 
-        // Validate shared_memory_path (mandatory and non-empty)
-        if self.fluxonkv_spec.shared_memory_path.trim().is_empty() {
-            return Err(ConfigError::InvalidInstanceKey {
-                key: "shared_memory_path cannot be empty".to_string(),
-            }
-            .into_kverror());
-        }
-        if self.fluxonkv_spec.shared_file_path.trim().is_empty() {
+        // Validate share_mem_path (mandatory and non-empty)
+        if self.fluxonkv_spec.share_mem_path.trim().is_empty() {
             return Err(ConfigError::InvalidInstanceKey {
-                key: "shared_file_path cannot be empty".to_string(),
+                key: "share_mem_path cannot be empty".to_string(),
             }
             .into_kverror());
         }
@@ -1183,12 +1180,8 @@ impl ClientConfigYaml {
             }
         };
 
-        let shared_memory_path = cluster_scoped_shared_path(
-            &self.fluxonkv_spec.shared_memory_path,
-            &fluxonkv_spec.cluster_name,
-        )?;
-        let shared_file_path = cluster_scoped_shared_path(
-            &self.fluxonkv_spec.shared_file_path,
+        let share_mem_path = cluster_scoped_shared_path(
+            &self.fluxonkv_spec.share_mem_path,
             &fluxonkv_spec.cluster_name,
         )?;
         let redis_compat_listen_addr = match self.fluxonkv_spec.redis_compat.as_ref() {
@@ -1220,8 +1213,7 @@ impl ClientConfigYaml {
             pprof_duration_seconds,
             redis_compat_listen_addr,
             fluxonkv_spec,
-            shared_memory_path,
-            shared_file_path,
+            share_mem_path,
             large_file_paths,
             test_spec_config,
         })
@@ -1568,8 +1560,7 @@ contribute_to_cluster_pool_size:
 fluxonkv_spec:
   etcd_addresses: ["127.0.0.1:2379"]
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_owner
-  shared_file_path: /tmp/test_owner_files
+  share_mem_path: /tmp/test_owner
   large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
@@ -1588,11 +1579,7 @@ test_spec_config:
         assert!(verified.test_spec_config.enable_iceoryx_logs);
         assert!(verified.test_spec_config.iceoryx_external_busy_poll);
         assert!(!verified.test_spec_config.iceoryx_owner_client_busy_poll);
-        assert_eq!(verified.shared_memory_path, "/tmp/test_owner/test_cluster");
-        assert_eq!(
-            verified.shared_file_path,
-            "/tmp/test_owner_files/test_cluster"
-        );
+        assert_eq!(verified.share_mem_path, "/tmp/test_owner/test_cluster");
         assert_eq!(
             verified.test_spec_config.transport_mode,
             Some(TestSpecTransportMode::TransferOnly)
@@ -1615,8 +1602,7 @@ contribute_to_cluster_pool_size:
 fluxonkv_spec:
   etcd_addresses: ["127.0.0.1:2379"]
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_owner
-  shared_file_path: /tmp/test_owner_files
+  share_mem_path: /tmp/test_owner
   large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 "#,
@@ -1637,8 +1623,7 @@ fluxonkv_spec:
 instance_key: test_external
 fluxonkv_spec:
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_external
-  shared_file_path: /tmp/test_external_files
+  share_mem_path: /tmp/test_external
 "#,
         )
         .unwrap();
@@ -1655,8 +1640,7 @@ fluxonkv_spec:
 instance_key: test_external
 fluxonkv_spec:
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_external
-  shared_file_path: /tmp/test_external_files
+  share_mem_path: /tmp/test_external
   large_file_paths: [/tmp/test_external_large]
 "#,
         )
@@ -1686,6 +1670,17 @@ fluxonkv_spec:
             first_root.join("child").join("test_cluster_cluster_kv_logs")
         );
         assert!(logs_dir.exists());
+
+        let third_party_logs_dir = large_file_paths
+            .third_party_logs_dir("test_cluster")
+            .unwrap();
+        assert_eq!(
+            third_party_logs_dir,
+            first_root
+                .join("child")
+                .join("test_cluster_cluster_third_party_logs")
+        );
+        assert!(third_party_logs_dir.exists());
     }
 
     #[test]
@@ -1699,8 +1694,7 @@ contribute_to_cluster_pool_size:
 fluxonkv_spec:
   etcd_addresses: ["127.0.0.1:2379"]
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_owner
-  shared_file_path: /tmp/test_owner_files
+  share_mem_path: /tmp/test_owner
   large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
@@ -1753,8 +1747,7 @@ contribute_to_cluster_pool_size:
 fluxonkv_spec:
   etcd_addresses: ["127.0.0.1:2379"]
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_owner
-  shared_file_path: /tmp/test_owner_files
+  share_mem_path: /tmp/test_owner
   large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
@@ -1789,8 +1782,7 @@ contribute_to_cluster_pool_size:
 fluxonkv_spec:
   etcd_addresses: ["127.0.0.1:2379"]
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_owner
-  shared_file_path: /tmp/test_owner_files
+  share_mem_path: /tmp/test_owner
   large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
@@ -1821,8 +1813,7 @@ contribute_to_cluster_pool_size:
 fluxonkv_spec:
   etcd_addresses: ["127.0.0.1:2379"]
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_owner
-  shared_file_path: /tmp/test_owner_files
+  share_mem_path: /tmp/test_owner
   large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
@@ -1847,8 +1838,7 @@ contribute_to_cluster_pool_size:
 fluxonkv_spec:
   etcd_addresses: ["127.0.0.1:2379"]
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_owner
-  shared_file_path: /tmp/test_owner_files
+  share_mem_path: /tmp/test_owner
   large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
@@ -1874,8 +1864,7 @@ contribute_to_cluster_pool_size:
 fluxonkv_spec:
   etcd_addresses: ["127.0.0.1:2379"]
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_owner
-  shared_file_path: /tmp/test_owner_files
+  share_mem_path: /tmp/test_owner
   large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
@@ -1906,8 +1895,7 @@ contribute_to_cluster_pool_size:
 fluxonkv_spec:
   etcd_addresses: ["127.0.0.1:2379"]
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_owner
-  shared_file_path: /tmp/test_owner_files
+  share_mem_path: /tmp/test_owner
   large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
@@ -1931,8 +1919,7 @@ contribute_to_cluster_pool_size:
 fluxonkv_spec:
   etcd_addresses: ["127.0.0.1:2379"]
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_owner
-  shared_file_path: /tmp/test_owner_files
+  share_mem_path: /tmp/test_owner
   large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
@@ -1966,8 +1953,7 @@ contribute_to_cluster_pool_size:
 fluxonkv_spec:
   etcd_addresses: ["127.0.0.1:2379"]
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_owner
-  shared_file_path: /tmp/test_owner_files
+  share_mem_path: /tmp/test_owner
   sub_cluster: rack-a
 test_spec_config:
   transport_mode: transfer_only
@@ -1986,9 +1972,7 @@ protocol:
   protocol_type: tcp
 fluxonkv_spec:
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_side_worker
-  shared_file_path: /tmp/test_side_worker_files
-  large_file_paths: [/tmp/test_side_worker_large]
+  share_mem_path: /tmp/test_side_worker
   p2p_listen_port: 18081
 test_spec_config:
   enable_side_transfer: true
@@ -1999,13 +1983,9 @@ test_spec_config:
         let verified = cfg.verify().unwrap();
         assert_eq!(verified.protocol.protocol_type, ProtocolType::Tcp);
         assert_eq!(
-            verified.shared_memory_path,
+            verified.share_mem_path,
             "/tmp/test_side_worker/test_cluster"
         );
-        assert_eq!(
-            verified.shared_file_path,
-            "/tmp/test_side_worker_files/test_cluster"
-        );
         assert_eq!(
             verified.fluxonkv_spec.transfer_engine,
             TransferEngineType::P2p
@@ -2026,9 +2006,7 @@ protocol:
   protocol_type: tcp
 fluxonkv_spec:
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_side_worker
-  shared_file_path: /tmp/test_side_worker_files
-  large_file_paths: [/tmp/test_side_worker_large]
+  share_mem_path: /tmp/test_side_worker
 test_spec_config:
   enable_side_transfer: true
   side_transfer_role: worker
@@ -2058,9 +2036,7 @@ protocol:
   protocol_type: tcp
 fluxonkv_spec:
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_side_worker
-  shared_file_path: /tmp/test_side_worker_files
-  large_file_paths: [/tmp/test_side_worker_large]
+  share_mem_path: /tmp/test_side_worker
 test_spec_config:
   enable_side_transfer: true
   side_transfer_role: worker
@@ -2088,8 +2064,7 @@ contribute_to_cluster_pool_size:
 fluxonkv_spec:
   etcd_addresses: ["127.0.0.1:2379"]
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_owner
-  shared_file_path: /tmp/test_owner_files
+  share_mem_path: /tmp/test_owner
   large_file_paths: [/tmp/test_owner_large]
   p2p_listen_port: 18081
   sub_cluster: rack-a
@@ -2121,8 +2096,7 @@ contribute_to_cluster_pool_size:
 fluxonkv_spec:
   etcd_addresses: ["127.0.0.1:2379"]
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_owner
-  shared_file_path: /tmp/test_owner_files
+  share_mem_path: /tmp/test_owner
   large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 "#,
@@ -2147,8 +2121,7 @@ contribute_to_cluster_pool_size:
 fluxonkv_spec:
   etcd_addresses: ["127.0.0.1:2379"]
   cluster_name: test_cluster
-  shared_memory_path: /tmp/test_owner
-  shared_file_path: /tmp/test_owner_files
+  share_mem_path: /tmp/test_owner
   large_file_paths: [/tmp/test_owner_large]
   sub_cluster: rack-a
 test_spec_config:
diff --git a/fluxon_rs/fluxon_kv/src/external_client_api/external_client_test.rs b/fluxon_rs/fluxon_kv/src/external_client_api/external_client_test.rs
index a43c021..b55f161 100644
--- a/fluxon_rs/fluxon_kv/src/external_client_api/external_client_test.rs
+++ b/fluxon_rs/fluxon_kv/src/external_client_api/external_client_test.rs
@@ -80,8 +80,7 @@ fn new_client_config(
             enable_transfer_rpc_fast_path: true,
             sub_cluster: None,
         },
-        shared_memory_path: shm_path.to_string(),
-        shared_file_path: format!("{}_files", shm_path),
+        share_mem_path: shm_path.to_string(),
         large_file_paths: LargeFilePaths {
             paths: vec![format!("{}_large", shm_path)],
         },
@@ -95,8 +94,7 @@ fn new_zero_contribution_client_config(
     shm_path: &str,
 ) -> ClientConfig {
     // External instance_key MUST be different from owner.
-    // External bootstrap shares both owner bundle roots: shared_memory_path for mmap.file and
-    // shared_file_path for shared.json / peer metadata.
+    // External bootstrap shares the owner bundle root for mmap.file, shared.json, and peer metadata.
     let unique_suffix = std::time::SystemTime::now()
         .duration_since(std::time::UNIX_EPOCH)
         .map(|d| d.as_nanos())
@@ -125,8 +123,7 @@ fn new_zero_contribution_client_config(
             enable_transfer_rpc_fast_path: false,
             sub_cluster: None,
         },
-        shared_memory_path: shm_path.to_string(),
-        shared_file_path: format!("{}_files", shm_path),
+        share_mem_path: shm_path.to_string(),
         large_file_paths: LargeFilePaths { paths: Vec::new() },
         test_spec_config: TestSpecConfig::default(),
     }
diff --git a/fluxon_rs/fluxon_kv/src/external_client_api/mod.rs b/fluxon_rs/fluxon_kv/src/external_client_api/mod.rs
index 3830e21..9cb291f 100644
--- a/fluxon_rs/fluxon_kv/src/external_client_api/mod.rs
+++ b/fluxon_rs/fluxon_kv/src/external_client_api/mod.rs
@@ -251,8 +251,7 @@ define_module!(
 /// External Client configuration parameters
 #[derive(Clone, Debug)]
 pub struct ExternalClientApiNewArg {
-    pub shared_memory_path: String,
-    pub shared_file_path: String,
+    pub share_mem_path: String,
     pub large_file_paths: crate::config::LargeFilePaths,
     pub expected_cluster_name: String,
     pub expected_protocol_version: String,
@@ -311,8 +310,7 @@ pub struct ExternalInner {
     initial_sub_cluster: OnceLock<Option<String>>,
     expected_cluster_name: String,
     expected_protocol_version: String,
-    external_shared_memory_path: String,
-    external_shared_file_path: String,
+    external_share_mem_path: String,
     external_large_file_paths: crate::config::LargeFilePaths,
     _enable_side_transfer: bool,
     short_circuit_put_payload_path: bool,
@@ -352,7 +350,7 @@ impl ExternalClientApi {
     pub async fn construct(arg: ExternalClientApiNewArg) -> Result<Self, KvError> {
         tracing::info!(
             "Constructing ExternalClientApi in ExternalClient mode (PreView): shm_dir={}",
-            arg.shared_memory_path
+            arg.share_mem_path
         );
 
         Ok(Self(ExternalInner {
@@ -363,8 +361,7 @@ impl ExternalClientApi {
             initial_sub_cluster: OnceLock::new(),
             expected_cluster_name: arg.expected_cluster_name,
             expected_protocol_version: arg.expected_protocol_version,
-            external_shared_memory_path: arg.shared_memory_path,
-            external_shared_file_path: arg.shared_file_path,
+            external_share_mem_path: arg.share_mem_path,
             external_large_file_paths: arg.large_file_paths,
             _enable_side_transfer: arg.enable_side_transfer,
             short_circuit_put_payload_path: arg.short_circuit_put_payload_path,
@@ -406,8 +403,7 @@ impl ExternalClientApi {
             let wait_start_ts = i64::MIN;
             let OwnerRestartPayload { meta, signature } = task_wait_owner_restart(
                 ext.view.clone_view(),
-                ext.external_shared_memory_path.clone(),
-                ext.external_shared_file_path.clone(),
+                ext.external_share_mem_path.clone(),
                 None,
                 wait_start_ts,
                 None,
@@ -417,7 +413,7 @@ impl ExternalClientApi {
             .await?;
 
             let shared_memory_ptr = ExternalInner::init_shared_memory_from_meta(
-                &ext.external_shared_memory_path,
+                &ext.external_share_mem_path,
                 &meta,
                 signature,
             )?;
@@ -846,13 +842,11 @@ impl ExternalInner {
             return Ok(false);
         };
 
-        let shared_memory_path = self.shared_memory_path();
-        let shared_file_path = self.shared_file_path();
-        let shared_meta_path = format!("{}/shared.json", shared_file_path);
+        let share_mem_path = self.share_mem_path();
+        let shared_meta_path = format!("{}/shared.json", share_mem_path);
         let probe = probe_owner_restart_payload(
             &self.view.clone_view(),
-            &shared_memory_path,
-            &shared_file_path,
+            &share_mem_path,
             &shared_meta_path,
             Some(&current_signature),
             i64::MIN,
@@ -871,7 +865,7 @@ impl ExternalInner {
             return Ok(false);
         }
 
-        self.finish_owner_recover(&shared_memory_path, payload)
+        self.finish_owner_recover(&share_mem_path, payload)
             .await?;
         Ok(true)
     }
@@ -924,7 +918,7 @@ impl ExternalInner {
         match self.base_ptr().await {
             Ok(addr) => Ok(addr),
             Err(_) => {
-                let path = self.shared_memory_path();
+                let path = self.share_mem_path();
                 let (st, addr) = self
                     .wait_owner_recover_only(&path, *prev_owner_start_time)
                     .await?;
@@ -938,10 +932,10 @@ impl ExternalInner {
 
     async fn finish_owner_recover(
         &self,
-        shared_memory_path: &str,
+        share_mem_path: &str,
         payload: OwnerRestartPayload,
     ) -> KvResult<(i64, usize)> {
-        self.remap_shared_memory_with_payload(shared_memory_path, &payload)
+        self.remap_shared_memory_with_payload(share_mem_path, &payload)
             .await?;
         self.view
             .cluster_manager()
@@ -963,10 +957,10 @@ impl ExternalInner {
 
     async fn wait_owner_recover_only(
         &self,
-        shared_memory_path: &str,
+        share_mem_path: &str,
         prev_owner_start_time: i64,
     ) -> KvResult<(i64, usize)> {
-        self.wait_owner_recover(shared_memory_path, prev_owner_start_time)
+        self.wait_owner_recover(share_mem_path, prev_owner_start_time)
             .await
     }
 
@@ -974,7 +968,7 @@ impl ExternalInner {
         &self,
         prev_owner_start_time: &mut i64,
     ) -> KvResult<usize> {
-        let path = self.shared_memory_path();
+        let path = self.share_mem_path();
         let (st, addr) = self
             .wait_owner_recover_only(&path, *prev_owner_start_time)
             .await?;
@@ -990,7 +984,7 @@ impl ExternalInner {
             return match self.base_ptr().await {
                 Ok(addr) => Ok(addr),
                 Err(_) => {
-                    let path = self.shared_memory_path();
+                    let path = self.share_mem_path();
                     let (st, addr) = self
                         .wait_owner_recover_only(&path, *prev_owner_start_time)
                         .await?;
@@ -1000,7 +994,7 @@ impl ExternalInner {
             };
         }
 
-        let path = self.shared_memory_path();
+        let path = self.share_mem_path();
         let (st, addr) = self
             .wait_owner_recover_only(&path, *prev_owner_start_time)
             .await?;
@@ -1012,7 +1006,7 @@ impl ExternalInner {
     /// has advanced.
     async fn wait_owner_recover(
         &self,
-        _shared_memory_path: &str,
+        _share_mem_path: &str,
         prev_owner_start_time: i64,
     ) -> KvResult<(i64, usize)> {
         if let Some(res) = self
@@ -1093,11 +1087,11 @@ impl ExternalInner {
 
     async fn remap_shared_memory_with_payload(
         &self,
-        shared_memory_path: &str,
+        share_mem_path: &str,
         payload: &OwnerRestartPayload,
     ) -> KvResult<()> {
         let shared_memory = Self::init_shared_memory_from_meta(
-            shared_memory_path,
+            share_mem_path,
             &payload.meta,
             payload.signature.clone(),
         )?;
@@ -1215,11 +1209,11 @@ impl ExternalInner {
     }
 
     fn init_shared_memory_from_meta(
-        shared_memory_path: &str,
+        share_mem_path: &str,
         meta: &SharedJsonMeta,
         memory_signature: SharedMetaSignature,
     ) -> KvResult<Arc<SharedMemoryPtr>> {
-        let mmap_file_path = format!("{}/mmap.file", shared_memory_path);
+        let mmap_file_path = format!("{}/mmap.file", share_mem_path);
         Self::init_shared_memory(&mmap_file_path, meta.segment_len, memory_signature)
     }
     /// Get the shared storage node ID this client connects to
@@ -1230,14 +1224,8 @@ impl ExternalInner {
 
     /// Get the configured shared-memory base path (external mode).
     /// Non-external modes return empty string.
-    pub fn shared_memory_path(&self) -> String {
-        self.external_shared_memory_path.clone()
-    }
-
-    /// Get the configured shared-file base path (external mode).
-    /// Non-external modes return empty string.
-    pub fn shared_file_path(&self) -> String {
-        self.external_shared_file_path.clone()
+    pub fn share_mem_path(&self) -> String {
+        self.external_share_mem_path.clone()
     }
 
     pub fn large_file_paths(&self) -> &crate::config::LargeFilePaths {
@@ -1279,7 +1267,7 @@ impl ExternalInner {
         // require an extra enable flag once the owner has published ready lanes.
         let owner_id = self.shared_storage_node_id().await?;
         let owner_start_time = self.current_owner_start_time().await;
-        let peers_dir = ClientSegPool::side_transfer_peers_dir(&self.external_shared_file_path);
+        let peers_dir = ClientSegPool::side_transfer_peers_dir(&self.external_share_mem_path);
         let entries = std::fs::read_dir(&peers_dir).ok()?;
         let mut ready = Vec::new();
         for entry in entries.flatten() {
@@ -1541,7 +1529,7 @@ impl ExternalInner {
         let mut prev_owner_start_time = self.current_owner_start_time().await;
         let mut recover_attempts = 0usize;
         if self.base_ptr().await.is_err() {
-            let path = self.shared_memory_path();
+            let path = self.share_mem_path();
             tracing::info!("ExternalClientApi.is_exist waiting for owner at: {}", path);
             let _ = self.ensure_owner_ready(&mut prev_owner_start_time).await?;
         }
@@ -1632,7 +1620,7 @@ impl ExternalInner {
         // Ensure external mode configured; if not, block until owner is ready once
         let mut prev_owner_start_time = self.current_owner_start_time().await;
         if self.base_ptr().await.is_err() {
-            let path = self.shared_memory_path();
+            let path = self.share_mem_path();
             tracing::info!(
                 "ExternalClientApi.get detected unmapped shared memory; waiting at: {}",
                 path
@@ -1828,7 +1816,7 @@ key={}, attempt={}/{}, err={}",
         let mut base_addr: usize = match self.base_ptr().await {
             Ok(addr) => addr,
             Err(_) => {
-                let path = self.shared_memory_path();
+                let path = self.share_mem_path();
                 tracing::info!(
                     "ExternalClientApi.put detected unmapped shared memory; waiting for owner to be ready at path: {}",
                     path
@@ -1917,7 +1905,7 @@ key={}, attempt={}/{}, err={}",
         let mut base_addr: usize = match self.base_ptr().await {
             Ok(addr) => addr,
             Err(_) => {
-                let path = self.shared_memory_path();
+                let path = self.share_mem_path();
                 tracing::info!(
                     "ExternalClientApi.put_flat_dict_ptrs detected unmapped shared memory; waiting for owner to be ready at path: {}",
                     path
@@ -2307,7 +2295,7 @@ key={}, attempt={}/{}, err={}",
         let mut prev_owner_start_time = self.current_owner_start_time().await;
         let mut recover_attempts = 0usize;
         if self.base_ptr().await.is_err() {
-            let path = self.shared_memory_path();
+            let path = self.share_mem_path();
             tracing::info!("ExternalClientApi.delete waiting for owner at: {}", path);
             let _ = self.ensure_owner_ready(&mut prev_owner_start_time).await?;
         }
@@ -2671,8 +2659,7 @@ async fn handle_sync_kv_to_file_external(
 
 async fn task_wait_owner_restart(
     view: ExternalClientApiView,
-    shared_memory_path: String,
-    shared_file_path: String,
+    share_mem_path: String,
     current_sig_snapshot: Option<SharedMetaSignature>,
     wait_start_ts: i64,
     old_owner_id: Option<String>,
@@ -2681,7 +2668,7 @@ async fn task_wait_owner_restart(
 ) -> KvResult<OwnerRestartPayload> {
     let shutdown_poller = view.register_shutdown_poller();
     let mut cluster_rx = view.cluster_manager().listen();
-    let shared_meta_path = format!("{}/shared.json", &shared_file_path);
+    let shared_meta_path = format!("{}/shared.json", &share_mem_path);
     let mut waited = 0u64;
     loop {
         if !shutdown_poller.is_running() {
@@ -2692,8 +2679,7 @@ async fn task_wait_owner_restart(
 
         match probe_owner_restart_payload(
             &view,
-            &shared_memory_path,
-            &shared_file_path,
+            &share_mem_path,
             &shared_meta_path,
             current_sig_snapshot.as_ref(),
             wait_start_ts,
@@ -2742,8 +2728,7 @@ fn read_shared_json_snapshot(
 
 async fn probe_owner_restart_payload(
     view: &ExternalClientApiView,
-    shared_memory_path: &str,
-    shared_file_path: &str,
+    share_mem_path: &str,
     shared_meta_path: &str,
     current_sig_snapshot: Option<&SharedMetaSignature>,
     wait_start_ts: i64,
@@ -2751,16 +2736,16 @@ async fn probe_owner_restart_payload(
     expected_cluster_name: &str,
     expected_protocol_version: &str,
 ) -> KvResult<OwnerRestartProbe> {
-    if !fluxon_util::fs_watch::are_files_ready(shared_memory_path, &["mmap.file"]) {
+    if !fluxon_util::fs_watch::are_files_ready(share_mem_path, &["mmap.file"]) {
         return Ok(OwnerRestartProbe::Pending(format!(
             "shared memory mmap.file not ready yet: path={}",
-            shared_memory_path
+            share_mem_path
         )));
     }
-    if !fluxon_util::fs_watch::are_files_ready(shared_file_path, &["shared.json"]) {
+    if !fluxon_util::fs_watch::are_files_ready(share_mem_path, &["shared.json"]) {
         return Ok(OwnerRestartProbe::Pending(format!(
             "shared metadata shared.json not ready yet: path={}",
-            shared_file_path
+            share_mem_path
         )));
     }
 
@@ -2783,13 +2768,13 @@ async fn probe_owner_restart_payload(
     if meta.protocol_version != expected_protocol_version {
         return Ok(OwnerRestartProbe::Pending(format!(
             "shared.json protocol_version mismatch; waiting: shm_dir='{}' shared='{}' local='{}'",
-            shared_memory_path, meta.protocol_version, expected_protocol_version
+            share_mem_path, meta.protocol_version, expected_protocol_version
         )));
     }
     if meta.cluster_name != expected_cluster_name {
         return Ok(OwnerRestartProbe::Pending(format!(
             "shared.json cluster_name mismatch; waiting: shm_dir='{}' shared='{}' local='{}'",
-            shared_memory_path, meta.cluster_name, expected_cluster_name
+            share_mem_path, meta.cluster_name, expected_cluster_name
         )));
     }
     if let Some(old_owner_id) = old_owner_id {
@@ -2859,7 +2844,7 @@ impl LogicalModule for ExternalClientApi {
     async fn shutdown(&self) -> Result<(), Self::Error> {
         // 只在ExternalClient模式下清理共享内存映射
         let ext = &self.0;
-        if ext.shared_memory_path().is_empty() {
+        if ext.share_mem_path().is_empty() {
             tracing::info!("ExternalClientApi shutdown (no shared memory path configured)");
             return Ok(());
         }
diff --git a/fluxon_rs/fluxon_kv/src/kv_test.rs b/fluxon_rs/fluxon_kv/src/kv_test.rs
index 0ede369..5f0a9e2 100644
--- a/fluxon_rs/fluxon_kv/src/kv_test.rs
+++ b/fluxon_rs/fluxon_kv/src/kv_test.rs
@@ -609,8 +609,7 @@ struct KvTestClientOptions {
     transfer_backend_activation_mode: Option<TransferBackendActivationMode>,
     enable_transfer_rpc_fast_path: Option<bool>,
     contribute_to_cluster_pool_size: Option<ContributeToClusterPoolSize>,
-    shared_memory_path: Option<String>,
-    shared_file_path: Option<String>,
+    share_mem_path: Option<String>,
     etcd_mode: Option<KvTestEtcdMode>,
 }
 
@@ -639,14 +638,10 @@ impl KvTestClientOptions {
                 .contribute_to_cluster_pool_size
                 .clone()
                 .or_else(|| self.contribute_to_cluster_pool_size.clone()),
-            shared_memory_path: overrides
-                .shared_memory_path
+            share_mem_path: overrides
+                .share_mem_path
                 .clone()
-                .or_else(|| self.shared_memory_path.clone()),
-            shared_file_path: overrides
-                .shared_file_path
-                .clone()
-                .or_else(|| self.shared_file_path.clone()),
+                .or_else(|| self.share_mem_path.clone()),
             etcd_mode: overrides
                 .etcd_mode
                 .clone()
@@ -800,7 +795,7 @@ impl KvTestRoundOptions {
         )
     }
 
-    fn step8_shared_memory_path(&self) -> String {
+    fn step8_share_mem_path(&self) -> String {
         format!(
             "/tmp/kvcache_shared_memory_step8_{}_{}",
             self.round_name,
@@ -808,13 +803,6 @@ impl KvTestRoundOptions {
         )
     }
 
-    fn step8_shared_file_path(&self) -> String {
-        format!(
-            "/tmp/kvcache_shared_files_step8_{}_{}",
-            self.round_name,
-            kv_test_run_scope()
-        )
-    }
 }
 
 #[derive(Clone, Debug)]
@@ -872,8 +860,7 @@ fn default_owner_test_client_options(round_profile: KvTestRoundProfile) -> KvTes
         transfer_backend_activation_mode: round_profile.owner_transfer_backend_activation_mode(),
         enable_transfer_rpc_fast_path: Some(round_profile.enable_transfer_rpc_fast_path()),
         contribute_to_cluster_pool_size: Some(default_owner_contribute_to_cluster_pool_size()),
-        shared_memory_path: None,
-        shared_file_path: None,
+        share_mem_path: None,
         etcd_mode: Some(KvTestEtcdMode::Enabled),
     }
 }
@@ -886,8 +873,7 @@ fn default_master_test_client_options(round_profile: KvTestRoundProfile) -> KvTe
         transfer_backend_activation_mode: round_profile.master_transfer_backend_activation_mode(),
         enable_transfer_rpc_fast_path: Some(round_profile.enable_transfer_rpc_fast_path()),
         contribute_to_cluster_pool_size: None,
-        shared_memory_path: None,
-        shared_file_path: None,
+        share_mem_path: None,
         etcd_mode: None,
     }
 }
@@ -900,8 +886,7 @@ fn default_external_test_client_options() -> KvTestClientOptions {
         transfer_backend_activation_mode: None,
         enable_transfer_rpc_fast_path: Some(false),
         contribute_to_cluster_pool_size: Some(default_external_contribute_to_cluster_pool_size()),
-        shared_memory_path: None,
-        shared_file_path: None,
+        share_mem_path: None,
         etcd_mode: Some(KvTestEtcdMode::Disabled),
     }
 }
@@ -1037,12 +1022,9 @@ fn build_client_launch(
     let contribute_to_cluster_pool_size = options
         .contribute_to_cluster_pool_size
         .unwrap_or(default_owner_contribute_to_cluster_pool_size());
-    let shared_memory_path = options
-        .shared_memory_path
+    let share_mem_path = options
+        .share_mem_path
         .unwrap_or_else(|| format!("/tmp/kvcache_shared_memory/{}", instance_key));
-    let shared_file_path = options
-        .shared_file_path
-        .unwrap_or_else(|| format!("/tmp/kvcache_shared_files/{}", instance_key));
     let config = ClientConfig {
         cluster_name: round.cluster_name.clone(),
         etcd_addresses_raw,
@@ -1067,8 +1049,7 @@ fn build_client_launch(
         // kv_test uses a per-instance shared memory path by default so each owner/external share
         // group is explicit and test overrides only replace this when a scenario intentionally
         // binds multiple roles to the same owner path.
-        shared_memory_path,
-        shared_file_path,
+        share_mem_path,
         large_file_paths: default_client_large_file_paths(
             &instance_key,
             &contribute_to_cluster_pool_size,
@@ -1102,7 +1083,7 @@ fn new_client_launch(
 }
 
 /// 创建测试用的ExternalClient配置
-/// external 与 owner 的 instance_key 必须不同；仅共享 owner 的 shared_memory_path
+/// external 与 owner 的 instance_key 必须不同；仅共享 owner 的 share_mem_path
 fn new_external_client_launch(
     round: &KvTestRoundOptions,
     external_instance_key: &str,
@@ -1127,18 +1108,12 @@ fn new_external_client_launch(
     if external_options.enable_transfer_rpc_fast_path.is_none() {
         external_options.enable_transfer_rpc_fast_path = Some(false);
     }
-    if external_options.shared_memory_path.is_none() {
-        external_options.shared_memory_path = Some(format!(
+    if external_options.share_mem_path.is_none() {
+        external_options.share_mem_path = Some(format!(
             "/tmp/kvcache_shared_memory/{}",
             round.scoped_instance_key(owner_instance_key)
         ));
     }
-    if external_options.shared_file_path.is_none() {
-        external_options.shared_file_path = Some(format!(
-            "/tmp/kvcache_shared_files/{}",
-            round.scoped_instance_key(owner_instance_key)
-        ));
-    }
     build_client_launch(
         round,
         round.scoped_instance_key(external_instance_key),
@@ -1605,30 +1580,17 @@ async fn shutdown_framework_with_timeout(label: &str, framework: &crate::Framewo
 async fn run_kv_step8(round: &KvTestRoundOptions) {
     info!("📋 Step 8: Verifying external client blocking and recovery behavior");
 
-    let step8_shared_memory_path = round.step8_shared_memory_path();
-    let step8_shared_file_path = round.step8_shared_file_path();
-    if let Err(e) = fs::remove_dir_all(&step8_shared_memory_path) {
+    let step8_share_mem_path = round.step8_share_mem_path();
+    if let Err(e) = fs::remove_dir_all(&step8_share_mem_path) {
         warn!(
             "Step 8: failed to remove existing shared memory dir {}: {}",
-            step8_shared_memory_path, e
+            step8_share_mem_path, e
         );
     }
-    if let Err(e) = fs::create_dir_all(&step8_shared_memory_path) {
+    if let Err(e) = fs::create_dir_all(&step8_share_mem_path) {
         warn!(
             "Step 8: failed to pre-create shared memory dir {}: {}",
-            step8_shared_memory_path, e
-        );
-    }
-    if let Err(e) = fs::remove_dir_all(&step8_shared_file_path) {
-        warn!(
-            "Step 8: failed to remove existing shared file dir {}: {}",
-            step8_shared_file_path, e
-        );
-    }
-    if let Err(e) = fs::create_dir_all(&step8_shared_file_path) {
-        warn!(
-            "Step 8: failed to pre-create shared file dir {}: {}",
-            step8_shared_file_path, e
+            step8_share_mem_path, e
         );
     }
 
@@ -1649,15 +1611,13 @@ async fn run_kv_step8(round: &KvTestRoundOptions) {
     let step8_owner_options = round
         .owner_client_options
         .merged_with(&KvTestClientOptions {
-            shared_memory_path: Some(step8_shared_memory_path.clone()),
-            shared_file_path: Some(step8_shared_file_path.clone()),
+            share_mem_path: Some(step8_share_mem_path.clone()),
             ..Default::default()
         });
     let step8_external_options = round
         .external_client_options
         .merged_with(&KvTestClientOptions {
-            shared_memory_path: Some(step8_shared_memory_path.clone()),
-            shared_file_path: Some(step8_shared_file_path.clone()),
+            share_mem_path: Some(step8_share_mem_path.clone()),
             ..Default::default()
         });
 
@@ -1859,16 +1819,10 @@ async fn run_kv_step8(round: &KvTestRoundOptions) {
         .await;
     shutdown_framework_with_timeout("step8 master", &master_framework_step8).await;
 
-    if let Err(e) = fs::remove_dir_all(&step8_shared_memory_path) {
+    if let Err(e) = fs::remove_dir_all(&step8_share_mem_path) {
         warn!(
             "Step 8: failed to clean shared memory dir {} on exit: {}",
-            step8_shared_memory_path, e
-        );
-    }
-    if let Err(e) = fs::remove_dir_all(&step8_shared_file_path) {
-        warn!(
-            "Step 8: failed to clean shared file dir {} on exit: {}",
-            step8_shared_file_path, e
+            step8_share_mem_path, e
         );
     }
 }
@@ -2085,7 +2039,7 @@ async fn run_kv_round(round: &KvTestRoundOptions) {
 
         // 启动多个客户端节点
         let client1_launch = new_client_launch(round, "test_client_1", None);
-        // external 与 owner 使用不同的 instance_key，但共享 owner 的 shared_memory_path
+        // external 与 owner 使用不同的 instance_key，但共享 owner 的 share_mem_path
         let client2_launch =
             new_external_client_launch(round, "test_client_1_ext2", "test_client_1", None);
         let client3_launch =
diff --git a/fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs b/fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs
index 1a64c83..778666f 100644
--- a/fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs
+++ b/fluxon_rs/fluxon_kv/src/kvcore_test_lib.rs
@@ -121,8 +121,7 @@ fn new_client_config_with_cluster_and_dram(
         .expect("read raw etcd endpoint from build_config_ext.yml");
     // Shared memory path lives under the same test workdir base used by master logs
     let base = test_workdir_base();
-    let shared_memory_path = format!("{}/sharemem/{}", base, instance_key);
-    let shared_file_path = format!("{}/sharefile/{}", base, instance_key);
+    let share_mem_path = format!("{}/sharemem/{}", base, instance_key);
     let conf = ClientConfig {
         cluster_name: cluster_name.to_string(),
         etcd_addresses_raw: vec![etcd_raw],
@@ -145,8 +144,7 @@ fn new_client_config_with_cluster_and_dram(
             enable_transfer_rpc_fast_path: true,
             sub_cluster: None,
         },
-        shared_memory_path,
-        shared_file_path,
+        share_mem_path,
         large_file_paths: crate::config::LargeFilePaths {
             paths: vec![format!("{}/large/{}", base, instance_key)],
         },
diff --git a/fluxon_rs/fluxon_kv/src/lib.rs b/fluxon_rs/fluxon_kv/src/lib.rs
index 94bb34d..edaa386 100644
--- a/fluxon_rs/fluxon_kv/src/lib.rs
+++ b/fluxon_rs/fluxon_kv/src/lib.rs
@@ -107,15 +107,11 @@ use tracing::{info, warn};
 
 struct ExternalBootstrapBundle {
     meta: SharedJsonMeta,
-    shared_memory_path: String,
-    shared_file_path: String,
-    etcd_endpoints: Vec<String>,
 }
 
 struct ExternalBootstrapMetadata {
     meta: SharedJsonMeta,
-    shared_memory_path: String,
-    shared_file_path: String,
+    share_mem_path: String,
     etcd_endpoints: Vec<String>,
 }
 
@@ -799,8 +795,7 @@ fn build_side_transfer_worker_config(
             enable_transfer_rpc_fast_path: false,
             sub_cluster: None,
         },
-        shared_memory_path: owner_config.shared_memory_path.clone(),
-        shared_file_path: owner_config.shared_file_path.clone(),
+        share_mem_path: owner_config.share_mem_path.clone(),
         large_file_paths: owner_config.large_file_paths.clone(),
         test_spec_config,
     })
@@ -844,8 +839,7 @@ fn build_side_transfer_worker_config_yaml(
         fluxonkv_spec: crate::config::FluxonKvSpecYaml {
             etcd_addresses: None,
             cluster_name: side_config.cluster_name,
-            shared_memory_path: side_config.shared_memory_path,
-            shared_file_path: side_config.shared_file_path,
+            share_mem_path: side_config.share_mem_path,
             large_file_paths: None,
             p2p_listen_port: side_config.fluxonkv_spec.p2p_listen_port,
             redis_compat: None,
@@ -863,7 +857,7 @@ fn side_transfer_runtime_dir(owner_config: &ClientConfig) -> PathBuf {
 }
 
 fn cluster_manager_local_ipc_root(
-    shared_memory_path: &str,
+    share_mem_path: &str,
     test_spec_config: &TestSpecConfig,
 ) -> Option<String> {
     // Test-only override:
@@ -881,35 +875,35 @@ fn cluster_manager_local_ipc_root(
     // they do not need to reuse the same literal filesystem path.
     //
     // Causal chain:
-    // - `shared_memory_path` is authoritative for mmap.file/shared.json coordination and can be long.
+    // - `share_mem_path` is authoritative for mmap.file/shared.json coordination and can be long.
     // - iceoryx2 event listeners materialize AF_UNIX socket files under `local_ipc_root`.
-    // - AF_UNIX paths are short; reusing a long `shared_memory_path` makes listener creation fail
+    // - AF_UNIX paths are short; reusing a long `share_mem_path` makes listener creation fail
     //   as `ResourceCreationFailed`, even on a clean start with no stale resources.
     // - Therefore we derive a short, stable alias from the canonical shared-memory root and publish
     //   only that alias as `local_ipc_root`.
     Some(
-        derive_short_local_ipc_root(shared_memory_path)
+        derive_short_local_ipc_root(share_mem_path)
             .unwrap_or_else(|err| panic!("failed to derive local_ipc_root: {}", err)),
     )
 }
 
-fn derive_short_local_ipc_root(shared_memory_path: &str) -> Result<String> {
-    if shared_memory_path.trim().is_empty() {
-        anyhow::bail!("shared_memory_path cannot be empty");
+fn derive_short_local_ipc_root(share_mem_path: &str) -> Result<String> {
+    if share_mem_path.trim().is_empty() {
+        anyhow::bail!("share_mem_path cannot be empty");
     }
 
-    std::fs::create_dir_all(shared_memory_path).map_err(|e| {
+    std::fs::create_dir_all(share_mem_path).map_err(|e| {
         anyhow::anyhow!(
-            "shared_memory_path must be creatable before deriving local_ipc_root: path='{}', err={}",
-            shared_memory_path,
+            "share_mem_path must be creatable before deriving local_ipc_root: path='{}', err={}",
+            share_mem_path,
             e
         )
     })?;
 
-    let canonical = std::fs::canonicalize(shared_memory_path).map_err(|e| {
+    let canonical = std::fs::canonicalize(share_mem_path).map_err(|e| {
         anyhow::anyhow!(
-            "shared_memory_path must be canonicalizable before deriving local_ipc_root: path='{}', err={}",
-            shared_memory_path,
+            "share_mem_path must be canonicalizable before deriving local_ipc_root: path='{}', err={}",
+            share_mem_path,
             e
         )
     })?;
@@ -1117,22 +1111,22 @@ fn format_side_transfer_worker_output_tails(worker: &SideTransferWorkerProcess)
 }
 
 fn read_side_transfer_peer_file(
-    shared_file_path: &str,
+    share_mem_path: &str,
     side_id: &str,
 ) -> Option<crate::client_seg_pool::SideTransferPeerFileMeta> {
-    let peer_path = ClientSegPool::side_transfer_peer_file_path(shared_file_path, side_id);
+    let peer_path = ClientSegPool::side_transfer_peer_file_path(share_mem_path, side_id);
     let payload = std::fs::read_to_string(&peer_path).ok()?;
     serde_json::from_str::<crate::client_seg_pool::SideTransferPeerFileMeta>(&payload).ok()
 }
 
 fn is_side_transfer_worker_ready(
     _cluster_manager: &ClusterManager,
-    shared_file_path: &str,
+    share_mem_path: &str,
     owner_id: &str,
     owner_start_time: i64,
     side_id: &str,
 ) -> bool {
-    let Some(meta) = read_side_transfer_peer_file(shared_file_path, side_id) else {
+    let Some(meta) = read_side_transfer_peer_file(share_mem_path, side_id) else {
         return false;
     };
     // Peer files are written only after the worker has attached shared memory and finished
@@ -1162,8 +1156,8 @@ fn start_side_transfer_worker(
 }
 
 fn cleanup_stale_side_transfer_bootstrap_artifacts(owner_config: &ClientConfig) -> Result<()> {
-    let shared_file_path = Path::new(&owner_config.shared_file_path);
-    let shared_json_path = shared_file_path.join("shared.json");
+    let share_mem_path = Path::new(&owner_config.share_mem_path);
+    let shared_json_path = share_mem_path.join("shared.json");
     match std::fs::remove_file(&shared_json_path) {
         Ok(()) => {
             info!(
@@ -1182,7 +1176,7 @@ fn cleanup_stale_side_transfer_bootstrap_artifacts(owner_config: &ClientConfig)
         }
     }
 
-    let peers_dir = ClientSegPool::side_transfer_peers_dir(&owner_config.shared_file_path);
+    let peers_dir = ClientSegPool::side_transfer_peers_dir(&owner_config.share_mem_path);
     match std::fs::remove_dir_all(&peers_dir) {
         Ok(()) => {
             info!(
@@ -1229,7 +1223,7 @@ async fn wait_for_side_transfer_workers_ready(
             }
             if is_side_transfer_worker_ready(
                 cluster_manager,
-                &owner_config.shared_file_path,
+                &owner_config.share_mem_path,
                 &owner_info.id,
                 owner_info.node_start_time,
                 &worker.side_id,
@@ -1599,31 +1593,24 @@ async fn bootstrap_zero_contribution_client_config(config: ClientConfig) -> KvRe
         return Ok(config);
     }
 
-    let metadata = load_external_bootstrap_metadata(
-        &config.shared_memory_path,
-        &config.shared_file_path,
-        &config.cluster_name,
-    )
-    .await?;
+    let metadata =
+        load_external_bootstrap_metadata(&config.share_mem_path, &config.cluster_name).await?;
     let mut final_config = config;
     final_config.etcd_addresses_raw = metadata.meta.etcd_addresses.clone();
     final_config.fluxonkv_spec.etcd_addresses = metadata.etcd_endpoints;
     final_config.fluxonkv_spec.sub_cluster = metadata.meta.sub_cluster.clone();
-    final_config.shared_memory_path = metadata.shared_memory_path;
-    final_config.shared_file_path = metadata.shared_file_path;
+    final_config.share_mem_path = metadata.share_mem_path;
     final_config.large_file_paths = metadata.meta.large_file_paths;
     Ok(final_config)
 }
 
 async fn load_external_bootstrap_metadata(
-    shared_memory_path: &str,
-    shared_file_path: &str,
+    share_mem_path: &str,
     expected_cluster_name: &str,
 ) -> KvResult<ExternalBootstrapMetadata> {
     let build_version = fluxon_util::git_version_build_record::get_current_git_commitid().unwrap();
-    let shared_memory_dir = Path::new(shared_memory_path);
-    let shared_file_dir = Path::new(shared_file_path);
-    let shared_json_path = shared_file_dir.join("shared.json");
+    let share_mem_dir = Path::new(share_mem_path);
+    let shared_json_path = share_mem_dir.join("shared.json");
 
     let mut waited_ticks: u64 = 0;
     loop {
@@ -1666,10 +1653,9 @@ async fn load_external_bootstrap_metadata(
             waited_ticks += 1;
             if waited_ticks % 25 == 0 {
                 warn!(
-                    "Waiting protocol_version match... ({}s), shm_dir='{}' file_dir='{}', shared='{}', local='{}'",
+                    "Waiting protocol_version match... ({}s), share_mem_dir='{}', shared='{}', local='{}'",
                     waited_ticks / 5,
-                    shared_memory_dir.to_string_lossy(),
-                    shared_file_dir.to_string_lossy(),
+                    share_mem_dir.to_string_lossy(),
                     meta.protocol_version,
                     build_version
                 );
@@ -1682,10 +1668,9 @@ async fn load_external_bootstrap_metadata(
             waited_ticks += 1;
             if waited_ticks % 25 == 0 {
                 warn!(
-                    "Waiting cluster_name match... ({}s), shm_dir='{}' file_dir='{}', config='{}', shared.json='{}'",
+                    "Waiting cluster_name match... ({}s), share_mem_dir='{}', config='{}', shared.json='{}'",
                     waited_ticks / 5,
-                    shared_memory_dir.to_string_lossy(),
-                    shared_file_dir.to_string_lossy(),
+                    share_mem_dir.to_string_lossy(),
                     expected_cluster_name,
                     meta.cluster_name
                 );
@@ -1693,17 +1678,17 @@ async fn load_external_bootstrap_metadata(
             continue;
         }
 
-        let shared_memory_path_canonical = match std::fs::canonicalize(shared_memory_path) {
+        let share_mem_path_canonical = match std::fs::canonicalize(share_mem_path) {
             Ok(v) => v.to_string_lossy().into_owned(),
             Err(e) => {
                 limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
                 waited_ticks += 1;
                 if waited_ticks % 25 == 0 {
                     warn!(
-                        "Waiting shared_memory_path canonicalizable... ({}s), shm_dir='{}', path='{}', err={}",
+                        "Waiting share_mem_path canonicalizable... ({}s), share_mem_dir='{}', path='{}', err={}",
                         waited_ticks / 5,
-                        shared_memory_dir.to_string_lossy(),
-                        shared_memory_path,
+                        share_mem_dir.to_string_lossy(),
+                        share_mem_path,
                         e
                     );
                 }
@@ -1711,52 +1696,17 @@ async fn load_external_bootstrap_metadata(
             }
         };
 
-        let meta_shm_canonical = match std::fs::canonicalize(&meta.shared_memory_path) {
-            Ok(v) => v.to_string_lossy().into_owned(),
-            Err(e) => {
-                limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
-                waited_ticks += 1;
-                if waited_ticks % 25 == 0 {
-                    warn!(
-                        "Waiting shared.json shared_memory_path canonicalizable... ({}s), shm_dir='{}', path='{}', err={}",
-                        waited_ticks / 5,
-                        shared_memory_dir.to_string_lossy(),
-                        meta.shared_memory_path,
-                        e
-                    );
-                }
-                continue;
-            }
-        };
-
-        let shared_file_path_canonical = match std::fs::canonicalize(shared_file_path) {
-            Ok(v) => v.to_string_lossy().into_owned(),
-            Err(e) => {
-                limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
-                waited_ticks += 1;
-                if waited_ticks % 25 == 0 {
-                    warn!(
-                        "Waiting shared_file_path canonicalizable... ({}s), file_dir='{}', path='{}', err={}",
-                        waited_ticks / 5,
-                        shared_file_dir.to_string_lossy(),
-                        shared_file_path,
-                        e
-                    );
-                }
-                continue;
-            }
-        };
-        let meta_file_canonical = match std::fs::canonicalize(&meta.shared_file_path) {
+        let meta_shm_canonical = match std::fs::canonicalize(&meta.share_mem_path) {
             Ok(v) => v.to_string_lossy().into_owned(),
             Err(e) => {
                 limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
                 waited_ticks += 1;
                 if waited_ticks % 25 == 0 {
                     warn!(
-                        "Waiting shared.json shared_file_path canonicalizable... ({}s), file_dir='{}', path='{}', err={}",
+                        "Waiting shared.json share_mem_path canonicalizable... ({}s), share_mem_dir='{}', path='{}', err={}",
                         waited_ticks / 5,
-                        shared_file_dir.to_string_lossy(),
-                        meta.shared_file_path,
+                        share_mem_dir.to_string_lossy(),
+                        meta.share_mem_path,
                         e
                     );
                 }
@@ -1764,44 +1714,29 @@ async fn load_external_bootstrap_metadata(
             }
         };
 
-        if meta_shm_canonical != shared_memory_path_canonical {
+        if meta_shm_canonical != share_mem_path_canonical {
             limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
             waited_ticks += 1;
             if waited_ticks % 25 == 0 {
                 warn!(
-                    "Waiting shared_memory_path match... ({}s), shm_dir='{}', config='{}', shared.json='{}'",
+                    "Waiting share_mem_path match... ({}s), share_mem_dir='{}', config='{}', shared.json='{}'",
                     waited_ticks / 5,
-                    shared_memory_dir.to_string_lossy(),
-                    shared_memory_path_canonical,
+                    share_mem_dir.to_string_lossy(),
+                    share_mem_path_canonical,
                     meta_shm_canonical
                 );
             }
             continue;
         }
-        if meta_file_canonical != shared_file_path_canonical {
-            limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
-            waited_ticks += 1;
-            if waited_ticks % 25 == 0 {
-                warn!(
-                    "Waiting shared_file_path match... ({}s), file_dir='{}', config='{}', shared.json='{}'",
-                    waited_ticks / 5,
-                    shared_file_dir.to_string_lossy(),
-                    shared_file_path_canonical,
-                    meta_file_canonical
-                );
-            }
-            continue;
-        }
 
         if meta.etcd_addresses.is_empty() {
             limit_thirdparty::tokio::time::sleep(std::time::Duration::from_millis(200)).await;
             waited_ticks += 1;
             if waited_ticks % 25 == 0 {
                 warn!(
-                    "Waiting shared.json etcd_addresses non-empty... ({}s), shm_dir='{}' file_dir='{}', shared_memory_path='{}'",
+                    "Waiting shared.json etcd_addresses non-empty... ({}s), share_mem_dir='{}', share_mem_path='{}'",
                     waited_ticks / 5,
-                    shared_memory_dir.to_string_lossy(),
-                    shared_file_dir.to_string_lossy(),
+                    share_mem_dir.to_string_lossy(),
                     meta_shm_canonical
                 );
             }
@@ -1815,10 +1750,9 @@ async fn load_external_bootstrap_metadata(
                 waited_ticks += 1;
                 if waited_ticks % 25 == 0 {
                     warn!(
-                        "Waiting shared.json etcd_addresses valid... ({}s), shm_dir='{}' file_dir='{}', raw={:?}, err={}",
+                        "Waiting shared.json etcd_addresses valid... ({}s), share_mem_dir='{}', raw={:?}, err={}",
                         waited_ticks / 5,
-                        shared_memory_dir.to_string_lossy(),
-                        shared_file_dir.to_string_lossy(),
+                        share_mem_dir.to_string_lossy(),
                         meta.etcd_addresses,
                         e
                     );
@@ -1829,8 +1763,7 @@ async fn load_external_bootstrap_metadata(
 
         return Ok(ExternalBootstrapMetadata {
             meta,
-            shared_memory_path: meta_shm_canonical,
-            shared_file_path: meta_file_canonical,
+            share_mem_path: meta_shm_canonical,
             etcd_endpoints,
         });
     }
@@ -1839,16 +1772,11 @@ async fn load_external_bootstrap_metadata(
 async fn wait_for_external_bootstrap_bundle(
     config: &ClientConfig,
 ) -> KvResult<ExternalBootstrapBundle> {
-    let metadata = load_external_bootstrap_metadata(
-        &config.shared_memory_path,
-        &config.shared_file_path,
-        &config.cluster_name,
-    )
-    .await?;
-    let shared_memory_dir = Path::new(&metadata.shared_memory_path);
-    let shared_file_dir = Path::new(&metadata.shared_file_path);
-    let shared_json_path = shared_file_dir.join("shared.json");
-    let mmap_file_path = shared_memory_dir.join("mmap.file");
+    let metadata =
+        load_external_bootstrap_metadata(&config.share_mem_path, &config.cluster_name).await?;
+    let share_mem_dir = Path::new(&metadata.share_mem_path);
+    let shared_json_path = share_mem_dir.join("shared.json");
+    let mmap_file_path = share_mem_dir.join("mmap.file");
 
     let mut waited_ticks: u64 = 0;
     loop {
@@ -1857,10 +1785,9 @@ async fn wait_for_external_bootstrap_bundle(
             waited_ticks += 1;
             if waited_ticks % 25 == 0 {
                 info!(
-                    "Waiting owner shared bundle to be ready... ({}s), shm_dir={} file_dir={} (shared.json={}, mmap.file={})",
+                    "Waiting owner shared bundle to be ready... ({}s), share_mem_dir={} (shared.json={}, mmap.file={})",
                     waited_ticks / 5,
-                    shared_memory_dir.to_string_lossy(),
-                    shared_file_dir.to_string_lossy(),
+                    share_mem_dir.to_string_lossy(),
                     shared_json_path.exists(),
                     mmap_file_path.exists()
                 );
@@ -1869,9 +1796,6 @@ async fn wait_for_external_bootstrap_bundle(
         }
         return Ok(ExternalBootstrapBundle {
             meta: metadata.meta,
-            shared_memory_path: metadata.shared_memory_path,
-            shared_file_path: metadata.shared_file_path,
-            etcd_endpoints: metadata.etcd_endpoints,
         });
     }
 }
@@ -1934,14 +1858,14 @@ async fn run_client_impl(
 
     println!("Client config: {:?}", config);
     println!(
-        "Client shared_memory_path resolved to: {:?}",
-        config.shared_memory_path
+        "Client share_mem_path resolved to: {:?}",
+        config.share_mem_path
     );
 
     info!("Client config: {:?}", config);
     info!(
-        "Client shared_memory_path resolved to: {:?}",
-        config.shared_memory_path
+        "Client share_mem_path resolved to: {:?}",
+        config.share_mem_path
     );
     info!("Build version (git commit): {}", build_version);
     info!("Build version (source-sha256): {}", source_sha256);
@@ -2042,7 +1966,7 @@ async fn run_client_impl(
                 port: None,
                 metadata,
                 local_ipc_root: cluster_manager_local_ipc_root(
-                    &config.shared_memory_path,
+                    &config.share_mem_path,
                     &config.test_spec_config,
                 ),
                 rdma_control_init: rdma_control_init.clone(),
@@ -2065,8 +1989,7 @@ async fn run_client_impl(
                 test_spec_config: config.test_spec_config.clone(),
             },
             external_client_api_arg: ExternalClientApiNewArg {
-                shared_memory_path: config.shared_memory_path.clone(),
-                shared_file_path: config.shared_file_path.clone(),
+                share_mem_path: config.share_mem_path.clone(),
                 large_file_paths: config.large_file_paths.clone(),
                 expected_cluster_name: config.cluster_name.clone(),
                 expected_protocol_version: build_version.clone(),
@@ -2089,7 +2012,7 @@ async fn run_client_impl(
                 port: None,
                 metadata,
                 local_ipc_root: cluster_manager_local_ipc_root(
-                    &config.shared_memory_path,
+                    &config.share_mem_path,
                     &config.test_spec_config,
                 ),
                 rdma_control_init,
@@ -2117,8 +2040,7 @@ async fn run_client_impl(
             client_seg_pool_arg: ClientSegPoolNewArg {
                 contribute_size: config.contribute_to_cluster_pool_size.clone(),
                 // Read shared memory path from config (must not be empty).
-                shared_memory_path: config.shared_memory_path.clone(),
-                shared_file_path: config.shared_file_path.clone(),
+                share_mem_path: config.share_mem_path.clone(),
                 large_file_paths: config.large_file_paths.clone(),
                 cluster_name: config.cluster_name.clone(),
                 etcd_addresses: config.etcd_addresses_raw.clone(),
@@ -2271,7 +2193,7 @@ async fn run_client_impl(
                             Ok(None) => {
                                 if is_side_transfer_worker_ready(
                                     cluster_manager,
-                                    &reconcile_owner_config.shared_memory_path,
+                                    &reconcile_owner_config.share_mem_path,
                                     &reconcile_owner_info.id,
                                     reconcile_owner_info.node_start_time,
                                     &worker.side_id,
@@ -2542,8 +2464,7 @@ mod tests {
                 enable_transfer_rpc_fast_path: true,
                 sub_cluster: Some("owner-sub".to_string()),
             },
-            shared_memory_path: "/tmp/fluxon_side_transfer_test".to_string(),
-            shared_file_path: "/tmp/fluxon_side_transfer_test_files".to_string(),
+            share_mem_path: "/tmp/fluxon_side_transfer_test".to_string(),
             large_file_paths: crate::config::LargeFilePaths {
                 paths: vec!["/tmp/fluxon_side_transfer_test_large".to_string()],
             },
@@ -2612,11 +2533,11 @@ mod tests {
     #[test]
     fn derive_short_local_ipc_root_is_stable_for_canonical_path() {
         let tempdir = new_test_dir("fluxon_local_ipc_root_stable");
-        let shared_memory_root = tempdir.join("owner_shm");
-        std::fs::create_dir_all(&shared_memory_root).unwrap();
+        let share_mem_root = tempdir.join("owner_shm");
+        std::fs::create_dir_all(&share_mem_root).unwrap();
 
-        let canonical = std::fs::canonicalize(&shared_memory_root).unwrap();
-        let alias_a = derive_short_local_ipc_root(shared_memory_root.to_str().unwrap()).unwrap();
+        let canonical = std::fs::canonicalize(&share_mem_root).unwrap();
+        let alias_a = derive_short_local_ipc_root(share_mem_root.to_str().unwrap()).unwrap();
         let alias_b = derive_short_local_ipc_root(canonical.to_str().unwrap()).unwrap();
 
         assert_eq!(alias_a, alias_b);
@@ -2628,10 +2549,10 @@ mod tests {
     #[test]
     fn derive_short_local_ipc_root_keeps_iceoryx_event_path_short() {
         let tempdir = new_test_dir("fluxon_local_ipc_root_short");
-        let shared_memory_root = tempdir.join(
-            "this_is_a_deliberately_long_shared_memory_root_name_for_iceoryx_socket_length_checks",
+        let share_mem_root = tempdir.join(
+            "this_is_a_deliberately_long_share_mem_root_name_for_iceoryx_socket_length_checks",
         );
-        let alias = derive_short_local_ipc_root(shared_memory_root.to_str().unwrap()).unwrap();
+        let alias = derive_short_local_ipc_root(share_mem_root.to_str().unwrap()).unwrap();
         let example_event_path = format!("{}/iox2_254771654226413701181693419284.event", alias);
 
         assert!(Path::new(&alias).is_absolute());
@@ -2647,17 +2568,17 @@ mod tests {
     #[test]
     fn cluster_manager_local_ipc_root_respects_test_disable_switch() {
         let tempdir = new_test_dir("fluxon_local_ipc_root_disable_switch");
-        let shared_memory_root = tempdir.join("owner_shm");
-        std::fs::create_dir_all(&shared_memory_root).unwrap();
+        let share_mem_root = tempdir.join("owner_shm");
+        std::fs::create_dir_all(&share_mem_root).unwrap();
 
         let enabled = cluster_manager_local_ipc_root(
-            shared_memory_root.to_str().unwrap(),
+            share_mem_root.to_str().unwrap(),
             &TestSpecConfig::default(),
         );
         assert!(enabled.is_some());
 
         let disabled = cluster_manager_local_ipc_root(
-            shared_memory_root.to_str().unwrap(),
+            share_mem_root.to_str().unwrap(),
             &TestSpecConfig {
                 disable_local_ipc: true,
                 ..Default::default()
@@ -2794,13 +2715,11 @@ mod tests {
     #[tokio::test]
     async fn zero_contribution_bootstrap_inherits_large_file_paths_from_owner_shared_json() {
         let tempdir = new_test_dir("fluxon_external_bootstrap_large_paths");
-        let shared_memory_root = tempdir.join("shared_mem");
-        let shared_file_root = tempdir.join("shared_file");
+        let share_mem_root = tempdir.join("shared_mem");
         let owner_large_root = tempdir.join("owner_large");
-        std::fs::create_dir_all(&shared_memory_root).unwrap();
-        std::fs::create_dir_all(&shared_file_root).unwrap();
+        std::fs::create_dir_all(&share_mem_root).unwrap();
         std::fs::create_dir_all(&owner_large_root).unwrap();
-        std::fs::write(shared_memory_root.join("mmap.file"), vec![0u8; 4096]).unwrap();
+        std::fs::write(share_mem_root.join("mmap.file"), vec![0u8; 4096]).unwrap();
 
         let shared_meta = SharedJsonMeta {
             owner_id: "owner-a".to_string(),
@@ -2810,11 +2729,7 @@ mod tests {
             sub_cluster: Some("owner-sub".to_string()),
             cluster_name: "test_cluster".to_string(),
             etcd_addresses: vec!["127.0.0.1:2379".to_string()],
-            shared_memory_path: std::fs::canonicalize(&shared_memory_root)
-                .unwrap()
-                .to_string_lossy()
-                .into_owned(),
-            shared_file_path: std::fs::canonicalize(&shared_file_root)
+            share_mem_path: std::fs::canonicalize(&share_mem_root)
                 .unwrap()
                 .to_string_lossy()
                 .into_owned(),
@@ -2829,7 +2744,7 @@ mod tests {
         assert!(shared_meta_json.contains("\"large_file_paths\":["));
         assert!(!shared_meta_json.contains("root_paths"));
         std::fs::write(
-            shared_file_root.join("shared.json"),
+            share_mem_root.join("shared.json"),
             shared_meta_json.as_bytes(),
         )
         .unwrap();
@@ -2856,8 +2771,7 @@ mod tests {
                 enable_transfer_rpc_fast_path: false,
                 sub_cluster: None,
             },
-            shared_memory_path: shared_memory_root.to_string_lossy().into_owned(),
-            shared_file_path: shared_file_root.to_string_lossy().into_owned(),
+            share_mem_path: share_mem_root.to_string_lossy().into_owned(),
             large_file_paths: crate::config::LargeFilePaths { paths: Vec::new() },
             test_spec_config: TestSpecConfig::default(),
         };
diff --git a/fluxon_rs/fluxon_kv/src/memholder/memholder_test.rs b/fluxon_rs/fluxon_kv/src/memholder/memholder_test.rs
index 83e29de..7bc7a70 100644
--- a/fluxon_rs/fluxon_kv/src/memholder/memholder_test.rs
+++ b/fluxon_rs/fluxon_kv/src/memholder/memholder_test.rs
@@ -92,8 +92,7 @@ fn new_client_config_with_size(
             enable_transfer_rpc_fast_path: true,
             sub_cluster: None,
         },
-        shared_memory_path: format!("/tmp/kvcache_shared_memory/{}", instance_key),
-        shared_file_path: format!("/tmp/kvcache_shared_files/{}", instance_key),
+        share_mem_path: format!("/tmp/kvcache_shared_memory/{}", instance_key),
         large_file_paths: crate::config::LargeFilePaths {
             paths: vec![format!("/tmp/kvcache_large/{}", instance_key)],
         },
@@ -128,8 +127,7 @@ fn new_zero_contribution_client_config(
             enable_transfer_rpc_fast_path: false,
             sub_cluster: None,
         },
-        shared_memory_path: format!("/tmp/kvcache_shared_memory/{}", owner_instance_key),
-        shared_file_path: format!("/tmp/kvcache_shared_files/{}", owner_instance_key),
+        share_mem_path: format!("/tmp/kvcache_shared_memory/{}", owner_instance_key),
         large_file_paths: crate::config::LargeFilePaths { paths: Vec::new() },
         test_spec_config: TestSpecConfig::default(),
     }
@@ -419,7 +417,7 @@ pub mod test_memholder {
         sleep(Duration::from_secs(2)).await;
 
         let owner_name = "pin_owner";
-        // 第二个 owner 必须使用不同的 member key（也会带来不同的 shared_memory_path）
+        // The second owner must use a different member key (which also results in a different share_mem_path)
         let owner2_name = "pin_owner2";
         let (owner, _) = run_client(ConfigArg::Config(new_client_config_with_size(
             owner_name,
diff --git a/fluxon_rs/fluxon_pyo3/src/lib.rs b/fluxon_rs/fluxon_pyo3/src/lib.rs
index b29a083..a73591f 100644
--- a/fluxon_rs/fluxon_pyo3/src/lib.rs
+++ b/fluxon_rs/fluxon_pyo3/src/lib.rs
@@ -2759,18 +2759,30 @@ impl KvClient {
         inner_new(config_yaml, py).into_py_object(py)
     }
 
-    /// Return the logs directory for MQ-related components.
+    /// Return the logs directory for third-party Python components.
     ///
-    /// For the fluxon unified backend, this is derived from the
-    /// client's shared_memory_path and cluster_name:
-    ///   {shared_memory_path}/{cluster_name}_cluster_mq_logs
-    fn logs_dir(&self, py: Python) -> PyObject {
-        fn logs_dir_inner(client: &KvClient, py: Python) -> ApiResult<PyObject> {
-            let base = PathBuf::from(&client.config.shared_memory_path);
-            let dir = base.join(format!("{}_cluster_mq_logs", client.config.cluster_name));
+    /// For the fluxon unified backend, this is derived from the owner's
+    /// `large_file_paths` and `cluster_name`:
+    ///   {large_file_paths[0]}/{cluster_name}_cluster_third_party_logs
+    fn third_party_logs_dir(&self, py: Python) -> PyObject {
+        fn third_party_logs_dir_inner(client: &KvClient, py: Python) -> ApiResult<PyObject> {
+            let dir = match client
+                .config
+                .large_file_paths
+                .third_party_logs_dir(&client.config.cluster_name)
+            {
+                Ok(dir) => dir,
+                Err(e) => {
+                    return ApiResult::new_error(crate::error::py_error_from_kv_error(
+                        py,
+                        &e,
+                        "third_party_logs_dir failed",
+                    ));
+                }
+            };
             ApiResult::new_success(dir.to_string_lossy().into_owned().into_py(py))
         }
-        logs_dir_inner(self, py).into_py_object(py)
+        third_party_logs_dir_inner(self, py).into_py_object(py)
     }
 
     /// Return raw etcd addresses (host:port) used by this client.
diff --git a/fluxon_test_stack/benchmark_full_matrix.yaml b/fluxon_test_stack/benchmark_full_matrix.yaml
index ffa1f2b..eaf0fbe 100644
--- a/fluxon_test_stack/benchmark_full_matrix.yaml
+++ b/fluxon_test_stack/benchmark_full_matrix.yaml
@@ -318,7 +318,7 @@ profiles:
               disable_prefix_index: true
             fluxonkv_spec:
               cluster_name: __STACK_CLUSTER_NAME__
-              shared_memory_path: __STACK_SHARED_MEMORY_PATH__
+              share_mem_path: __STACK_SHARE_MEM_PATH__
           mq_base:
             capacity: 40
             ttl_seconds: 90
diff --git a/fluxon_test_stack/ci_test_list.yaml b/fluxon_test_stack/ci_test_list.yaml
index 9ebfa1c..4230559 100644
--- a/fluxon_test_stack/ci_test_list.yaml
+++ b/fluxon_test_stack/ci_test_list.yaml
@@ -439,7 +439,7 @@ profiles:
               # Self-host benchmark nodes are launched by the host-side deployer, not inside a
               # container with /hostworkdir mounted. Use the real host path so both infra44/46
               # benchmark nodes can open the same self-host shared-memory root directly.
-              shared_memory_path: __STACK_SHARED_MEMORY_PATH__
+              share_mem_path: __STACK_SHARE_MEM_PATH__
           mq_base:
             capacity: 40
             ttl_seconds: 90
diff --git a/fluxon_test_stack/deployconf_testbed.yml b/fluxon_test_stack/deployconf_testbed.yml
index 0a74ed4..4015beb 100644
--- a/fluxon_test_stack/deployconf_testbed.yml
+++ b/fluxon_test_stack/deployconf_testbed.yml
@@ -102,9 +102,7 @@ global_envs:
 
   FLUXON_CLUSTER_NAME: "fluxon_testbed"
   FLUXON_SHARED_MEM: "${HOSTWORKDIR}/shm1"
-  FLUXON_SHARED_FILE: "${HOSTWORKDIR}/shm1_files"
-  # Test-stack benchmark nodes use FLUXON_SHARED_MEM for mmap.file roots and
-  # FLUXON_SHARED_MEM2 as the shared-file/log root. Keep both under the current
+  # Test-stack benchmark nodes use explicit shared bundle roots under the current
   # hostworkdir so benchmarks do not bleed into fluxon4 paths.
   FLUXON_SHARED_MEM2: "${HOSTWORKDIR}/shm2_files"
   FLUXON_PPROF_DURATION_SECONDS: ""
@@ -335,7 +333,7 @@ service:
 
       WORKDIR="${FLUXON_SHARED_MEM}/owner_work_${NODE_ID}"
       CONFIG_PATH="${WORKDIR}/all_config.yaml"
-      mkdir -p "${WORKDIR}" "${FLUXON_SHARED_FILE}"
+      mkdir -p "${WORKDIR}"
       cat > "${CONFIG_PATH}" <<YAML
       instance_key: "owner_${NODE_ID}"
       contribute_to_cluster_pool_size:
@@ -347,8 +345,7 @@ service:
         etcd_addresses:
         - "${ETCD_FULL_ADDRESS}"
         cluster_name: "${FLUXON_CLUSTER_NAME}"
-        shared_memory_path: "${FLUXON_SHARED_MEM}"
-        shared_file_path: "${FLUXON_SHARED_FILE}"
+        share_mem_path: "${FLUXON_SHARED_MEM}"
         large_file_paths:
         - "${HOSTWORKDIR}/large/owner_${NODE_ID}"
         sub_cluster: "owner"
@@ -369,7 +366,7 @@ service:
 
       cd "${FLUXON_SRC_ROOT}/fluxon_py/fluxon_fs"
       WORKDIR="${HOSTWORKDIR}/fluxon_fs/master"
-      mkdir -p "${WORKDIR}" "${FLUXON_SHARED_MEM}" "${FLUXON_SHARED_FILE}" "${HOSTWORKDIR}/fluxon_release"
+      mkdir -p "${WORKDIR}" "${FLUXON_SHARED_MEM}" "${HOSTWORKDIR}/fluxon_release"
       # English note:
       # - fluxon_fs master CLI resolves relative --config / --workdir against the installed module path.
       # - Pass explicit WORKDIR-anchored absolute paths here so startup never depends on cwd.
@@ -380,8 +377,7 @@ service:
         instance_key: "fluxon_fs_master"
         fluxonkv_spec:
           cluster_name: "${FLUXON_CLUSTER_NAME}"
-          shared_memory_path: "${FLUXON_SHARED_MEM}"
-          shared_file_path: "${FLUXON_SHARED_FILE}"
+          share_mem_path: "${FLUXON_SHARED_MEM}"
       fluxon_fs:
         master:
           instance_key: "fluxon_fs_master"
@@ -448,7 +444,7 @@ service:
 
       cd "${FLUXON_SRC_ROOT}/fluxon_py/fluxon_fs"
       WORKDIR="${HOSTWORKDIR}/fluxon_fs/agent_${NODE_ID}"
-      mkdir -p "${WORKDIR}" "${FLUXON_SHARED_MEM}" "${FLUXON_SHARED_FILE}" "${HOSTWORKDIR}/fluxon_release"
+      mkdir -p "${WORKDIR}" "${FLUXON_SHARED_MEM}" "${HOSTWORKDIR}/fluxon_release"
       # English note:
       # - fluxon_fs agent passes --config as a relative path; keep YAML generation in WORKDIR
       #   so future chdir changes do not silently pick up stale configs.
@@ -481,8 +477,7 @@ service:
         instance_key: "fluxon_fs_agent_${NODE_ID}"
         fluxonkv_spec:
           cluster_name: "${FLUXON_CLUSTER_NAME}"
-          shared_memory_path: "${FLUXON_SHARED_MEM}"
-          shared_file_path: "${FLUXON_SHARED_FILE}"
+          share_mem_path: "${FLUXON_SHARED_MEM}"
       fluxon_fs:
         master:
           instance_key: "fluxon_fs_master"
@@ -515,7 +510,7 @@ service:
       eval "${FLUXON_RELEASE_WHEEL_FETCH_CMD}"
 
       WORKDIR="${HOSTWORKDIR}/ops_agent/${NODE_ID}"
-      mkdir -p "${WORKDIR}" "${FLUXON_SHARED_MEM}" "${FLUXON_SHARED_FILE}"
+      mkdir -p "${WORKDIR}" "${FLUXON_SHARED_MEM}"
 
       OPS_AGENT_INSTANCE_KEY="fluxon_ops_${NODE_ID}"
       case "${NODE_ID}" in
@@ -537,8 +532,7 @@ service:
         pprof_duration_seconds: 60
         fluxonkv_spec:
           cluster_name: "${FLUXON_CLUSTER_NAME}"
-          shared_memory_path: "${FLUXON_SHARED_MEM}"
-          shared_file_path: "${FLUXON_SHARED_FILE}"
+          share_mem_path: "${FLUXON_SHARED_MEM}"
           p2p_listen_port: ${OPS_AGENT_P2P_LISTEN_PORT}
       controller_instance_key: "${FLUXON_OPS_CONTROLLER_INSTANCE_KEY}"
       hostworkdir: "${HOSTWORKDIR}"
@@ -560,7 +554,7 @@ service:
       eval "${FLUXON_RELEASE_WHEEL_FETCH_CMD}"
 
       WORKDIR="${HOSTWORKDIR}/ops_controller"
-      mkdir -p "${WORKDIR}" "${FLUXON_SHARED_MEM}" "${FLUXON_SHARED_FILE}"
+      mkdir -p "${WORKDIR}" "${FLUXON_SHARED_MEM}"
 
       cat > "${WORKDIR}/ops_controller.yaml" <<YAML
       ops_controller:
@@ -569,8 +563,7 @@ service:
           pprof_duration_seconds: 60
           fluxonkv_spec:
             cluster_name: "${FLUXON_CLUSTER_NAME}"
-            shared_memory_path: "${FLUXON_SHARED_MEM}"
-            shared_file_path: "${FLUXON_SHARED_FILE}"
+            share_mem_path: "${FLUXON_SHARED_MEM}"
             p2p_listen_port: 12102
         panel:
           max_body_bytes: 1073741824
@@ -616,8 +609,7 @@ service:
         instance_key: mpmc_demo_producer_base
         fluxonkv_spec:
           cluster_name: "${FLUXON_CLUSTER_NAME}"
-          shared_memory_path: "${FLUXON_SHARED_MEM}"
-          shared_file_path: "${HOSTWORKDIR}/mpmc_demo/shared_file_producer_${NODE_ID}"
+          share_mem_path: "${FLUXON_SHARED_MEM}"
       mpmc_demo:
         key: demo_mpmc
         capacity: 20
@@ -685,8 +677,7 @@ service:
         instance_key: mpmc_demo_consumer_base
         fluxonkv_spec:
           cluster_name: "${FLUXON_CLUSTER_NAME}"
-          shared_memory_path: "${FLUXON_SHARED_MEM}"
-          shared_file_path: "${HOSTWORKDIR}/mpmc_demo/shared_file_consumer_${NODE_ID}"
+          share_mem_path: "${FLUXON_SHARED_MEM}"
       mpmc_demo:
         key: demo_mpmc
         capacity: 20
diff --git a/fluxon_test_stack/test_runner.py b/fluxon_test_stack/test_runner.py
index fee4313..2236be5 100644
--- a/fluxon_test_stack/test_runner.py
+++ b/fluxon_test_stack/test_runner.py
@@ -1333,26 +1333,16 @@ def _load_source_stack_contract() -> Dict[str, Any]:
         global_envs.get("FLUXON_CLUSTER_NAME"),
         "bootstrap source deployconf.global_envs.FLUXON_CLUSTER_NAME",
     )
-    shared_memory_hostworkdir = _require_str(
+    share_mem_hostworkdir = _require_str(
         global_envs.get("FLUXON_SHARED_MEM"),
         "bootstrap source deployconf.global_envs.FLUXON_SHARED_MEM",
     )
-    shared_file_hostworkdir = _require_str(
-        global_envs.get("FLUXON_SHARED_MEM2"),
-        "bootstrap source deployconf.global_envs.FLUXON_SHARED_MEM2",
-    )
     _resolve_stack_contract_path(
         contract_hostworkdir,
-        shared_memory_hostworkdir,
+        share_mem_hostworkdir,
         field_name="bootstrap source deployconf.global_envs.FLUXON_SHARED_MEM",
         allow_absolute=True,
     )
-    _resolve_stack_contract_path(
-        contract_hostworkdir,
-        shared_file_hostworkdir,
-        field_name="bootstrap source deployconf.global_envs.FLUXON_SHARED_MEM2",
-        allow_absolute=False,
-    )
 
     source_bootstrap_cfg_path = _load_test_bed_bootstrap_config_path()
     source_bootstrap_cfg = _require_dict(
@@ -1387,8 +1377,7 @@ def _load_source_stack_contract() -> Dict[str, Any]:
         # - /r/fs_s3/* proxy for downloading release artifacts
         "ops_controller_url": controller_url,
         "controller_basic_auth": controller_basic_auth,
-        "shared_memory_hostworkdir": shared_memory_hostworkdir,
-        "shared_file_hostworkdir": shared_file_hostworkdir,
+        "share_mem_hostworkdir": share_mem_hostworkdir,
     }
 
 
@@ -1397,8 +1386,7 @@ def _write_ci_runtime_test_config(
     src_root: Path,
     etcd_address: str,
     cluster_name: str,
-    shared_memory_path: str,
-    shared_file_path: str,
+    share_mem_path: str,
 ) -> Path:
     """Materialize the single CI test authority consumed by fluxon_py integration tests.
 
@@ -1417,8 +1405,7 @@ def _write_ci_runtime_test_config(
             "kv_svc_type": "fluxon",
             "etcd_address": str(etcd_address),
             "cluster_name": str(cluster_name),
-            "shared_memory_path": str(shared_memory_path),
-            "shared_file_path": str(shared_file_path),
+            "share_mem_path": str(share_mem_path),
         },
     )
     return test_cfg_path
@@ -2048,21 +2035,16 @@ def _cluster_scoped_shared_dir(*, root_path: str, cluster_name: str) -> Path:
 
 def _shared_bundle_paths_for_cluster(
     *,
-    shared_memory_root: str,
-    shared_file_root: str,
+    share_mem_root: str,
     cluster_name: str,
 ) -> List[Path]:
-    shared_memory_dir = _cluster_scoped_shared_dir(
-        root_path=shared_memory_root,
-        cluster_name=cluster_name,
-    )
-    shared_file_dir = _cluster_scoped_shared_dir(
-        root_path=shared_file_root,
+    share_mem_dir = _cluster_scoped_shared_dir(
+        root_path=share_mem_root,
         cluster_name=cluster_name,
     )
     return [
-        shared_file_dir / "shared.json",
-        shared_memory_dir / "mmap.file",
+        share_mem_dir / "shared.json",
+        share_mem_dir / "mmap.file",
     ]
 
 
@@ -2076,35 +2058,28 @@ def _owner_target_slug(*, owner_target: str, ctx: str) -> str:
 
 def _owner_bundle_roots_for_target(
     *,
-    shared_memory_root: str,
-    shared_file_root: str,
+    share_mem_root: str,
     owner_target: str,
     ctx: str,
-) -> Tuple[str, str]:
+) -> str:
     owner_slug = _owner_target_slug(owner_target=owner_target, ctx=ctx)
-    return (
-        str((Path(shared_memory_root) / owner_slug).resolve()),
-        str((Path(shared_file_root) / owner_slug).resolve()),
-    )
+    return str((Path(share_mem_root) / owner_slug).resolve())
 
 
 def _owner_bundle_paths_for_target(
     *,
-    shared_memory_root: str,
-    shared_file_root: str,
+    share_mem_root: str,
     cluster_name: str,
     owner_target: str,
     ctx: str,
 ) -> List[Path]:
-    owner_shared_memory_root, owner_shared_file_root = _owner_bundle_roots_for_target(
-        shared_memory_root=shared_memory_root,
-        shared_file_root=shared_file_root,
+    owner_share_mem_root = _owner_bundle_roots_for_target(
+        share_mem_root=share_mem_root,
         owner_target=owner_target,
         ctx=ctx,
     )
     return _shared_bundle_paths_for_cluster(
-        shared_memory_root=owner_shared_memory_root,
-        shared_file_root=owner_shared_file_root,
+        share_mem_root=owner_share_mem_root,
         cluster_name=cluster_name,
     )
 
@@ -2220,7 +2195,7 @@ def _require_explicit_owner_group_processes_for_multi_owner_same_machine(
     raise ValueError(
         f"{ctx}.benchmark.owner_group_processes is required when external Fluxon KV owners share a machine: "
         f"machines={multi_owner_machines}. Without an explicit group size, benchmark nodes and owners "
-        "silently reuse the same shared_memory_path/shared_file_path roots, which invalidates owner binding."
+        "silently reuse the same share_mem_path roots, which invalidates owner binding."
     )
 
 
@@ -2233,13 +2208,9 @@ def _load_stack_identity(*, workdir_root: Path) -> Dict[str, Any]:
         contract.get("controller_basic_auth"),
         field_name="bootstrap_contract.controller_basic_auth",
     )
-    shared_mem_hostworkdir = _require_str(
-        contract.get("shared_memory_hostworkdir"),
-        "bootstrap_contract.shared_memory_hostworkdir",
-    )
-    shared_file_hostworkdir = _require_str(
-        contract.get("shared_file_hostworkdir"),
-        "bootstrap_contract.shared_file_hostworkdir",
+    share_mem_hostworkdir = _require_str(
+        contract.get("share_mem_hostworkdir"),
+        "bootstrap_contract.share_mem_hostworkdir",
     )
     cluster_name = _suite_cluster_name_for_workdir(workdir_root)
     if cluster_name == ops_cluster_name:
@@ -2254,18 +2225,12 @@ def _load_stack_identity(*, workdir_root: Path) -> Dict[str, Any]:
         "cluster_name": cluster_name,
         "controller_url": ops_controller_url,
         "controller_basic_auth": controller_basic_auth,
-        "shared_memory_path": _resolve_stack_contract_path(
+        "share_mem_path": _resolve_stack_contract_path(
             hostworkdir,
-            shared_mem_hostworkdir,
-            field_name="bootstrap_contract.shared_memory_hostworkdir",
+            share_mem_hostworkdir,
+            field_name="bootstrap_contract.share_mem_hostworkdir",
             allow_absolute=True,
         ),
-        "shared_file_path": _resolve_stack_contract_path(
-            hostworkdir,
-            shared_file_hostworkdir,
-            field_name="bootstrap_contract.shared_file_hostworkdir",
-            allow_absolute=False,
-        ),
     }
 
 
@@ -2295,13 +2260,9 @@ def _build_runtime_token_mapping(
             stack_identity.get("controller_url"),
             "stack_identity.controller_url",
         ),
-        "__STACK_SHARED_MEMORY_PATH__": _require_str(
-            stack_identity.get("shared_memory_path"),
-            "stack_identity.shared_memory_path",
-        ),
-        "__STACK_SHARED_FILE_PATH__": _require_str(
-            stack_identity.get("shared_file_path"),
-            "stack_identity.shared_file_path",
+        "__STACK_SHARE_MEM_PATH__": _require_str(
+            stack_identity.get("share_mem_path"),
+            "stack_identity.share_mem_path",
         ),
     }
     if extra_tokens is not None:
@@ -3691,30 +3652,19 @@ def _resolved_run_dir_path(resolved_case: Dict[str, Any]) -> Path:
     return Path(_require_str(runtime.get("run_dir"), "runtime.run_dir")).resolve()
 
 
-def _ci_shared_memory_path(resolved_case: Dict[str, Any], *, run_dir: Path) -> str:
+def _ci_share_mem_path(resolved_case: Dict[str, Any], *, run_dir: Path) -> str:
     runtime = _require_dict(resolved_case.get("runtime"), "resolved_case.runtime")
     stack_identity = _require_dict(runtime.get("stack_identity"), "resolved_case.runtime.stack_identity")
-    shared_memory_root = _require_str(
-        stack_identity.get("shared_memory_path"),
-        "resolved_case.runtime.stack_identity.shared_memory_path",
+    share_mem_root = _require_str(
+        stack_identity.get("share_mem_path"),
+        "resolved_case.runtime.stack_identity.share_mem_path",
     )
     # English note:
-    # - iceoryx2 uses shared_memory_path as a base for per-node paths (e.g. .../nodes/<id>/iox2_<hash>/.service_tag).
+    # - iceoryx2 uses share_mem_path as a base for per-node paths (e.g. .../nodes/<id>/iox2_<hash>/.service_tag).
     # - The per-node suffix can be long, and some filesystems enforce a max path length of 255 bytes.
-    # - Therefore shared_memory_path must be short and must not embed run_dir (which can be deep under repo/workdir).
-    token = hashlib.sha256(str(run_dir.resolve()).encode("utf-8")).hexdigest()[:16]
-    return str((Path(shared_memory_root) / "ci" / token).resolve())
-
-
-def _ci_shared_file_path(resolved_case: Dict[str, Any], *, run_dir: Path) -> str:
-    runtime = _require_dict(resolved_case.get("runtime"), "resolved_case.runtime")
-    stack_identity = _require_dict(runtime.get("stack_identity"), "resolved_case.runtime.stack_identity")
-    shared_file_root = _require_str(
-        stack_identity.get("shared_file_path"),
-        "resolved_case.runtime.stack_identity.shared_file_path",
-    )
+    # - Therefore share_mem_path must be short and must not embed run_dir (which can be deep under repo/workdir).
     token = hashlib.sha256(str(run_dir.resolve()).encode("utf-8")).hexdigest()[:16]
-    return str((Path(shared_file_root) / "ci" / token).resolve())
+    return str((Path(share_mem_root) / "ci" / token).resolve())
 
 
 def _ci_owner_shared_bundle_paths(run_dir: Path, *, owner_config_path: Path) -> List[Path]:
@@ -3727,14 +3677,9 @@ def _ci_owner_shared_bundle_paths(run_dir: Path, *, owner_config_path: Path) ->
         fluxonkv_spec.get("cluster_name"),
         "ci_owner_0.yaml.fluxonkv_spec.cluster_name",
     )
-    shm = _require_str(fluxonkv_spec.get("shared_memory_path"), "ci_owner_0.yaml.fluxonkv_spec.shared_memory_path")
-    shared_file = _require_str(
-        fluxonkv_spec.get("shared_file_path"),
-        "ci_owner_0.yaml.fluxonkv_spec.shared_file_path",
-    )
+    shm = _require_str(fluxonkv_spec.get("share_mem_path"), "ci_owner_0.yaml.fluxonkv_spec.share_mem_path")
     return _shared_bundle_paths_for_cluster(
-        shared_memory_root=shm,
-        shared_file_root=shared_file,
+        share_mem_root=shm,
         cluster_name=cluster_name,
     )
 
@@ -3749,7 +3694,7 @@ def _wait_ci_owner_shared_bundle_ready_and_stage_shared_json(
     timeout_s: int,
 ) -> None:
     # English note:
-    # - `shared_memory_path` is host-local. When owner_0 runs on a remote node, the runner host
+    # - `share_mem_path` is host-local. When owner_0 runs on a remote node, the runner host
     #   cannot see shared.json/mmap.file by filesystem path.
     # - CI execution already depends on the remote shared bundle being ready. Here we additionally
     #   fetch shared.json back to a stable local path for determinism and postmortem.
@@ -3770,8 +3715,7 @@ def _wait_ci_owner_shared_bundle_ready_and_stage_shared_json(
                     required_str_keys = (
                         "owner_id",
                         "cluster_name",
-                        "shared_memory_path",
-                        "shared_file_path",
+                        "share_mem_path",
                         "protocol_version",
                     )
                     for k in required_str_keys:
@@ -3791,17 +3735,11 @@ def _wait_ci_owner_shared_bundle_ready_and_stage_shared_json(
                             f"expected={_ci_cluster_name(resolved_case)!r}"
                         )
                     expected_shm_dir = str(mmap_file_path.parent.resolve())
-                    if meta.get("shared_memory_path") != expected_shm_dir:
+                    if meta.get("share_mem_path") != expected_shm_dir:
                         raise ValueError(
-                            f"shared.json shared_memory_path mismatch: shared={meta.get('shared_memory_path')!r} "
+                            f"shared.json share_mem_path mismatch: shared={meta.get('share_mem_path')!r} "
                             f"expected={expected_shm_dir!r}"
                         )
-                    expected_file_dir = str(shared_json_path.parent.resolve())
-                    if meta.get("shared_file_path") != expected_file_dir:
-                        raise ValueError(
-                            f"shared.json shared_file_path mismatch: shared={meta.get('shared_file_path')!r} "
-                            f"expected={expected_file_dir!r}"
-                        )
                 except Exception as exc:  # noqa: BLE001
                     last_err = f"{type(exc).__name__}: {exc}"
                 else:
@@ -8669,8 +8607,7 @@ def _build_test_stack_external_kv_owner_instances(
 
     stack_identity = _require_dict(runtime.get("stack_identity"), "runtime.stack_identity")
     cluster_name = _require_str(stack_identity.get("cluster_name"), "runtime.stack_identity.cluster_name")
-    shared_memory_root = _require_str(stack_identity.get("shared_memory_path"), "runtime.stack_identity.shared_memory_path")
-    shared_file_root = _require_str(stack_identity.get("shared_file_path"), "runtime.stack_identity.shared_file_path")
+    share_mem_root = _require_str(stack_identity.get("share_mem_path"), "runtime.stack_identity.share_mem_path")
     etcd_endpoints = _test_stack_etcd_addresses(resolved_case)
     master_port_offset = 0
     owner_instances: List[Dict[str, Any]] = []
@@ -8693,12 +8630,10 @@ def _build_test_stack_external_kv_owner_instances(
             raise ValueError(f"computed owner_p2p_listen_port out of range: {owner_p2p_listen_port}")
 
         if owner_group_processes is None:
-            owner_shared_memory_path = shared_memory_root
-            owner_shared_file_path = shared_file_root
+            owner_share_mem_path = share_mem_root
         else:
-            owner_shared_memory_path, owner_shared_file_path = _owner_bundle_roots_for_target(
-                shared_memory_root=shared_memory_root,
-                shared_file_root=shared_file_root,
+            owner_share_mem_path = _owner_bundle_roots_for_target(
+                share_mem_root=share_mem_root,
                 owner_target=target,
                 ctx="runtime.stack_identity owner bundle roots",
             )
@@ -8714,8 +8649,7 @@ def _build_test_stack_external_kv_owner_instances(
             "fluxonkv_spec": {
                 "etcd_addresses": list(etcd_endpoints),
                 "cluster_name": cluster_name,
-                "shared_memory_path": owner_shared_memory_path,
-                "shared_file_path": owner_shared_file_path,
+                "share_mem_path": owner_share_mem_path,
                 "large_file_paths": owner_large_file_paths,
                 "sub_cluster": FLUXON_KV_OWNER_SUB_CLUSTER,
                 "p2p_listen_port": int(owner_p2p_listen_port),
@@ -9233,21 +9167,16 @@ def _compile_test_stack_case(resolved_case: Dict[str, Any], *, run_index: int) -
     node_roles: List[str] = []
     node_overrides: List[Dict[str, Any]] = []
     stack_cluster_name: Optional[str] = None
-    stack_shared_memory_path: Optional[str] = None
-    stack_shared_file_path: Optional[str] = None
+    stack_share_mem_path: Optional[str] = None
     if backend_kind == TEST_STACK_BACKEND_FLUXON:
         stack_identity = _require_dict(runtime.get("stack_identity"), "runtime.stack_identity")
         stack_cluster_name = _require_str(
             stack_identity.get("cluster_name"),
             "runtime.stack_identity.cluster_name",
         )
-        stack_shared_memory_path = _require_str(
-            stack_identity.get("shared_memory_path"),
-            "runtime.stack_identity.shared_memory_path",
-        )
-        stack_shared_file_path = _require_str(
-            stack_identity.get("shared_file_path"),
-            "runtime.stack_identity.shared_file_path",
+        stack_share_mem_path = _require_str(
+            stack_identity.get("share_mem_path"),
+            "runtime.stack_identity.share_mem_path",
         )
 
     rc = _require_dict(ts_profile.get("runtime_config"), "profile.test_stack.runtime_config")
@@ -9947,8 +9876,7 @@ def _compile_test_stack_case(resolved_case: Dict[str, Any], *, run_index: int) -
                     # Benchmark nodes bootstrap from owner shared bundles. Strict dual-owner mode
                     # routes each process group to a different same-machine owner bundle root.
                     assert stack_cluster_name is not None
-                    assert stack_shared_memory_path is not None
-                    assert stack_shared_file_path is not None
+                    assert stack_share_mem_path is not None
                     selected_owner_target = _test_stack_owner_target_for_node_process(
                         target=target,
                         process_idx=process_idx,
@@ -9957,18 +9885,15 @@ def _compile_test_stack_case(resolved_case: Dict[str, Any], *, run_index: int) -
                         owner_group_processes=owner_group_processes,
                     )
                     if selected_owner_target is None:
-                        selected_shared_memory_path = stack_shared_memory_path
-                        selected_shared_file_path = stack_shared_file_path
+                        selected_share_mem_path = stack_share_mem_path
                     else:
-                        selected_shared_memory_path, selected_shared_file_path = _owner_bundle_roots_for_target(
-                            shared_memory_root=stack_shared_memory_path,
-                            shared_file_root=stack_shared_file_path,
+                        selected_share_mem_path = _owner_bundle_roots_for_target(
+                            share_mem_root=stack_share_mem_path,
                             owner_target=selected_owner_target,
                             ctx=f"strict dual-owner routing target={target} process_idx={process_idx}",
                         )
                     fluxonkv_override["cluster_name"] = stack_cluster_name
-                    fluxonkv_override["shared_memory_path"] = selected_shared_memory_path
-                    fluxonkv_override["shared_file_path"] = selected_shared_file_path
+                    fluxonkv_override["share_mem_path"] = selected_share_mem_path
                     fluxonkv_override["p2p_listen_port"] = int(kv_p2p_listen_port)
                     kv["fluxonkv_spec"] = fluxonkv_override
                 elif backend_kind == TEST_STACK_BACKEND_ALLUXIO:
@@ -13820,8 +13745,7 @@ def _ci_prepare_run_inputs(
     overlay_live_checkout: bool,
     etcd_address: str,
     cluster_name: str,
-    shared_memory_path: str,
-    shared_file_path: str,
+    share_mem_path: str,
 ) -> None:
     """Materialize CI run inputs from the case release into an isolated run_dir.
 
@@ -13896,8 +13820,7 @@ def _ci_prepare_run_inputs(
         src_root=src_root,
         etcd_address=etcd_address,
         cluster_name=cluster_name,
-        shared_memory_path=shared_memory_path,
-        shared_file_path=shared_file_path,
+        share_mem_path=share_mem_path,
     )
     release_link_path = src_root / "fluxon_release"
     _materialize_ci_runtime_release_view(
@@ -13963,7 +13886,12 @@ def _write_ci_scene_config_yaml(
 
 
 def _write_ci_master_owner_configs(
-    resolved_case: Dict[str, Any], *, run_dir: Path, cluster_name: str, share_mem_path: str, share_file_path: str, owner_dram_bytes: int
+    resolved_case: Dict[str, Any],
+    *,
+    run_dir: Path,
+    cluster_name: str,
+    share_mem_path: str,
+    owner_dram_bytes: int,
 ) -> tuple[Path, Path]:
     owner_work_root = run_dir / "services" / "owner_0"
     master_cfg = {
@@ -13992,8 +13920,7 @@ def _write_ci_master_owner_configs(
         "fluxonkv_spec": {
             "etcd_addresses": ["__ETCD__"],
             "cluster_name": cluster_name,
-            "shared_memory_path": share_mem_path,
-            "shared_file_path": share_file_path,
+            "share_mem_path": share_mem_path,
             # Shared testbed / CI owners keep p2p_listen_port implicit so the
             # runtime can bind a free host port, but owner mode still requires
             # explicit large-file roots.
@@ -14268,7 +14195,6 @@ def _write_ci_runner_script(
     run_dir: Path,
     src_root: Path,
     share_mem_path: str,
-    share_file_path: str,
 ) -> Path:
     commands = _resolved_ci_command_list(resolved_case)
     venv_python = run_dir / "venv" / "bin" / "python3"
@@ -14309,30 +14235,22 @@ def _write_ci_runner_script(
     readiness_probe_block = ""
     if requires_owner_shared_bundle:
         bundle_cluster_name = _ci_cluster_name(resolved_case)
-        bundle_shared_memory_dir = str(
-            _cluster_scoped_shared_dir(root_path=share_mem_path, cluster_name=bundle_cluster_name)
-        )
-        bundle_shared_file_dir = str(
-            _cluster_scoped_shared_dir(root_path=share_file_path, cluster_name=bundle_cluster_name)
-        )
+        bundle_dir = str(_cluster_scoped_shared_dir(root_path=share_mem_path, cluster_name=bundle_cluster_name))
         shared_bundle_block = f"""
 echo "[ci_runner] waiting for owner shared bundle..."
 deadline=$(( $(date +%s) + {CI_RUNNER_SHARED_BUNDLE_TIMEOUT_S} ))
-shm={bundle_shared_memory_dir}
-shared_file={bundle_shared_file_dir}
+share_mem={bundle_dir}
 while [ $(date +%s) -lt "$deadline" ]; do
-  if [ -f "$shared_file/shared.json" ] && [ -f "$shm/mmap.file" ]; then
+  if [ -f "$share_mem/shared.json" ] && [ -f "$share_mem/mmap.file" ]; then
     echo "[ci_runner] owner shared bundle ready"
     break
   fi
   sleep 1
 done
-if [ ! -f "$shared_file/shared.json" ] || [ ! -f "$shm/mmap.file" ]; then
+if [ ! -f "$share_mem/shared.json" ] || [ ! -f "$share_mem/mmap.file" ]; then
   echo "[ci_runner] ERROR: owner shared bundle not ready in {CI_RUNNER_SHARED_BUNDLE_TIMEOUT_S}s"
-  echo "[ci_runner] shm=$shm"
-  echo "[ci_runner] shared_file=$shared_file"
-  ls -la "$shm"
-  ls -la "$shared_file"
+  echo "[ci_runner] share_mem=$share_mem"
+  ls -la "$share_mem"
   fail_and_exit 2
 fi
 """
@@ -15043,13 +14961,9 @@ def _test_stack_external_owner_shared_bundle_paths(
         stack_identity.get("cluster_name"),
         "resolved_case.runtime.stack_identity.cluster_name",
     )
-    shared_memory_path = _require_str(
-        stack_identity.get("shared_memory_path"),
-        "resolved_case.runtime.stack_identity.shared_memory_path",
-    )
-    shared_file_path = _require_str(
-        stack_identity.get("shared_file_path"),
-        "resolved_case.runtime.stack_identity.shared_file_path",
+    share_mem_path = _require_str(
+        stack_identity.get("share_mem_path"),
+        "resolved_case.runtime.stack_identity.share_mem_path",
     )
     if owner_target is not None:
         scale = _require_dict(resolved_case.get("scale"), "resolved_case.scale")
@@ -15079,15 +14993,13 @@ def _test_stack_external_owner_shared_bundle_paths(
         )
         if owner_group_processes is not None:
             return _owner_bundle_paths_for_target(
-                shared_memory_root=shared_memory_path,
-                shared_file_root=shared_file_path,
+                share_mem_root=share_mem_path,
                 cluster_name=cluster_name,
                 owner_target=owner_target,
                 ctx="TEST_STACK owner shared bundle paths",
             )
     return _shared_bundle_paths_for_cluster(
-        shared_memory_root=shared_memory_path,
-        shared_file_root=shared_file_path,
+        share_mem_root=share_mem_path,
         cluster_name=cluster_name,
     )
 
diff --git a/fluxon_test_stack/test_runner_runtime_backend.py b/fluxon_test_stack/test_runner_runtime_backend.py
index bc46a76..14a85e4 100644
--- a/fluxon_test_stack/test_runner_runtime_backend.py
+++ b/fluxon_test_stack/test_runner_runtime_backend.py
@@ -64,10 +64,8 @@ def _prepare_ci_case(
     services_root = (run_dir / "services").resolve()
     services_root.mkdir(parents=True, exist_ok=True)
     (services_root / "share_mem").mkdir(parents=True, exist_ok=True)
-    share_mem_path = ctx._ci_shared_memory_path(resolved_case, run_dir=run_dir)
-    share_file_path = ctx._ci_shared_file_path(resolved_case, run_dir=run_dir)
+    share_mem_path = ctx._ci_share_mem_path(resolved_case, run_dir=run_dir)
     Path(share_mem_path).mkdir(parents=True, exist_ok=True)
-    Path(share_file_path).mkdir(parents=True, exist_ok=True)
 
     venv_python = ctx._create_ci_runtime_venv(run_dir=run_dir)
 
@@ -83,8 +81,7 @@ def _prepare_ci_case(
         overlay_live_checkout=True,
         etcd_address=f"{ctx._ci_base_runtime_service_target_ip(resolved_case, service_id='etcd')}:{ctx._ci_base_runtime_service_port(resolved_case, service_id='etcd')}",
         cluster_name=out_cluster_name,
-        shared_memory_path=share_mem_path,
-        shared_file_path=share_file_path,
+        share_mem_path=share_mem_path,
     )
 
     prepare_env_exports = ctx._run_ci_prepare_steps(
@@ -108,7 +105,6 @@ def _prepare_ci_case(
             run_dir=run_dir,
             cluster_name=out_cluster_name,
             share_mem_path=share_mem_path,
-            share_file_path=share_file_path,
             owner_dram_bytes=owner_dram_bytes,
         )
     _ = ctx._write_ci_runner_script(
@@ -116,7 +112,6 @@ def _prepare_ci_case(
         run_dir=run_dir,
         src_root=src_root,
         share_mem_path=share_mem_path,
-        share_file_path=share_file_path,
     )
     ci_runner_exit_code_path = (run_dir / "logs" / "ci_runner" / "exit_code.txt").resolve()
     ci_runner_exit_code_baseline = ctx._observe_file_state(ci_runner_exit_code_path)
@@ -196,8 +191,7 @@ def _prepare_test_stack_case(
         "resolved_case.profile.test_stack.kind",
     )
     owner_instance_ids: List[str] = []
-    shared_memory_path: Optional[str] = None
-    shared_file_path: Optional[str] = None
+    share_mem_path: Optional[str] = None
     stack_cluster_name: Optional[str] = None
     if ctx._test_stack_backend_uses_dedicated_kv_owners(backend_kind=backend_kind, mode=mode):
         runtime = ctx._require_dict(resolved_case.get("runtime"), "resolved_case.runtime")
@@ -216,13 +210,9 @@ def _prepare_test_stack_case(
                 stack_identity.get("cluster_name"),
                 "runtime.stack_identity.cluster_name",
             )
-            shared_memory_path = ctx._require_str(
-                stack_identity.get("shared_memory_path"),
-                "runtime.stack_identity.shared_memory_path",
-            )
-            shared_file_path = ctx._require_str(
-                stack_identity.get("shared_file_path"),
-                "runtime.stack_identity.shared_file_path",
+            share_mem_path = ctx._require_str(
+                stack_identity.get("share_mem_path"),
+                "runtime.stack_identity.share_mem_path",
             )
             ctx._converge_test_stack_external_owner_shared_bundle_cleanup(
                 resolved_case,
@@ -302,7 +292,7 @@ def _prepare_test_stack_case(
         ctx="TEST_STACK prepare",
     )
     if ctx._test_stack_backend_uses_external_fluxon_kv(backend_kind=backend_kind, mode=mode):
-        if shared_memory_path is None or shared_file_path is None or stack_cluster_name is None:
+        if share_mem_path is None or stack_cluster_name is None:
             raise ValueError(
                 "internal error: TEST_STACK shared bundle identity is missing after pre-deploy cleanup"
             )
diff --git a/fluxon_test_stack/tests/test_test_runner_testbed_contract.py b/fluxon_test_stack/tests/test_test_runner_testbed_contract.py
index 8dbd5e4..86f41cb 100644
--- a/fluxon_test_stack/tests/test_test_runner_testbed_contract.py
+++ b/fluxon_test_stack/tests/test_test_runner_testbed_contract.py
@@ -58,7 +58,6 @@ def test_write_ci_master_owner_configs_emits_owner_large_file_paths(self) -> Non
                         run_dir=run_dir,
                         cluster_name="ci_cluster",
                         share_mem_path="/tmp/ci_shm",
-                        share_file_path="/tmp/ci_share",
                         owner_dram_bytes=1073741824,
                     )
 
@@ -67,6 +66,7 @@ def test_write_ci_master_owner_configs_emits_owner_large_file_paths(self) -> Non
                 owner_cfg["fluxonkv_spec"]["large_file_paths"],
                 [str((run_dir / "services" / "owner_0" / "large").resolve())],
             )
+            self.assertNotIn("shared_file_path", owner_cfg["fluxonkv_spec"])
 
     def test_ci_runtime_python_executable_requires_python310_on_path(self) -> None:
         with mock.patch.object(_RUNNER.shutil, "which", return_value=None):
@@ -255,8 +255,7 @@ def test_generated_test_stack_owner_config_emits_large_file_paths(self) -> None:
                     "run_dir": str(run_dir),
                     "stack_identity": {
                         "cluster_name": "bench_cluster",
-                        "shared_memory_path": "/tmp/bench_shm",
-                        "shared_file_path": "/tmp/bench_share",
+                        "share_mem_path": "/tmp/bench_shm",
                     },
                 }
             }
@@ -385,8 +384,7 @@ def test_ci_prepare_run_inputs_rebuilds_release_view_without_reusing_source_test
                         "kv_svc_type: fluxon",
                         "etcd_address: 127.0.0.1:2379",
                         "cluster_name: fluxon-example-cluster",
-                        "shared_memory_path: /tmp/fluxon-example-cluster/shm",
-                        "shared_file_path: /tmp/fluxon-example-cluster/share",
+                        "share_mem_path: /tmp/fluxon-example-cluster/shm",
                         "",
                     ]
                 ),
@@ -520,8 +518,7 @@ def test_ci_prepare_run_inputs_rebuilds_release_view_without_reusing_source_test
                             overlay_live_checkout=False,
                             etcd_address="127.0.0.1:32579",
                             cluster_name="ci_case_cluster",
-                            shared_memory_path="/tmp/ci_case_cluster/shm",
-                            shared_file_path="/tmp/ci_case_cluster/share",
+                            share_mem_path="/tmp/ci_case_cluster/shm",
                         )
 
             release_view_root = src_root / "fluxon_release"
@@ -540,8 +537,7 @@ def test_ci_prepare_run_inputs_rebuilds_release_view_without_reusing_source_test
                     "kv_svc_type": "fluxon",
                     "etcd_address": "127.0.0.1:32579",
                     "cluster_name": "ci_case_cluster",
-                    "shared_memory_path": "/tmp/ci_case_cluster/shm",
-                    "shared_file_path": "/tmp/ci_case_cluster/share",
+                    "share_mem_path": "/tmp/ci_case_cluster/shm",
                 },
             )
             assert_python_abi.assert_called_once_with(venv_python=venv_python)
@@ -625,8 +621,7 @@ def test_ci_runner_script_sources_prepare_env_when_present(self) -> None:
                         "ops_cluster_name": "fluxon_testbed",
                         "cluster_name": "fluxon_testbed",
                         "controller_url": "http://127.0.0.1:19080/r/ops/fluxon_testbed",
-                        "shared_memory_path": "/tmp/shm",
-                        "shared_file_path": "/tmp/share",
+                        "share_mem_path": "/tmp/shm",
                     },
                     "deploy_instances": {
                         "case_runtime": [
@@ -650,7 +645,6 @@ def test_ci_runner_script_sources_prepare_env_when_present(self) -> None:
                     run_dir=run_dir,
                     src_root=src_root,
                     share_mem_path="/tmp/shm",
-                    share_file_path="/tmp/share",
                 )
             script_text = script_path.read_text(encoding="utf-8")
             self.assertIn('prepare_env_path="', script_text)
@@ -875,8 +869,9 @@ def test_load_source_stack_contract_accepts_same_host_dual_local_hostworkdirs(se
                 contract["ops_controller_url"],
                 "http://127.0.0.1:19080/r/ops/fluxon_testbed",
             )
-            self.assertEqual(contract["shared_memory_hostworkdir"], "${HOSTWORKDIR}/shm1")
-            self.assertEqual(contract["shared_file_hostworkdir"], "${HOSTWORKDIR}/shm2_files")
+            self.assertEqual(contract["share_mem_hostworkdir"], "${HOSTWORKDIR}/shm1")
+            self.assertNotIn("shared_memory_hostworkdir", contract)
+            self.assertNotIn("shared_file_hostworkdir", contract)
 
     def test_load_source_stack_contract_rejects_multi_hostworkdir_remote_layout(self) -> None:
         with tempfile.TemporaryDirectory() as td:
@@ -1044,8 +1039,7 @@ def test_write_deployer_manifests_renders_payload_wrapper_from_template(self) ->
                     "stack_identity": {
                         "cluster_name": "fluxon_testbed",
                         "controller_url": "http://127.0.0.1:19080/r/ops/fluxon_testbed",
-                        "shared_memory_path": "/tmp/shm",
-                        "shared_file_path": "/tmp/share",
+                        "share_mem_path": "/tmp/shm",
                     },
                 },
                 "artifact_set": {
diff --git a/setup_and_pack/utils/repo_config_utils.py b/setup_and_pack/utils/repo_config_utils.py
index 46f4686..ca51703 100644
--- a/setup_and_pack/utils/repo_config_utils.py
+++ b/setup_and_pack/utils/repo_config_utils.py
@@ -9,8 +9,7 @@
 from deployment.utils.deployconf_config_utils import (
     load_deployconf_etcd_address,
     load_deployconf_fluxon_cluster_name,
-    load_deployconf_fluxon_shared_file_path,
-    load_deployconf_fluxon_shared_memory_path,
+    load_deployconf_fluxon_share_mem_path,
     load_deployconf_mapping,
     load_deployconf_prom_remote_write_url,
     load_deployconf_prometheus_base_url,
@@ -35,16 +34,14 @@
     "load_test_kv_svc_type_from_test_config",
     "load_test_etcd_address_from_test_config",
     "load_test_fluxon_cluster_name_from_test_config",
-    "load_test_fluxon_shared_memory_path_from_test_config",
-    "load_test_fluxon_shared_file_path_from_test_config",
+    "load_test_fluxon_share_mem_path_from_test_config",
     "load_deployconf_mapping",
     "load_deployconf_resolved_global_envs",
     "load_deployconf_etcd_address",
     "load_deployconf_prometheus_base_url",
     "load_deployconf_prom_remote_write_url",
     "load_deployconf_fluxon_cluster_name",
-    "load_deployconf_fluxon_shared_memory_path",
-    "load_deployconf_fluxon_shared_file_path",
+    "load_deployconf_fluxon_share_mem_path",
     "load_deployconf_service_ip_port",
 ]
 
@@ -375,19 +372,10 @@ def load_test_fluxon_cluster_name_from_test_config(*, config_path: Optional[Path
     return raw.strip()
 
 
-def load_test_fluxon_shared_memory_path_from_test_config(*, config_path: Optional[Path] = None) -> str:
-    """Load Fluxon shared-memory root from test_config.yaml as the single test authority."""
+def load_test_fluxon_share_mem_path_from_test_config(*, config_path: Optional[Path] = None) -> str:
+    """Load Fluxon shared bundle root from test_config.yaml as the single test authority."""
     test_cfg = load_test_config_mapping(config_path=config_path)
-    raw = test_cfg.get("shared_memory_path")
+    raw = test_cfg.get("share_mem_path")
     if not isinstance(raw, str) or not raw.strip():
-        raise ValueError("test_config.yaml must define non-empty shared_memory_path")
-    return raw.strip()
-
-
-def load_test_fluxon_shared_file_path_from_test_config(*, config_path: Optional[Path] = None) -> str:
-    """Load Fluxon shared-file root from test_config.yaml as the single test authority."""
-    test_cfg = load_test_config_mapping(config_path=config_path)
-    raw = test_cfg.get("shared_file_path")
-    if not isinstance(raw, str) or not raw.strip():
-        raise ValueError("test_config.yaml must define non-empty shared_file_path")
+        raise ValueError("test_config.yaml must define non-empty share_mem_path")
     return raw.strip()