cheetahclaws/context.py at main · SafeRL-Lab/cheetahclaws · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
"""System context: CLAUDE.md, git info, cwd injection.

Prompt assembly pipeline:

    build_system_prompt(config) -> str
        = pick_base_prompt(provider, model)      # default.md + matched overlay
        + _render_env_block(config)              # date / cwd / platform / git / CLAUDE.md
        + memory index (if any)
        + tmux fragment (if tmux available)      # prompts/fragments/tmux.md
        + plan mode fragment (if plan active)    # prompts/fragments/plan.md

Base + overlay design lives under ``prompts/`` — see ``prompts/README.md``.
Base/overlay files contain no placeholders and are loaded verbatim.
Dynamic per-run data (date, cwd, CLAUDE.md, plan file path) is rendered
separately and appended.

Callers outside this module should only touch ``build_system_prompt``.
The helper functions (``get_git_info``, ``get_claude_md``,
``get_platform_hints``) are exposed for tests and for REPL commands
that want to show individual context blocks (e.g. ``/doctor``).
"""
from __future__ import annotations

import os
import re
import subprocess
import threading
import time
from pathlib import Path
from datetime import datetime

from memory import get_memory_context
from prompts import pick_base_prompt, load_fragment


# Short-TTL caches: each turn rebuilds the system prompt, and shelling out to
# git + re-reading CLAUDE.md every turn is a measurable chunk of latency in
# long REPL sessions. Numbers are deliberately conservative.
_GIT_CACHE_TTL = 30.0   # seconds — long enough to span a tool batch
_CLAUDE_MD_TTL = 10.0   # seconds — short so user edits to CLAUDE.md show up quickly

_git_cache: tuple[float, str, str] | None = None   # (expiry, cwd, value)
_claude_md_cache: tuple[float, str, str] | None = None
_cache_lock = threading.Lock()

# ── Prompt injection detection ───────────────────────────────────────────
_THREAT_PATTERNS = [
    re.compile(r'ignore\s+(previous|all|above|prior)(\s+\w+)*\s+(instructions?|prompts?|rules?)', re.I),
    re.compile(r'system\s+prompt\s+(override|replace|change|modify|ignore)', re.I),
    re.compile(r'you\s+are\s+now\s+(a|an|no\s+longer)', re.I),
    re.compile(r'disregard\s+(all|any|your)\s+(previous|prior|above)', re.I),
    re.compile(r'new\s+instructions?\s*:', re.I),
    re.compile(r'curl\s+[^\n]*\$\{?\w*(KEY|TOKEN|SECRET|PASSWORD|CREDENTIAL)', re.I),
    re.compile(r'(cat|echo|print|export)\s+.*\$(ANTHROPIC|OPENAI|API|SECRET|TOKEN)', re.I),
    re.compile(r'base64\s+(encode|decode).*\b(key|token|secret|password)\b', re.I),
]


def _scan_for_threats(content: str, source: str) -> str | None:
    """Scan content for prompt injection patterns. Returns warning or None."""
    for pattern in _THREAT_PATTERNS:
        match = pattern.search(content)
        if match:
            return (
                f"[SECURITY WARNING] Potential prompt injection detected in {source}:\n"
                f"  Pattern: {match.group()!r}\n"
                f"  This content has been excluded from the system prompt."
            )
    return None


def get_git_info() -> str:
    """Return git branch/status summary if in a git repo. Cached for ~30s."""
    global _git_cache
    cwd = str(Path.cwd())
    now = time.monotonic()
    with _cache_lock:
        if _git_cache is not None and _git_cache[1] == cwd and _git_cache[0] > now:
            return _git_cache[2]
    try:
        branch = subprocess.check_output(
            ["git", "rev-parse", "--abbrev-ref", "HEAD"],
            stderr=subprocess.DEVNULL, text=True).strip()
        status = subprocess.check_output(
            ["git", "status", "--short"],
            stderr=subprocess.DEVNULL, text=True).strip()
        log = subprocess.check_output(
            ["git", "log", "--oneline", "-5"],
            stderr=subprocess.DEVNULL, text=True).strip()
        parts = [f"- Git branch: {branch}"]
        if status:
            lines = status.split('\n')[:10]
            parts.append("- Git status:\n" + "\n".join(f"  {l}" for l in lines))
        if log:
            parts.append("- Recent commits:\n" + "\n".join(f"  {l}" for l in log.split('\n')))
        result = "\n".join(parts) + "\n"
    except Exception:
        result = ""
    with _cache_lock:
        _git_cache = (now + _GIT_CACHE_TTL, cwd, result)
    return result


def get_claude_md() -> str:
    """Load CLAUDE.md from cwd or parents, and ~/.claude/CLAUDE.md.

    Each file is scanned for prompt injection patterns before inclusion.
    Cached for ~10s; the cache key is cwd so changing directories invalidates.
    """
    global _claude_md_cache
    cwd = str(Path.cwd())
    now = time.monotonic()
    with _cache_lock:
        if _claude_md_cache is not None and _claude_md_cache[1] == cwd and _claude_md_cache[0] > now:
            return _claude_md_cache[2]

    content_parts = []
    warnings = []

    # Global CLAUDE.md
    global_md = Path.home() / ".claude" / "CLAUDE.md"
    if global_md.exists():
        try:
            text = global_md.read_text()
            threat = _scan_for_threats(text, f"Global CLAUDE.md ({global_md})")
            if threat:
                warnings.append(threat)
            else:
                content_parts.append(f"[Global CLAUDE.md]\n{text}")
        except Exception:
            pass

    # Project CLAUDE.md (walk up from cwd)
    p = Path.cwd()
    for _ in range(10):
        candidate = p / "CLAUDE.md"
        if candidate.exists():
            try:
                text = candidate.read_text()
                threat = _scan_for_threats(text, f"Project CLAUDE.md ({candidate})")
                if threat:
                    warnings.append(threat)
                else:
                    content_parts.append(f"[Project CLAUDE.md: {candidate}]\n{text}")
            except Exception:
                pass
            break
        parent = p.parent
        if parent == p:
            break
        p = parent

    # Print warnings to stderr so user sees them
    if warnings:
        import sys
        for w in warnings:
            print(f"\033[33m{w}\033[0m", file=sys.stderr)

    if not content_parts:
        result = ""
    else:
        result = "\n# Memory / CLAUDE.md\n" + "\n\n".join(content_parts) + "\n"
    with _cache_lock:
        _claude_md_cache = (now + _CLAUDE_MD_TTL, cwd, result)
    return result


def get_platform_hints() -> str:
    """Return shell hints tailored to the current OS."""
    import platform as _plat
    if _plat.system() == "Windows":
        return (
            "\n## Windows Shell Hints\n"
            "You are on Windows. Do NOT use Unix commands. Use these instead:\n"
            "- `type file.txt` instead of `cat file.txt`\n"
            "- `type file.txt | findstr /n /i \"pattern\"` instead of `grep`\n"
            "- `powershell -Command \"Get-Content file.txt -Tail 20\"` instead of `tail -n 20`\n"
            "- `powershell -Command \"Get-Content file.txt -Head 20\"` instead of `head -n 20`\n"
            "- `dir /s /b *.py` or `powershell -Command \"Get-ChildItem -Recurse -Filter *.py\"` instead of `find . -name '*.py'`\n"
            "- `del file.txt` instead of `rm file.txt`\n"
            "- `mkdir folder` works on both (no -p needed)\n"
            "- `copy` / `move` instead of `cp` / `mv`\n"
            "- Use `&&` to chain commands, not `;`\n"
            "- Paths use backslashes `\\` but forward slashes `/` also work in most cases\n"
            "- Python is available: `python -c \"...\"` works for complex text processing\n"
        )
    return ""


def _render_env_block(config: dict | None = None) -> str:
    """Render the per-run environment block (date / cwd / platform / git / CLAUDE.md).

    This used to be the ``# Environment`` section at the bottom of the
    monolithic SYSTEM_PROMPT_TEMPLATE.  It now renders fresh every call
    so the base prompt can remain pure static text.
    """
    import platform as _plat
    # Trailing \n on the Platform line is load-bearing: get_git_info()
    # returns content that starts with "- Git branch:" (no leading newline),
    # so without this \n it concatenates as "Platform: Linux- Git branch:".
    header = (
        "# Environment\n"
        f"- Current date: {datetime.now().strftime('%Y-%m-%d %A')}\n"
        f"- Working directory: {Path.cwd()}\n"
        f"- Platform: {_plat.system()}\n"
    )
    return header + get_platform_hints() + get_git_info() + get_claude_md()


def _render_plan_fragment(config: dict) -> str:
    """Load the plan-mode fragment and fill in {plan_file}."""
    import runtime
    plan_file = runtime.get_ctx(config).plan_file or ""
    template = load_fragment("plan")
    return template.format(plan_file=plan_file)


def _tmux_available() -> bool:
    try:
        from tmux_tools import tmux_available
        return tmux_available()
    except ImportError:
        return False


def _render_commands_block() -> str:
    """Render a markdown list of every registered slash command.

    Pulls live from ``cheetahclaws._CMD_META`` (lazy import to avoid the
    cheetahclaws -> context -> cheetahclaws circular at module load), so
    the prompt always reflects the current command surface — including
    plugins merged in via ``_load_external_commands_into``.

    Without this block the model has no idea what `/trading`,
    `/research`, `/lab`, `/web`, `/wechat` etc. are and will confabulate
    when the user asks "what can you do?" — see context.py docstring.
    """
    try:
        import cheetahclaws as _cc
    except ImportError:
        return ""
    meta = getattr(_cc, "_CMD_META", None)
    if not meta:
        return ""

    lines = [
        "# Available Slash Commands (User-invokable in this CheetahClaws session)",
        "",
        "These commands the **user** can invoke at the REPL prompt — they are"
        " NOT tools you call. When the user asks 'what can you do?' / '你能做什么?'"
        " / asks about a feature like trading or research or web UI, reference"
        " these by their exact `/name` so the user can try them. Do not invent"
        " commands that are not on this list.",
        "",
    ]
    for name in sorted(meta.keys()):
        desc, subs = meta[name]
        sub_str = f" `[{' | '.join(subs)}]`" if subs else ""
        lines.append(f"- `/{name}`{sub_str} — {desc}")
    return "\n".join(lines)


def build_system_prompt(config: dict | None = None) -> str:
    """Build the full system prompt for the current session.

    Structure (top → bottom):
        1. Provider-selected base prompt (``prompts/base/<provider>.md``)
        2. Per-run environment block (date, cwd, platform, git, CLAUDE.md)
        3. Live slash-command index (so the model can answer
           "what can you do?" without confabulating)
        4. Memory index (if any memories exist)
        5. Tmux fragment (if tmux is installed)
        6. Plan-mode fragment (if ``permission_mode == "plan"``)
    """
    # Resolve provider lazily to avoid circular imports at module load.
    from providers import detect_provider

    cfg = config or {}
    model_id = cfg.get("model", "")
    # No model -> empty provider so pick_base_prompt falls through to
    # default.md.  The previous "anthropic" fallback silently gave Claude-
    # styled prompts (XML tags, minimal-scope guard) to whatever model
    # picked them up later, which is wrong for non-Claude families.
    provider = detect_provider(model_id) if model_id else ""

    parts: list[str] = [
        pick_base_prompt(provider, model_id),
        _render_env_block(cfg),
    ]

    cmds_block = _render_commands_block()
    if cmds_block:
        parts.append(cmds_block)

    memory_ctx = get_memory_context()
    if memory_ctx:
        parts.append(f"# Memory\nYour persistent memories:\n{memory_ctx}")

    if _tmux_available():
        parts.append(load_fragment("tmux"))

    if cfg.get("permission_mode") == "plan":
        parts.append(_render_plan_fragment(cfg))

    # Collapse any trailing whitespace on each part so the "\n\n"
    # separator produces a consistent two-newline gap regardless of how
    # each file/helper terminates.
    return "\n\n".join(p.rstrip() for p in parts if p)