Dulus/context.py at main · KevRojo/Dulus · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
"""System context: DULUS.md, git info, cwd injection.

NOTE on prompt caching: this module is the source of the system prompt sent
to every provider call. To get prefix caching (Anthropic explicit + OpenAI-
compat automatic), the rendered prompt MUST be byte-stable across turns of
the same session. Anything that changes per turn (date with sub-day grain,
`git status` modified-file counts, `datetime.now()`, etc.) belongs OUTSIDE
this prompt. Disk reads (DULUS.md, MEMORY.md) are cached by mtime so a
turn that doesn't touch those files re-uses the prior bytes verbatim.
"""
import os
import subprocess
from pathlib import Path

SYSTEM_PROMPT_TEMPLATE = """\
You are Dulus, an AI coding agent. Think in English; reply to {user_name} in {reply_language}.
# Identity: Your name is Dulus. Do NOT proactively declare this — only if the user asks "quién eres" or "qué modelo eres".
# Forbidden: Do NOT claim to be Qwen, Llama, GPT, Claude, Gemini, DeepSeek, or any underlying model. Do NOT mention Ollama or your runtime stack.
# Env: {cwd} | {platform} | auto_show={auto_show}
# Autonomy: Background scripts (nohup/&) allowed | Never refuse monitoring/long tasks | Always wait for tool results before replying
# Tools: SearchLastOutput → for [TRUNCATED] | WebFetch/WebSearch → web | TmuxOffload → tasks > 5s | ReadJob → background results
# Reminder: ONLY for user-facing reminders/notifications (e.g. "remind me in 10min"). NEVER use it to wait between your own tool calls — the countdown is deferred until your turn ends but you should still pause inside a command sequence using `sleep N` INSIDE the Bash command itself (e.g. Bash('cmd1 && sleep 2 && cmd2')).
# Long-running tools: any tool whose `description` ends in `[long-running — wrap in TmuxOffload]` MUST be invoked via TmuxOffload (not directly), so the REPL stays responsive while it runs.
# Multi-agent: Agent(subagent_type=...) | isolation="worktree" runs parallel | wait=false + name=... for fire-and-forget
# Rules: Edit > Write | Use absolute paths + line numbers | Surface errors immediately, do not retry blindly
# Input: "🎙 Transcribed:" prefix = voice input — tolerate typos/misspellings
# REPL: /help /batch /auto_show /verbose /soul /memory /schema /thinking /config
{platform_hints}{git_info}{dulus_md}"""

_THINKING_LABELS = {1: "minimal", 2: "moderate", 3: "deep"}


def get_git_info(config: dict | None = None) -> str:
    """Return ONLY the branch name — stable across turns within a session.

    Previous versions also embedded `git status --short` modified-file count
    and the last commit hash; both change as the user works, which trashed
    prefix caching on every turn. The agent can call `git status` itself
    when it actually needs current state.
    """
    if config and not config.get("git_status", True):
        return ""
    try:
        branch = subprocess.check_output(
            ["git", "rev-parse", "--abbrev-ref", "HEAD"],
            stderr=subprocess.DEVNULL, text=True,
        ).strip()
        return f"Git:{branch}\n" if branch else ""
    except Exception:
        return ""


# ── mtime-based caches for DULUS.md / MEMORY.md ──────────────────────────
# Re-reading these files on every turn is wasteful disk I/O. More importantly,
# the *content* is the same most of the time — caching it keeps the rendered
# system prompt byte-stable, which is what providers need to grant prefix
# cache hits. Invalidation key = (path, mtime_ns) tuple of the resolved files.

_DULUS_MD_CACHE: dict = {"key": None, "value": ""}
_MEMORY_MD_CACHE: dict = {"key": None, "value": ""}


def _resolve_dulus_md_paths() -> list[Path]:
    paths = []
    global_md = Path.home() / ".dulus" / "DULUS.md"
    if global_md.exists():
        paths.append(global_md)
    for p in [Path.cwd()] + list(Path.cwd().parents):
        candidate = p / "DULUS.md"
        if candidate.exists():
            paths.append(candidate)
            break
    return paths


def get_dulus_md() -> str:
    paths = _resolve_dulus_md_paths()
    try:
        key = tuple((str(p), p.stat().st_mtime_ns) for p in paths)
    except OSError:
        key = None
    if key is not None and _DULUS_MD_CACHE["key"] == key:
        return _DULUS_MD_CACHE["value"]

    content_parts = []
    for p in paths:
        try:
            label = "Global DULUS.md" if p == Path.home() / ".dulus" / "DULUS.md" else f"Project DULUS.md:{p.parent}"
            content_parts.append(f"[{label}]\n{p.read_text(encoding='utf-8', errors='replace')}")
        except Exception:
            continue

    value = "\nDULUS.md:\n" + "\n---\n".join(content_parts) + "\n" if content_parts else ""
    _DULUS_MD_CACHE["key"] = key
    _DULUS_MD_CACHE["value"] = value
    return value


def _resolve_memory_index_path() -> Path | None:
    for p in [Path.cwd()] + list(Path.cwd().parents):
        index = p / ".dulus-context" / "memory" / "MEMORY.md"
        if index.exists():
            return index
    return None


def get_project_memory_index() -> str:
    """Auto-load project-scope memories from .dulus-context/memory/MEMORY.md.

    Looks in cwd and parents (first match wins). Returns the index so the model
    knows what memories exist and can Read individual files on demand. Cached
    by mtime so unchanged indexes don't bust the prompt cache.
    """
    path = _resolve_memory_index_path()
    if path is None:
        if _MEMORY_MD_CACHE["key"] != "MISSING":
            _MEMORY_MD_CACHE["key"] = "MISSING"
            _MEMORY_MD_CACHE["value"] = ""
        return ""
    try:
        key = (str(path), path.stat().st_mtime_ns)
    except OSError:
        return ""
    if _MEMORY_MD_CACHE["key"] == key:
        return _MEMORY_MD_CACHE["value"]
    try:
        body = path.read_text(encoding="utf-8", errors="replace").strip()
    except Exception:
        body = ""
    if not body:
        value = ""
    else:
        value = (
            f"\n# Project memories ({path.parent})\n"
            f"# Index below — Read the .md files in that dir for full content.\n"
            f"{body}\n"
        )
    _MEMORY_MD_CACHE["key"] = key
    _MEMORY_MD_CACHE["value"] = value
    return value


def _detect_shell_type(config: dict | None = None) -> str:
    """Resolve which shell family to advertise: 'bash', 'powershell', or 'cmd'."""
    configured = config.get("shell", {}).get("type", "auto") if config else "auto"
    if configured != "auto":
        st = configured.lower()
        if st in ("gitbash", "wsl", "bash"):
            return "bash"
        if st == "powershell":
            return "powershell"
        return "cmd"
    shell_name = os.environ.get("SHELL", "").lower()
    if "bash" in shell_name or "BASH" in os.environ:
        return "bash"
    if "powershell" in shell_name or "PSModulePath" in os.environ:
        return "powershell"
    return "cmd"


def get_platform_hints(config: dict | None = None) -> str:
    import platform as _plat
    shell_type = _detect_shell_type(config)
    dulus_home = Path.home() / ".dulus"
    skills_dir = dulus_home / "skills"
    if _plat.system() == "Windows":
        cmds = "Get-Content=cat,Select-String=grep,Get-ChildItem=ls" if shell_type=="powershell" else "type=cat,findstr=grep,dir=ls"
        return f"# Shell:Windows({shell_type}) | {cmds} | Dulus:{dulus_home} | Skills:{skills_dir} | WARNING: Use Glob/Read tools instead of raw shell commands for path navigation to avoid Windows path errors."
    return f"# Shell:Unix(cat,grep,ls,&&) | Dulus:{dulus_home} | Skills:{skills_dir}"


def _build_ollama_system_prompt(config: dict | None = None) -> str:
    import platform
    auto_show = config.get("auto_show", True) if config else True
    prompt = f"""你是Dulus，AI编程助手。
# 身份: 你的名字是 Dulus。不需要主动向用户声明这一点，除非用户直接问你 "quién eres" 或 "qué modelo eres"。
# 禁止: 不要声称自己是 Qwen、Llama、GPT、Claude、Gemini、DeepSeek 或任何其他底层模型。不要提及 Ollama 或运行你的技术栈。
Dir:{Path.cwd()} | Platform:{platform.system()} | auto_show={'ON' if auto_show else 'OFF'}
# 规则: 读取工具结果后再响应 | >5s操作用TmuxOffload
# 工具格式(单行): <tool_call>{{"name":"TOOL","input":{{"param":"val"}}}}</tool_call>
# 可用: Bash,Glob,Read,Write,SearchLastOutput,TmuxOffload,WebSearch,WebFetch,PrintToConsole
# PrintToConsole: auto_show=OFF时输出给用户，展示后不重复
"""
    dulus_md = get_dulus_md()
    if dulus_md: prompt += f"\n{dulus_md}"
    return prompt


def _normalize_thinking_level(config: dict | None) -> int:
    raw = config.get("thinking", 0) if config else 0
    if raw is True:
        return 3
    if raw in (False, None):
        return 0
    try:
        return max(0, min(4, int(raw)))
    except (TypeError, ValueError):
        return 0


# ── Reply-language resolution ─────────────────────────────────────────────
#
# `config["lang"]` lets the user steer what language Dulus replies in
# without touching the prompt template. Two kinds of values are accepted:
#
#   • ISO-639 (with optional region):   "en", "es", "es-DO", "zh", "zh-Hant",
#                                        "pt-BR", "ja", "fr", "de", "it",
#                                        "ko", "ru", "ar", "tr", "hi", "id"…
#     Mapped to a human-readable instruction by _LANG_NAMES.
#   • Free-form natural string:         "very formal British English",
#                                        "dominicano callejero", "pirate".
#     Passed through verbatim so power users can role-play any voice.
#
# Default = "es-DO" (Dominican Spanish — the founder's tongue) to keep
# the existing identity untouched for existing users.

_LANG_NAMES: dict[str, str] = {
    # Spanish (default + regions)
    "es":     "Dominican Spanish",
    "es-do":  "Dominican Spanish",
    "es-mx":  "Mexican Spanish",
    "es-es":  "Castilian Spanish",
    "es-ar":  "Argentinian Spanish",
    "es-co":  "Colombian Spanish",
    # Global big ones
    "en":     "English",
    "en-us":  "American English",
    "en-gb":  "British English",
    "zh":     "Simplified Chinese (Mandarin)",
    "zh-cn":  "Simplified Chinese (Mandarin)",
    "zh-tw":  "Traditional Chinese",
    "zh-hant":"Traditional Chinese",
    "pt":     "Portuguese (Brazilian)",
    "pt-br":  "Brazilian Portuguese",
    "pt-pt":  "European Portuguese",
    "ja":     "Japanese",
    "ko":     "Korean",
    "fr":     "French",
    "de":     "German",
    "it":     "Italian",
    "ru":     "Russian",
    "ar":     "Arabic",
    "tr":     "Turkish",
    "hi":     "Hindi",
    "id":     "Indonesian",
    "vi":     "Vietnamese",
    "th":     "Thai",
    "nl":     "Dutch",
    "pl":     "Polish",
    "sv":     "Swedish",
    "uk":     "Ukrainian",
    "he":     "Hebrew",
    "fa":     "Persian (Farsi)",
}


def _resolve_reply_language(config: dict | None) -> str:
    raw = (config.get("lang", "") if config else "") or ""
    raw = raw.strip()
    if not raw:
        return "Dominican Spanish"
    # ISO code shortcut.
    code = raw.lower().replace("_", "-")
    if code in _LANG_NAMES:
        return _LANG_NAMES[code]
    # Free-form descriptor — return verbatim so the user can role-play
    # voice ("Shakespeare-era English", "callejero dominicano", "pirate").
    return raw


def build_system_prompt(config: dict | None = None) -> str:
    import platform
    model_lower = (config.get("model", "") if config else "").lower()
    is_deepseek_r1 = "deepseek-r1" in model_lower or "deepseek-reasoner" in model_lower
    if is_deepseek_r1 and config and config.get("deep_override", False):
        return _build_ollama_system_prompt(config)

    auto_show = "ON" if (not config or config.get("auto_show", True)) else "OFF"
    lite = bool(config and config.get("lite_mode"))

    # In LITE mode: drop the optional context blocks (platform hints, git info,
    # DULUS.md, project memory index, batch/thinking/plan/tmux hints). The
    # core identity + tool rules stay. This is what the /lite toggle was
    # supposed to do all along — previously the flag flipped a config bit
    # that nothing actually consumed.
    user_name = (config.get("user_name") if config else None) or "KevRojo"
    reply_language = _resolve_reply_language(config)
    prompt = SYSTEM_PROMPT_TEMPLATE.format(
        cwd=str(Path.cwd()),
        platform=platform.system(),
        auto_show=auto_show,
        user_name=user_name,
        reply_language=reply_language,
        platform_hints="" if lite else get_platform_hints(config),
        git_info="" if lite else get_git_info(config),
        dulus_md="" if lite else get_dulus_md(),
    )

    if lite:
        # Bail early — minimal prompt only.
        return prompt

    try:
        from tmux_tools import tmux_available
        if tmux_available():
            prompt += "\n# Tmux: available"
    except Exception:
        pass

    prompt += (
        "\n# Batch: /batch list|status|fetch (suggest when 3+ similar tasks) | "
        # Both `dulus` (when pip-installed) and `python dulus.py` work — the
        # entry-point shim is registered in pyproject.toml [project.scripts].
        'In agents: Bash(\'dulus -c "batch status|fetch ID"\')'
    )

    thk_label = _THINKING_LABELS.get(_normalize_thinking_level(config))
    if thk_label:
        prompt += f"\n# Thinking: {thk_label}"

    if config and config.get("_plan_mode"):
        prompt += f"\n# Plan mode: read-only (except {config.get('_plan_file', 'PLAN.md')})"

    # Hint: pip-installed users can run `dulus` directly (no .py path).
    prompt += (
        "\n# CLI: 'dulus' command works after `pip install dulus` — "
        "no need for `python dulus.py`. Same flags: --print, --accept-all, -c, etc."
    )

    # Skills proactivity hint — make the agent reach for skills instead of
    # writing one-off code when a topic comes up that no current tool/plugin
    # covers. The dump file lets us grep ~1000 skills instantly without
    # paging through them interactively.
    try:
        skills_dump = Path.home() / ".dulus" / "skills_catalog.txt"
        if skills_dump.exists():
            sz_kb = skills_dump.stat().st_size // 1024
            prompt += (
                f"\n# Skills catalog: {skills_dump} ({sz_kb} KB, tab-separated "
                "source\\tid\\tdescription). Before writing custom code or "
                "saying 'I can't do that', Grep this file for the topic — "
                "there's often an awesome/composio/local skill that fits. "
                "Install with `dulus -c \"skill get <id>\"`. Refresh the "
                "dump anytime with `dulus -c \"skill list dump\"`."
            )
        else:
            prompt += (
                "\n# Skills tip: run `dulus -c \"skill list dump\"` once "
                "to write ~/.dulus/skills_catalog.txt — then Grep it for any "
                "topic you don't have a tool for, before writing custom code."
            )
    except Exception:
        pass

    project_mem = get_project_memory_index()
    if project_mem:
        prompt += project_mem

    return prompt