ForgeLM/tests/test_quickstart_subprocess.py at main · HodeTech/ForgeLM · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
"""Phase 10.5 UX hardening: subprocess argv + actionable error messages.

Two regressions covered here:

1. ``_resolve_dataset`` raises :class:`FileExistsError` when a per-run scratch
   directory is reused. The message must point the operator at a recovery path
   (``--dataset`` to reuse, or delete the file) instead of just blaming them.
2. ``_run_quickstart_cmd`` builds ``train_cmd`` and ``chat_cmd`` argv lists.
   The ``--config`` and the final-model-dir argument must be absolute paths so
   the child subprocess does not silently fail if the parent's cwd shifts
   between argv construction and ``subprocess.run``.

The ``_RunRecorder`` pattern is duplicated inline (per task instructions) so
this module stays independent of ``tests/test_cli_quickstart_wiring.py``.
"""

from __future__ import annotations

import os
from pathlib import Path
from unittest.mock import patch

import pytest


class _RunRecorder:
    """Minimal stand-in for :func:`subprocess.run` that captures argv lists."""

    def __init__(self, returncodes: list[int] | None = None) -> None:
        self.returncodes = returncodes if returncodes is not None else [0, 0]
        self.calls: list[list[str]] = []

    def __call__(self, argv, *args, **kwargs):  # noqa: D401 — match subprocess.run
        self.calls.append(list(argv))
        idx = len(self.calls) - 1
        rc = self.returncodes[idx] if idx < len(self.returncodes) else 0

        class _Completed:
            returncode = rc

        return _Completed()


# ---------------------------------------------------------------------------
# 1. FileExistsError message must surface recovery actions
# ---------------------------------------------------------------------------


def test_file_exists_error_message_actionable(tmp_path: Path):
    """Reusing a scratch dir must yield an action-oriented FileExistsError."""
    from forgelm.quickstart import _resolve_dataset, get_template

    template = get_template("customer-support")
    scratch = tmp_path / "run-1"

    # First call seeds the dataset into the scratch dir.
    _resolve_dataset(template, dataset_override=None, scratch_dir=scratch)

    # Second call must refuse and explain what the user can do next.
    with pytest.raises(FileExistsError) as exc_info:
        _resolve_dataset(template, dataset_override=None, scratch_dir=scratch)

    msg = str(exc_info.value)
    assert "pass --dataset" in msg, f"Expected '--dataset' recovery hint in error message, got: {msg!r}"
    assert "delete" in msg, f"Expected 'delete' recovery hint in error message, got: {msg!r}"


# ---------------------------------------------------------------------------
# 2. train_cmd argv must use the absolute config path
# ---------------------------------------------------------------------------


def test_train_subprocess_uses_absolute_config_path(tmp_path: Path):
    """If parent cwd changes between argv build and exec, the child still finds the config."""
    from forgelm.cli import main

    config_out = tmp_path / "abs-path-test.yaml"
    recorder = _RunRecorder()

    # final_model_dir must look real so the chat block (also patched) is
    # exercised end-to-end. Without it, _run_quickstart_cmd would log a warning
    # and skip the chat subprocess — fine for this test, but explicit setup
    # keeps the harness uniform with the chat-path test below.
    final_dir = tmp_path / "checkpoints" / "final_model"
    final_dir.mkdir(parents=True)

    argv = [
        "forgelm",
        "quickstart",
        "customer-support",
        "--output",
        str(config_out),
    ]

    with (
        patch("forgelm.quickstart._detect_available_vram_gb", return_value=24.0),
        patch(
            "forgelm.cli._load_quickstart_train_paths",
            return_value=(str(tmp_path / "checkpoints"), "final_model"),
        ),
        patch("subprocess.run", new=recorder),
        patch("sys.argv", argv),
    ):
        with pytest.raises(SystemExit) as exc_info:
            main()
    assert exc_info.value.code == 0
    assert recorder.calls, "subprocess.run was never invoked"

    train_argv = recorder.calls[0]
    assert "--config" in train_argv, f"--config missing from train argv: {train_argv}"
    cfg_value = train_argv[train_argv.index("--config") + 1]
    assert os.path.isabs(cfg_value), f"Expected absolute --config path, got relative: {cfg_value!r}"
    assert cfg_value.endswith("abs-path-test.yaml"), f"Expected the configured output path, got: {cfg_value!r}"


# ---------------------------------------------------------------------------
# 3. chat_cmd argv must use the absolute final_model_dir path
# ---------------------------------------------------------------------------


def test_chat_subprocess_uses_absolute_model_path(tmp_path: Path):
    """The auto-launched chat REPL must receive an absolute model dir.

    Uses a real ``tmp_path/checkpoints/final_model`` directory rather than
    monkey-patching ``pathlib.Path.is_dir`` globally — the global patch
    affected every Path.is_dir() call in the importlib/yaml/setuptools
    stack and was a foot-gun for unrelated changes.
    """
    from forgelm.cli import main

    config_out = tmp_path / "abs-path-test.yaml"
    recorder = _RunRecorder()

    # Materialise the real directory the chat-launch gate checks for.
    checkpoints_dir = tmp_path / "checkpoints"
    final_model_dir = checkpoints_dir / "final_model"
    final_model_dir.mkdir(parents=True)

    argv = [
        "forgelm",
        "quickstart",
        "customer-support",
        "--output",
        str(config_out),
    ]

    with (
        patch("forgelm.quickstart._detect_available_vram_gb", return_value=24.0),
        patch(
            "forgelm.cli._load_quickstart_train_paths",
            return_value=(str(checkpoints_dir), "final_model"),
        ),
        patch("subprocess.run", new=recorder),
        patch("sys.argv", argv),
    ):
        with pytest.raises(SystemExit) as exc_info:
            main()
    assert exc_info.value.code == 0
    assert len(recorder.calls) == 2, (
        f"Expected train + chat subprocess calls, got {len(recorder.calls)}: {recorder.calls}"
    )

    chat_argv = recorder.calls[1]
    # The model path is the final positional argument to ``chat``.
    assert "chat" in chat_argv, f"'chat' subcommand missing: {chat_argv}"
    model_path = chat_argv[-1]
    assert os.path.isabs(model_path), f"Expected absolute chat model path, got relative: {model_path!r}"
    assert model_path.endswith("final_model"), f"Expected path to end with 'final_model', got: {model_path!r}"