claw-code/tests/test_parse_error_envelope.py

"""#178 — argparse-level errors emit JSON envelope when --output-format json is requested.

Before #178:
  $ claw nonexistent --output-format json
  usage: main.py [-h] {summary,manifest,...} ...
  main.py: error: argument command: invalid choice: 'nonexistent' (choose from ...)
  [exit 2, argparse dumps help to stderr, no JSON envelope]

After #178:
  $ claw nonexistent --output-format json
  {"timestamp": "...", "command": "nonexistent", "exit_code": 1, ...,
   "error": {"kind": "parse", "operation": "argparse", ...}}
  [exit 1, JSON envelope on stdout, matches SCHEMAS.md contract]

Contract:
- text mode: unchanged (argparse still dumps help to stderr, exit code 2)
- JSON mode: envelope matches SCHEMAS.md 'error' shape, exit code 1
- Parse errors use error.kind='parse' (distinct from runtime/session/etc.)
"""

from __future__ import annotations

import json
import subprocess
import sys
from pathlib import Path

import pytest

CLI = [sys.executable, '-m', 'src.main']
REPO_ROOT = Path(__file__).resolve().parent.parent


class TestParseErrorJsonEnvelope:
    """Argparse errors emit JSON envelope when --output-format json is requested."""

    def test_unknown_command_json_mode_emits_envelope(self) -> None:
        """Unknown command + --output-format json → parse-error envelope."""
        result = subprocess.run(
            CLI + ['nonexistent-command', '--output-format', 'json'],
            cwd=REPO_ROOT,
            capture_output=True,
            text=True,
        )
        assert result.returncode == 1, f"expected exit 1; got {result.returncode}"
        envelope = json.loads(result.stdout)
        # Common fields
        assert envelope['schema_version'] == '1.0'
        assert envelope['output_format'] == 'json'
        assert envelope['exit_code'] == 1
        # Error envelope shape
        assert envelope['error']['kind'] == 'parse'
        assert envelope['error']['operation'] == 'argparse'
        assert envelope['error']['retryable'] is False
        assert envelope['error']['target'] == 'nonexistent-command'
        assert 'hint' in envelope['error']

    def test_unknown_command_json_equals_syntax(self) -> None:
        """--output-format=json syntax also works."""
        result = subprocess.run(
            CLI + ['nonexistent-command', '--output-format=json'],
            cwd=REPO_ROOT,
            capture_output=True,
            text=True,
        )
        assert result.returncode == 1
        envelope = json.loads(result.stdout)
        assert envelope['error']['kind'] == 'parse'

    def test_unknown_command_text_mode_unchanged(self) -> None:
        """Text mode (default) preserves argparse behavior: help to stderr, exit 2."""
        result = subprocess.run(
            CLI + ['nonexistent-command'],
            cwd=REPO_ROOT,
            capture_output=True,
            text=True,
        )
        assert result.returncode == 2, f"text mode must preserve argparse exit 2; got {result.returncode}"
        # stderr should have argparse error (help + error message)
        assert 'invalid choice' in result.stderr
        # stdout should be empty (no JSON leaked)
        assert result.stdout == ''

    def test_invalid_flag_json_mode_emits_envelope(self) -> None:
        """Invalid flag at top level + --output-format json → envelope."""
        result = subprocess.run(
            CLI + ['--invalid-top-level-flag', '--output-format', 'json'],
            cwd=REPO_ROOT,
            capture_output=True,
            text=True,
        )
        # argparse might reject before --output-format is parsed; still emit envelope
        assert result.returncode == 1, f"got {result.returncode}: {result.stderr}"
        envelope = json.loads(result.stdout)
        assert envelope['error']['kind'] == 'parse'

    def test_missing_command_no_json_flag_behaves_normally(self) -> None:
        """No --output-format flag + missing command → normal argparse behavior."""
        result = subprocess.run(
            CLI,
            cwd=REPO_ROOT,
            capture_output=True,
            text=True,
        )
        # argparse exits 2 when required subcommand is missing
        assert result.returncode == 2
        assert 'required' in result.stderr.lower() or 'the following arguments are required' in result.stderr.lower()

    def test_valid_command_unaffected(self) -> None:
        """Valid commands still work normally (no regression)."""
        result = subprocess.run(
            CLI + ['list-sessions', '--output-format', 'json'],
            cwd=REPO_ROOT,
            capture_output=True,
            text=True,
        )
        assert result.returncode == 0
        envelope = json.loads(result.stdout)
        assert envelope['command'] == 'list-sessions'
        assert 'sessions' in envelope

    def test_parse_error_envelope_contains_common_fields(self) -> None:
        """Parse-error envelope must include all common fields per SCHEMAS.md."""
        result = subprocess.run(
            CLI + ['bogus', '--output-format', 'json'],
            cwd=REPO_ROOT,
            capture_output=True,
            text=True,
        )
        envelope = json.loads(result.stdout)
        # All common fields required by SCHEMAS.md
        for field in ('timestamp', 'command', 'exit_code', 'output_format', 'schema_version'):
            assert field in envelope, f"common field '{field}' missing from parse-error envelope"


class TestParseErrorSchemaCompliance:
    """Parse-error envelope matches SCHEMAS.md error shape."""

    def test_error_kind_is_parse(self) -> None:
        """error.kind='parse' distinguishes argparse errors from runtime errors."""
        result = subprocess.run(
            CLI + ['unknown', '--output-format', 'json'],
            cwd=REPO_ROOT,
            capture_output=True,
            text=True,
        )
        envelope = json.loads(result.stdout)
        assert envelope['error']['kind'] == 'parse'

    def test_error_retryable_false(self) -> None:
        """Parse errors are never retryable (typo won't magically fix itself)."""
        result = subprocess.run(
            CLI + ['unknown', '--output-format', 'json'],
            cwd=REPO_ROOT,
            capture_output=True,
            text=True,
        )
        envelope = json.loads(result.stdout)
        assert envelope['error']['retryable'] is False


class TestParseErrorStderrHygiene:
    """#179: JSON mode must fully suppress argparse stderr output.

    Before #179: stderr leaked argparse usage + error text even when --output-format json.
    After #179: stderr is silent; envelope carries the real error message verbatim.
    """

    def test_json_mode_stderr_is_silent_on_unknown_command(self) -> None:
        """Unknown command in JSON mode: stderr empty."""
        result = subprocess.run(
            CLI + ['nonexistent-cmd', '--output-format', 'json'],
            cwd=REPO_ROOT,
            capture_output=True,
            text=True,
        )
        assert result.stderr == '', (
            f"JSON mode stderr must be empty; got:\n{result.stderr!r}"
        )

    def test_json_mode_stderr_is_silent_on_missing_arg(self) -> None:
        """Missing required arg in JSON mode: stderr empty (no argparse usage leak)."""
        result = subprocess.run(
            CLI + ['load-session', '--output-format', 'json'],
            cwd=REPO_ROOT,
            capture_output=True,
            text=True,
        )
        assert result.stderr == '', (
            f"JSON mode stderr must be empty on missing arg; got:\n{result.stderr!r}"
        )

    def test_json_mode_envelope_carries_real_argparse_message(self) -> None:
        """#179: envelope.error.message contains argparse's actual text, not generic rejection."""
        result = subprocess.run(
            CLI + ['load-session', '--output-format', 'json'],
            cwd=REPO_ROOT,
            capture_output=True,
            text=True,
        )
        envelope = json.loads(result.stdout)
        # Real argparse message: 'the following arguments are required: session_id'
        msg = envelope['error']['message']
        assert 'session_id' in msg, (
            f"envelope.error.message must carry real argparse text mentioning missing arg; got: {msg!r}"
        )
        assert 'required' in msg.lower(), (
            f"envelope.error.message must indicate what is required; got: {msg!r}"
        )

    def test_json_mode_envelope_carries_invalid_choice_details(self) -> None:
        """#179: unknown command envelope includes valid-choice list from argparse."""
        result = subprocess.run(
            CLI + ['typo-command', '--output-format', 'json'],
            cwd=REPO_ROOT,
            capture_output=True,
            text=True,
        )
        envelope = json.loads(result.stdout)
        msg = envelope['error']['message']
        assert 'invalid choice' in msg.lower(), (
            f"envelope must mention 'invalid choice'; got: {msg!r}"
        )
        # Should include at least one valid command name for discoverability
        assert 'bootstrap' in msg or 'summary' in msg, (
            f"envelope must include valid choices for discoverability; got: {msg!r}"
        )

    def test_text_mode_stderr_preserved_on_unknown_command(self) -> None:
        """Text mode: argparse stderr behavior unchanged (backward compat)."""
        result = subprocess.run(
            CLI + ['nonexistent-cmd'],
            cwd=REPO_ROOT,
            capture_output=True,
            text=True,
        )
        # Text mode still dumps argparse help to stderr
        assert 'invalid choice' in result.stderr
        assert result.returncode == 2
feat: #178 — argparse errors emit JSON envelope when --output-format json requested Dogfood pinpoint: running 'claw nonexistent-command --output-format json' bypasses the JSON envelope contract — argparse dumps human-readable usage to stderr with exit 2, breaking the SCHEMAS.md guarantee that JSON mode returns structured output. Problem: $ claw nonexistent --output-format json usage: main.py [-h] {summary,manifest,...} ... main.py: error: argument command: invalid choice: 'nonexistent' (choose from ...) [exit 2 — no envelope, claws must parse argparse usage messages] Fix: $ claw nonexistent --output-format json { "timestamp": "2026-04-22T11:00:29Z", "command": "nonexistent-command", "exit_code": 1, "output_format": "json", "schema_version": "1.0", "error": { "kind": "parse", "operation": "argparse", "target": "nonexistent-command", "retryable": false, "message": "invalid command or argument (argparse rejection)", "hint": "run with no arguments to see available subcommands" } } [exit 1, clean JSON envelope on stdout per SCHEMAS.md] Changes: - src/main.py: - _wants_json_output(argv): pre-scan for --output-format json before parsing - _emit_parse_error_envelope(argv, message): emit wrapped envelope on stdout - main(): catch SystemExit from argparse; if JSON requested, emit envelope instead of letting argparse's help dump go through - tests/test_parse_error_envelope.py (new, 9 tests): - TestParseErrorJsonEnvelope (7): unknown command, =syntax, text mode unchanged, invalid flag, missing command, valid command unaffected, common fields - TestParseErrorSchemaCompliance (2): error.kind='parse', retryable=false Contract: - text mode (default): unchanged — argparse dumps help to stderr, exits 2 - JSON mode: envelope per SCHEMAS.md, error.kind='parse', exit 1 - Parse errors always retryable=false (typo won't self-fix) - error.kind='parse' already enumerated in SCHEMAS.md (no schema changes) This closes a real gap: claws invoking unknown commands in JSON mode can now route via exit code + envelope.kind='parse' instead of scraping argparse output. Test results: 192 → 201 passing, 3 skipped unchanged, zero regression. Pinpoint discovered via dogfood at 2026-04-22 19:59 KST (cycle #19). 2026-04-22 20:02:39 +09:00			`"""#178 — argparse-level errors emit JSON envelope when --output-format json is requested.`

			`Before #178:`
			`$ claw nonexistent --output-format json`
			`usage: main.py [-h] {summary,manifest,...} ...`
			`main.py: error: argument command: invalid choice: 'nonexistent' (choose from ...)`
			`[exit 2, argparse dumps help to stderr, no JSON envelope]`

			`After #178:`
			`$ claw nonexistent --output-format json`
			`{"timestamp": "...", "command": "nonexistent", "exit_code": 1, ...,`
			`"error": {"kind": "parse", "operation": "argparse", ...}}`
			`[exit 1, JSON envelope on stdout, matches SCHEMAS.md contract]`

			`Contract:`
			`- text mode: unchanged (argparse still dumps help to stderr, exit code 2)`
			`- JSON mode: envelope matches SCHEMAS.md 'error' shape, exit code 1`
			`- Parse errors use error.kind='parse' (distinct from runtime/session/etc.)`
			`"""`

			`from __future__ import annotations`

			`import json`
			`import subprocess`
			`import sys`
			`from pathlib import Path`

			`import pytest`

			`CLI = [sys.executable, '-m', 'src.main']`
			`REPO_ROOT = Path(__file__).resolve().parent.parent`


			`class TestParseErrorJsonEnvelope:`
			`"""Argparse errors emit JSON envelope when --output-format json is requested."""`

			`def test_unknown_command_json_mode_emits_envelope(self) -> None:`
			`"""Unknown command + --output-format json → parse-error envelope."""`
			`result = subprocess.run(`
			`CLI + ['nonexistent-command', '--output-format', 'json'],`
			`cwd=REPO_ROOT,`
			`capture_output=True,`
			`text=True,`
			`)`
			`assert result.returncode == 1, f"expected exit 1; got {result.returncode}"`
			`envelope = json.loads(result.stdout)`
			`# Common fields`
			`assert envelope['schema_version'] == '1.0'`
			`assert envelope['output_format'] == 'json'`
			`assert envelope['exit_code'] == 1`
			`# Error envelope shape`
			`assert envelope['error']['kind'] == 'parse'`
			`assert envelope['error']['operation'] == 'argparse'`
			`assert envelope['error']['retryable'] is False`
			`assert envelope['error']['target'] == 'nonexistent-command'`
			`assert 'hint' in envelope['error']`

			`def test_unknown_command_json_equals_syntax(self) -> None:`
			`"""--output-format=json syntax also works."""`
			`result = subprocess.run(`
			`CLI + ['nonexistent-command', '--output-format=json'],`
			`cwd=REPO_ROOT,`
			`capture_output=True,`
			`text=True,`
			`)`
			`assert result.returncode == 1`
			`envelope = json.loads(result.stdout)`
			`assert envelope['error']['kind'] == 'parse'`

			`def test_unknown_command_text_mode_unchanged(self) -> None:`
			`"""Text mode (default) preserves argparse behavior: help to stderr, exit 2."""`
			`result = subprocess.run(`
			`CLI + ['nonexistent-command'],`
			`cwd=REPO_ROOT,`
			`capture_output=True,`
			`text=True,`
			`)`
			`assert result.returncode == 2, f"text mode must preserve argparse exit 2; got {result.returncode}"`
			`# stderr should have argparse error (help + error message)`
			`assert 'invalid choice' in result.stderr`
			`# stdout should be empty (no JSON leaked)`
			`assert result.stdout == ''`

			`def test_invalid_flag_json_mode_emits_envelope(self) -> None:`
			`"""Invalid flag at top level + --output-format json → envelope."""`
			`result = subprocess.run(`
			`CLI + ['--invalid-top-level-flag', '--output-format', 'json'],`
			`cwd=REPO_ROOT,`
			`capture_output=True,`
			`text=True,`
			`)`
			`# argparse might reject before --output-format is parsed; still emit envelope`
			`assert result.returncode == 1, f"got {result.returncode}: {result.stderr}"`
			`envelope = json.loads(result.stdout)`
			`assert envelope['error']['kind'] == 'parse'`

			`def test_missing_command_no_json_flag_behaves_normally(self) -> None:`
			`"""No --output-format flag + missing command → normal argparse behavior."""`
			`result = subprocess.run(`
			`CLI,`
			`cwd=REPO_ROOT,`
			`capture_output=True,`
			`text=True,`
			`)`
			`# argparse exits 2 when required subcommand is missing`
			`assert result.returncode == 2`
			`assert 'required' in result.stderr.lower() or 'the following arguments are required' in result.stderr.lower()`

			`def test_valid_command_unaffected(self) -> None:`
			`"""Valid commands still work normally (no regression)."""`
			`result = subprocess.run(`
			`CLI + ['list-sessions', '--output-format', 'json'],`
			`cwd=REPO_ROOT,`
			`capture_output=True,`
			`text=True,`
			`)`
			`assert result.returncode == 0`
			`envelope = json.loads(result.stdout)`
			`assert envelope['command'] == 'list-sessions'`
			`assert 'sessions' in envelope`

			`def test_parse_error_envelope_contains_common_fields(self) -> None:`
			`"""Parse-error envelope must include all common fields per SCHEMAS.md."""`
			`result = subprocess.run(`
			`CLI + ['bogus', '--output-format', 'json'],`
			`cwd=REPO_ROOT,`
			`capture_output=True,`
			`text=True,`
			`)`
			`envelope = json.loads(result.stdout)`
			`# All common fields required by SCHEMAS.md`
			`for field in ('timestamp', 'command', 'exit_code', 'output_format', 'schema_version'):`
			`assert field in envelope, f"common field '{field}' missing from parse-error envelope"`


			`class TestParseErrorSchemaCompliance:`
			`"""Parse-error envelope matches SCHEMAS.md error shape."""`

			`def test_error_kind_is_parse(self) -> None:`
			`"""error.kind='parse' distinguishes argparse errors from runtime errors."""`
			`result = subprocess.run(`
			`CLI + ['unknown', '--output-format', 'json'],`
			`cwd=REPO_ROOT,`
			`capture_output=True,`
			`text=True,`
			`)`
			`envelope = json.loads(result.stdout)`
			`assert envelope['error']['kind'] == 'parse'`

			`def test_error_retryable_false(self) -> None:`
			`"""Parse errors are never retryable (typo won't magically fix itself)."""`
			`result = subprocess.run(`
			`CLI + ['unknown', '--output-format', 'json'],`
			`cwd=REPO_ROOT,`
			`capture_output=True,`
			`text=True,`
			`)`
			`envelope = json.loads(result.stdout)`
			`assert envelope['error']['retryable'] is False`
fix: #179 — JSON mode now fully suppresses argparse stderr + preserves real error message Dogfood discovered #178 had two residual gaps: 1. Stderr pollution: argparse usage + error text still leaked to stderr even in JSON mode (envelope was correct on stdout, but stderr noise broke the 'machine-first protocol' contract — claws capturing both streams got dual output) 2. Generic error message: envelope carried 'invalid command or argument (argparse rejection)' instead of argparse's actual text like 'the following arguments are required: session_id' or 'invalid choice: typo (choose from ...)' Before #179: $ claw load-session --output-format json [stdout] {"error": {"message": "invalid command or argument (argparse rejection)"}} [stderr] usage: main.py load-session [-h] ... main.py load-session: error: the following arguments are required: session_id [exit 1] After #179: $ claw load-session --output-format json [stdout] {"error": {"message": "the following arguments are required: session_id"}} [stderr] (empty) [exit 1] Implementation: - New _ArgparseError exception class captures argparse's real message - main() monkey-patches parser.error (+ all subparser.error) in JSON mode to raise _ArgparseError instead of print-to-stderr + sys.exit(2) - _emit_parse_error_envelope() now receives the real message verbatim - Text mode path unchanged: still uses original argparse print+exit behavior Contract: - JSON mode: stdout carries envelope with argparse's actual error; stderr silent - Text mode: unchanged — argparse usage to stderr, exit 2 - Parse errors still error.kind='parse', retryable=false Test additions (5 new, 14 total in test_parse_error_envelope.py): - TestParseErrorStderrHygiene (5): - test_json_mode_stderr_is_silent_on_unknown_command - test_json_mode_stderr_is_silent_on_missing_arg - test_json_mode_envelope_carries_real_argparse_message - test_json_mode_envelope_carries_invalid_choice_details (verifies valid-choices list) - test_text_mode_stderr_preserved_on_unknown_command (backward compat) Operational impact: Claws capturing both stdout and stderr no longer get garbled output. The envelope message now carries discoverability info (valid command list, missing-arg name) that claws can use for retry/recovery without probing the CLI a second time. Test results: 201 → 206 passing, 3 skipped unchanged, zero regression. Pinpoint discovered via dogfood at 2026-04-22 20:30 KST (cycle #20). 2026-04-22 20:32:28 +09:00

			`class TestParseErrorStderrHygiene:`
			`"""#179: JSON mode must fully suppress argparse stderr output.`

			`Before #179: stderr leaked argparse usage + error text even when --output-format json.`
			`After #179: stderr is silent; envelope carries the real error message verbatim.`
			`"""`

			`def test_json_mode_stderr_is_silent_on_unknown_command(self) -> None:`
			`"""Unknown command in JSON mode: stderr empty."""`
			`result = subprocess.run(`
			`CLI + ['nonexistent-cmd', '--output-format', 'json'],`
			`cwd=REPO_ROOT,`
			`capture_output=True,`
			`text=True,`
			`)`
			`assert result.stderr == '', (`
			`f"JSON mode stderr must be empty; got:\n{result.stderr!r}"`
			`)`

			`def test_json_mode_stderr_is_silent_on_missing_arg(self) -> None:`
			`"""Missing required arg in JSON mode: stderr empty (no argparse usage leak)."""`
			`result = subprocess.run(`
			`CLI + ['load-session', '--output-format', 'json'],`
			`cwd=REPO_ROOT,`
			`capture_output=True,`
			`text=True,`
			`)`
			`assert result.stderr == '', (`
			`f"JSON mode stderr must be empty on missing arg; got:\n{result.stderr!r}"`
			`)`

			`def test_json_mode_envelope_carries_real_argparse_message(self) -> None:`
			`"""#179: envelope.error.message contains argparse's actual text, not generic rejection."""`
			`result = subprocess.run(`
			`CLI + ['load-session', '--output-format', 'json'],`
			`cwd=REPO_ROOT,`
			`capture_output=True,`
			`text=True,`
			`)`
			`envelope = json.loads(result.stdout)`
			`# Real argparse message: 'the following arguments are required: session_id'`
			`msg = envelope['error']['message']`
			`assert 'session_id' in msg, (`
			`f"envelope.error.message must carry real argparse text mentioning missing arg; got: {msg!r}"`
			`)`
			`assert 'required' in msg.lower(), (`
			`f"envelope.error.message must indicate what is required; got: {msg!r}"`
			`)`

			`def test_json_mode_envelope_carries_invalid_choice_details(self) -> None:`
			`"""#179: unknown command envelope includes valid-choice list from argparse."""`
			`result = subprocess.run(`
			`CLI + ['typo-command', '--output-format', 'json'],`
			`cwd=REPO_ROOT,`
			`capture_output=True,`
			`text=True,`
			`)`
			`envelope = json.loads(result.stdout)`
			`msg = envelope['error']['message']`
			`assert 'invalid choice' in msg.lower(), (`
			`f"envelope must mention 'invalid choice'; got: {msg!r}"`
			`)`
			`# Should include at least one valid command name for discoverability`
			`assert 'bootstrap' in msg or 'summary' in msg, (`
			`f"envelope must include valid choices for discoverability; got: {msg!r}"`
			`)`

			`def test_text_mode_stderr_preserved_on_unknown_command(self) -> None:`
			`"""Text mode: argparse stderr behavior unchanged (backward compat)."""`
			`result = subprocess.run(`
			`CLI + ['nonexistent-cmd'],`
			`cwd=REPO_ROOT,`
			`capture_output=True,`
			`text=True,`
			`)`
			`# Text mode still dumps argparse help to stderr`
			`assert 'invalid choice' in result.stderr`
			`assert result.returncode == 2`