80 lines
2.8 KiB
Python
80 lines
2.8 KiB
Python
|
|
"""Harness: docker run <image> [cmd...] invocation patterns.
|
||
|
|
|
||
|
|
These tests MUST pass on the current tini-based image AND continue to
|
||
|
|
pass after the Phase 2 s6 migration. Any behavior drift is a regression.
|
||
|
|
|
||
|
|
The harness expects ``built_image`` and ``container_name`` fixtures from
|
||
|
|
``tests/docker/conftest.py``. When Docker isn't available every test
|
||
|
|
here is skipped at collection time.
|
||
|
|
"""
|
||
|
|
from __future__ import annotations
|
||
|
|
|
||
|
|
import subprocess
|
||
|
|
|
||
|
|
|
||
|
|
def test_no_args_starts_hermes(built_image: str) -> None:
|
||
|
|
"""``docker run <image>`` should start hermes cleanly.
|
||
|
|
|
||
|
|
We invoke ``--version`` so the call exits without needing a configured
|
||
|
|
model. Exit code may be 0 (printed version) or 1 (config bootstrapping
|
||
|
|
failure on a fresh volume), but never a stack trace.
|
||
|
|
"""
|
||
|
|
r = subprocess.run(
|
||
|
|
["docker", "run", "--rm", built_image, "--version"],
|
||
|
|
capture_output=True, text=True, timeout=60,
|
||
|
|
)
|
||
|
|
assert r.returncode in (0, 1), (
|
||
|
|
f"Unexpected exit {r.returncode}: stderr={r.stderr!r}"
|
||
|
|
)
|
||
|
|
assert "Traceback" not in r.stderr
|
||
|
|
|
||
|
|
|
||
|
|
def test_chat_subcommand_passthrough(built_image: str) -> None:
|
||
|
|
"""``docker run <image> chat --help`` should exec ``hermes chat --help``.
|
||
|
|
|
||
|
|
Uses ``--help`` so the call doesn't need an upstream model configured.
|
||
|
|
"""
|
||
|
|
r = subprocess.run(
|
||
|
|
["docker", "run", "--rm", built_image, "chat", "--help"],
|
||
|
|
capture_output=True, text=True, timeout=60,
|
||
|
|
)
|
||
|
|
assert r.returncode == 0
|
||
|
|
combined = (r.stdout + r.stderr).lower()
|
||
|
|
assert "chat" in combined or "usage" in combined
|
||
|
|
|
||
|
|
|
||
|
|
def test_bare_executable_passthrough(built_image: str) -> None:
|
||
|
|
"""``docker run <image> sleep 1`` should exec ``sleep`` directly.
|
||
|
|
|
||
|
|
The entrypoint detects that ``sleep`` is on PATH and routes around the
|
||
|
|
hermes wrapper. Useful for long-lived sandbox mode and for testing.
|
||
|
|
"""
|
||
|
|
r = subprocess.run(
|
||
|
|
["docker", "run", "--rm", built_image, "sleep", "1"],
|
||
|
|
capture_output=True, text=True, timeout=30,
|
||
|
|
)
|
||
|
|
assert r.returncode == 0
|
||
|
|
|
||
|
|
|
||
|
|
def test_bash_pattern(built_image: str) -> None:
|
||
|
|
"""``docker run <image> bash -c 'echo ok'`` should exec bash directly."""
|
||
|
|
r = subprocess.run(
|
||
|
|
["docker", "run", "--rm", built_image, "bash", "-c", "echo ok"],
|
||
|
|
capture_output=True, text=True, timeout=30,
|
||
|
|
)
|
||
|
|
assert r.returncode == 0
|
||
|
|
assert "ok" in r.stdout
|
||
|
|
|
||
|
|
|
||
|
|
def test_container_exit_code_matches_inner_exit(built_image: str) -> None:
|
||
|
|
"""The container exit code must match the inner process's exit code.
|
||
|
|
|
||
|
|
Critical for CI: ``docker run <image> hermes batch ...`` returns a
|
||
|
|
non-zero status when batch fails. Phase 2 (s6) must preserve this.
|
||
|
|
"""
|
||
|
|
r = subprocess.run(
|
||
|
|
["docker", "run", "--rm", built_image, "sh", "-c", "exit 42"],
|
||
|
|
capture_output=True, text=True, timeout=30,
|
||
|
|
)
|
||
|
|
assert r.returncode == 42
|