test: BATS coverage for supporting scripts (functional resilience + sr_resolve)

yasinBursali · claude · yasinBursali · commit eb944194e972 · 2026-04-29T04:18:48.000+03:00
test-functional-resilience.bats pins dream-test-functional.sh set -e resilience: summary emission even under all-fail, sentinel delivery, bounded set +e/-e around test functions (#428). test-sr-resolve.bats pins sr_resolve 8-case matrix including the dream- prefix strip added post-PR-10 (#430). Co-Authored-By: Claude Opus 4.7 (1M context) <noreply@anthropic.com>
diff --git a/dream-server/tests/bats-tests/test-functional-resilience.bats b/dream-server/tests/bats-tests/test-functional-resilience.bats
@@ -0,0 +1,162 @@
+#!/usr/bin/env bats
+# ============================================================================
+# BATS tests for scripts/dream-test-functional.sh set -e resilience.
+# ============================================================================
+# Guards against re-breakage of PR #428:
+#   - Arithmetic expansion (TESTS_FAILED=$((TESTS_FAILED + 1))) must not
+#     trip `set -e` on the first increment when the counter is 0.
+#   - The summary line and the final exit code must be emitted even when
+#     every underlying functional test fails.
+#   - `set +e / -e` bounded around the test-function dispatch block lets
+#     all tests run to completion before the summary.
+#
+# Note: the sentinel `__DREAM_RESULT__` is emitted by the Python streaming
+# endpoint (routers/setup.py), not by this shell script directly. The shell
+# just needs to exit with the right code so the endpoint can report it.
+# Sentinel-delivery itself is covered by PR-2F's Python tests.
+
+load '../bats/bats-support/load'
+load '../bats/bats-assert/load'
+
+setup() {
+    export TMPDIR_TEST="$BATS_TEST_TMPDIR"
+    export SCRIPT_SRC="$BATS_TEST_DIRNAME/../../scripts/dream-test-functional.sh"
+}
+
+# Build a patched copy of the script with test_*_functional() overridden.
+# Uses a single marker-insert to stick overrides just before the bounded
+# `set +e` dispatch block, so the rest of the script (strict mode, counters,
+# summary, exit logic) runs exactly as in production.
+_patch_script() {
+    local mode="$1"  # all-fail | all-pass | mixed
+    local out="$TMPDIR_TEST/patched-${mode}.sh"
+    local overrides_file="$TMPDIR_TEST/overrides-${mode}.sh"
+
+    # Stub bodies for each mode. Every stub runs `pass` or `fail`, which
+    # exist in the original script; those mutate the real counters.
+    case "$mode" in
+        all-fail)
+            cat > "$overrides_file" <<'OV'
+test_llm_functional()        { fail "LLM (stubbed)"; return 1; }
+test_tts_functional()        { fail "TTS (stubbed)"; return 1; }
+test_embeddings_functional() { fail "Embeddings (stubbed)"; return 1; }
+test_whisper_functional()    { fail "Whisper (stubbed)"; return 1; }
+OV
+            ;;
+        all-pass)
+            cat > "$overrides_file" <<'OV'
+test_llm_functional()        { pass "LLM (stubbed)"; }
+test_tts_functional()        { pass "TTS (stubbed)"; }
+test_embeddings_functional() { pass "Embeddings (stubbed)"; }
+test_whisper_functional()    { pass "Whisper (stubbed)"; }
+OV
+            ;;
+        mixed)
+            cat > "$overrides_file" <<'OV'
+test_llm_functional()        { pass "LLM (stubbed)"; }
+test_tts_functional()        { fail "TTS (stubbed)"; return 1; }
+test_embeddings_functional() { pass "Embeddings (stubbed)"; }
+test_whisper_functional()    { fail "Whisper (stubbed)"; return 1; }
+OV
+            ;;
+    esac
+
+    # Insert overrides at the marker — the line immediately before the
+    # bounded `set +e` dispatch block. BSD+GNU awk portable.
+    awk -v ov_file="$overrides_file" '
+        BEGIN {
+            while ((getline line < ov_file) > 0) overrides = overrides line "\n"
+            close(ov_file)
+        }
+        /^# Each test returns 1 on failure/ && !inserted {
+            printf "%s", overrides
+            inserted = 1
+        }
+        { print }
+    ' "$SCRIPT_SRC" > "$out"
+
+    # Neutralize the service-registry source block — it hard-depends on a
+    # full install layout that does not exist in tmpdir. Strip surgically
+    # by matching the opening `if [[ -f "$_FT_DIR/lib/service-registry.sh"`
+    # to its closing `fi`. The `declare -A SERVICE_PORTS` line that follows
+    # keeps the URL default-expansions safe.
+    awk '
+        /^if \[\[ -f "\$_FT_DIR\/lib\/service-registry\.sh" \]\]; then/ { in_block = 1; next }
+        in_block && /^fi$/ { in_block = 0; next }
+        !in_block { print }
+    ' "$out" > "$out.tmp" && mv "$out.tmp" "$out"
+
+    chmod +x "$out"
+    echo "$out"
+}
+
+# ── all-fail path — the core regression (PR #428) ───────────────────────────
+
+@test "resilience: summary line prints even when every test fails" {
+    local script
+    script=$(_patch_script all-fail)
+    run bash "$script"
+    # Script must exit 1 on any failure.
+    [ "$status" -eq 1 ]
+    # Summary must still appear.
+    assert_output --partial "Results: 0 passed, 4 failed"
+    assert_output --partial "Some functional tests failed"
+}
+
+@test "resilience: first fail call does not trip set -e at counter=0" {
+    # The critical regression this guards against: `((TESTS_FAILED++))` under
+    # set -e aborts the script on the FIRST call because the pre-increment
+    # value is 0 and compound arithmetic returns that as exit code. With the
+    # PR #428 fix (`TESTS_FAILED=$((TESTS_FAILED+1))`), the assignment form
+    # always returns 0. If the first fail aborts the script, we'd see "0
+    # passed, 1 failed" (only the first test ran). Assert we reached all 4.
+    local script
+    script=$(_patch_script all-fail)
+    run bash "$script"
+    assert_output --partial "4 failed"
+}
+
+# ── all-pass path ───────────────────────────────────────────────────────────
+
+@test "resilience: all-pass exits 0 with full summary" {
+    local script
+    script=$(_patch_script all-pass)
+    run bash "$script"
+    assert_success
+    assert_output --partial "Results: 4 passed, 0 failed"
+    assert_output --partial "All functional tests passed"
+}
+
+# ── mixed path (regression guard for bounded set +e / -e) ───────────────────
+
+@test "resilience: mixed pass/fail still runs every test and prints summary" {
+    local script
+    script=$(_patch_script mixed)
+    run bash "$script"
+    [ "$status" -eq 1 ]
+    # All 4 test functions ran (2 pass, 2 fail).
+    assert_output --partial "Results: 2 passed, 2 failed"
+}
+
+# ── static assertions on the resilience idioms in the script itself ─────────
+
+@test "resilience: script uses arithmetic-expansion assignment (not ((++)))" {
+    # TESTS_FAILED=$((TESTS_FAILED+1)) — the set-e-safe form.
+    run grep -E 'TESTS_FAILED=\$\(\(TESTS_FAILED[[:space:]]*\+' "$SCRIPT_SRC"
+    assert_success
+    # And must NOT contain the dangerous ((TESTS_FAILED++)) form.
+    run grep -E '\(\(TESTS_FAILED\+\+\)\)' "$SCRIPT_SRC"
+    assert_failure
+}
+
+@test "resilience: script has bounded 'set +e' / 'set -e' around test dispatch" {
+    run grep -n "^set +e" "$SCRIPT_SRC"
+    assert_success
+    run grep -n "^set -e" "$SCRIPT_SRC"
+    assert_success
+}
+
+@test "resilience: TESTS_PASSED also uses the set-e-safe assignment form" {
+    run grep -E 'TESTS_PASSED=\$\(\(TESTS_PASSED[[:space:]]*\+' "$SCRIPT_SRC"
+    assert_success
+}
diff --git a/dream-server/tests/bats-tests/test-sr-resolve.bats b/dream-server/tests/bats-tests/test-sr-resolve.bats
@@ -0,0 +1,171 @@
+#!/usr/bin/env bats
+# ============================================================================
+# BATS tests for sr_resolve in lib/service-registry.sh.
+# ============================================================================
+# Guards against re-breakage of the `dream-<id>` prefix-strip added in
+# PR #406 (container names pasted from `docker ps` should resolve to their
+# service IDs), and of the broader alias-resolution contract.
+#
+# 8-case matrix:
+#   1. Exact ID               →  resolves to the same ID
+#   2. Known alias            →  resolves to canonical ID
+#   3. `dream-<id>` prefix    →  strips prefix, resolves to ID
+#   4. `dream-<alias>` prefix →  strips prefix, resolves through alias
+#   5. Unknown `dream-*`      →  passes through as-is (not our container)
+#   6. Unknown non-dream      →  passes through as-is (best-effort)
+#   7. Empty input            →  passes through empty
+#   8. Container that happens to start with `dream-` but isn't our
+#      convention → passes through as-is (no alias match after strip)
+#
+# We invoke the registry inside a fresh `bash -c` subshell per test because
+# `declare -A` at the top of service-registry.sh creates function-local
+# arrays when the file is sourced from within bats' setup() (which is a
+# shell function). A subshell sources at top level, populating the globals
+# sr_resolve then actually reads.
+
+load '../bats/bats-support/load'
+load '../bats/bats-assert/load'
+
+setup() {
+    export TMPDIR_TEST="$BATS_TEST_TMPDIR"
+    export FIXTURE_DIR="$TMPDIR_TEST/fixture"
+    export REGISTRY_PATH="$BATS_TEST_DIRNAME/../../lib/service-registry.sh"
+
+    # Fake EXTENSIONS_DIR so sr_load's Python loader has something to read.
+    mkdir -p "$FIXTURE_DIR/extensions/services"
+
+    # Service A — id "alpha", aliases [a, al]
+    mkdir -p "$FIXTURE_DIR/extensions/services/alpha"
+    cat > "$FIXTURE_DIR/extensions/services/alpha/manifest.yaml" <<'YAML'
+schema_version: dream.services.v1
+service:
+  id: alpha
+  name: Alpha Service
+  aliases: [a, al]
+  container_name: dream-alpha
+  category: core
+YAML
+
+    # Service B — id "bravo", aliases [b]
+    mkdir -p "$FIXTURE_DIR/extensions/services/bravo"
+    cat > "$FIXTURE_DIR/extensions/services/bravo/manifest.yaml" <<'YAML'
+schema_version: dream.services.v1
+service:
+  id: bravo
+  name: Bravo Service
+  aliases: [b]
+  container_name: dream-bravo
+  category: recommended
+YAML
+
+    command -v python3 >/dev/null 2>&1 || skip "python3 not available"
+    python3 -c "import yaml" 2>/dev/null || skip "PyYAML not available"
+}
+
+# Resolve `$1` using a freshly-loaded registry against the fixture.
+# Runs in a subshell so `declare -A` lines in service-registry.sh create
+# true globals (not function-locals under bats' setup()).
+# stderr is suppressed so we only assert on stdout — empty input legitimately
+# triggers "bad array index" diagnostics from bash for SERVICE_ALIASES[""]
+# which are not part of the contract we're pinning.
+_sr() {
+    bash -c '
+        SCRIPT_DIR="'"$FIXTURE_DIR"'"
+        export SCRIPT_DIR
+        . "'"$REGISTRY_PATH"'"
+        sr_resolve "$1" 2>/dev/null
+    ' _ "$1"
+}
+
+# ── the 8-case matrix ───────────────────────────────────────────────────────
+
+@test "sr_resolve: case 1 — exact ID resolves to same ID" {
+    run _sr "alpha"
+    assert_success
+    assert_output "alpha"
+}
+
+@test "sr_resolve: case 2 — known alias resolves to canonical ID" {
+    run _sr "a"
+    assert_success
+    assert_output "alpha"
+
+    run _sr "al"
+    assert_success
+    assert_output "alpha"
+
+    run _sr "b"
+    assert_success
+    assert_output "bravo"
+}
+
+@test "sr_resolve: case 3 — dream-<id> prefix strips and resolves" {
+    # This is the PR-10 / #406 regression point: users copy container names
+    # from `docker ps` (e.g. `dream-alpha`) and expect `dream restart` to
+    # accept them.
+    run _sr "dream-alpha"
+    assert_success
+    assert_output "alpha"
+}
+
+@test "sr_resolve: case 4 — dream-<alias> prefix strips and resolves through alias" {
+    run _sr "dream-a"
+    assert_success
+    assert_output "alpha"
+
+    run _sr "dream-b"
+    assert_success
+    assert_output "bravo"
+}
+
+@test "sr_resolve: case 5 — unknown dream-* passes through as-is" {
+    # Container that starts with `dream-` but whose stripped form isn't a
+    # known alias: return the input verbatim (best-effort; compose will
+    # fail later with a clear error).
+    run _sr "dream-unknown-service"
+    assert_success
+    assert_output "dream-unknown-service"
+}
+
+@test "sr_resolve: case 6 — unknown non-dream passes through as-is" {
+    run _sr "not-a-service"
+    assert_success
+    assert_output "not-a-service"
+}
+
+@test "sr_resolve: case 7 — empty input returns empty" {
+    run _sr ""
+    assert_success
+    # Empty input hits SERVICE_ALIASES[""] (unset) and falls back to echoing
+    # the input (also empty). No crash, no stderr.
+    assert_output ""
+}
+
+@test "sr_resolve: case 8 — dream-* where strip doesn't match any alias passes through" {
+    # Container name-like string that isn't from our extensions and whose
+    # stripped form doesn't collide with any known alias.
+    run _sr "dream-some-other-project-container"
+    assert_success
+    assert_output "dream-some-other-project-container"
+}
+
+# ── additional correctness guards ───────────────────────────────────────────
+
+@test "sr_resolve: does NOT strip dream- when the full input is already a known alias" {
+    # The resolver checks SERVICE_ALIASES[input] first, only stripping if
+    # missing. We prove the ordering holds by asserting plain `bravo` still
+    # resolves even though `dream-bravo` is its container name.
+    run _sr "bravo"
+    assert_success
+    assert_output "bravo"
+}
+
+@test "sr_resolve: idempotent — resolving twice yields same result" {
+    run _sr "dream-a"
+    assert_success
+    [ "$output" = "alpha" ]
+
+    run _sr "$output"
+    assert_success
+    [ "$output" = "alpha" ]
+}