Some checks failed
Deploy (Gitea) / deploy (push) Failing after 2s
- TUI agent-responds: hardened to detect and FAIL on cascade/exhausted responses (previously a separate WARN-only test that let real cascade failures slip through) - New TUI cascade-parsing test: /eval *provider-cascade* on screen, checks for clean keywords (no cl-dotenv quote artifacts) - Pre-warm step: sbcl --eval '(ql:quickload :passepartout/tui)' before launching tmux, cuts TUI startup from ~120s to ~10s - Removed test_agent_not_cascade_failure (absorbed into agent-responds) - New integration test: test-provider-cascade-parsing verifies PROVIDER_CASCADE entries are keywords without quotes, matching registered backends — catches the exact cl-dotenv quote bug - Fixed stop-daemon ghost symbol (removed export) and paren bug - Contract section updated with numbered Phase 2/3 items
114 lines
3.1 KiB
Bash
Executable File
114 lines
3.1 KiB
Bash
Executable File
#!/bin/bash
|
|
set -euo pipefail
|
|
|
|
PASS=0
|
|
FAIL=0
|
|
WARN=0
|
|
TUI_LOG="/tmp/passepartout-tui-test.log"
|
|
> "$TUI_LOG"
|
|
|
|
cleanup() {
|
|
tmux kill-session -t tui-test 2>/dev/null || true
|
|
}
|
|
trap cleanup EXIT
|
|
|
|
run_test() {
|
|
local name="$1"; shift
|
|
echo -n " $name ... "
|
|
if "$@" 2>/dev/null; then
|
|
echo "PASS"
|
|
PASS=$((PASS + 1))
|
|
else
|
|
echo "FAIL"
|
|
FAIL=$((FAIL + 1))
|
|
fi
|
|
}
|
|
|
|
# ---- Setup ----
|
|
echo "Pre-warming FASL cache (speeds up TUI start from ~120s to ~10s)..."
|
|
sbcl --noinform --load ~/quicklisp/setup.lisp \
|
|
--eval '(ql:quickload :passepartout/tui :silent t)' \
|
|
--eval '(uiop:quit)' 2>/dev/null &
|
|
WARM_PID=$!
|
|
wait $WARM_PID 2>/dev/null
|
|
echo " Pre-warm complete"
|
|
|
|
echo "Starting TUI in tmux (daemon must already be running on port 9105)..."
|
|
tmux new-session -d -s tui-test "passepartout tui 2>&1 | tee $TUI_LOG"
|
|
for i in $(seq 1 15); do
|
|
sleep 2
|
|
if tmux capture-pane -t tui-test -p 2>/dev/null | grep -q 'Connected v[0-9]'; then
|
|
echo " TUI ready after $((i*2))s"
|
|
break
|
|
fi
|
|
if [ "$i" -eq 15 ]; then
|
|
echo " WARNING: TUI did not render after 30s"
|
|
fi
|
|
done
|
|
|
|
# ---- Tests ----
|
|
|
|
test_agent_responds() {
|
|
# Full round-trip: TUI → daemon → LLM → daemon → TUI.
|
|
# Must contain a real agent response (⬇), NOT a cascade failure.
|
|
local before_ts
|
|
before_ts=$(date +%s)
|
|
tmux send-keys -t tui-test "Say hello in one word" Enter
|
|
while true; do
|
|
local pane
|
|
pane=$(tmux capture-pane -t tui-test -p -S -60 2>/dev/null)
|
|
if echo "$pane" | grep -q '⬇.*[a-zA-Z]\{3,\}'; then
|
|
if echo "$pane" | grep '⬇' | grep -qi 'cascade.*fail\|exhausted\|neural cascade'; then
|
|
echo "FAIL: agent responded with cascade failure, not LLM content" >&2
|
|
return 1
|
|
fi
|
|
return 0
|
|
fi
|
|
local now_ts
|
|
now_ts=$(date +%s)
|
|
if (( now_ts - before_ts > 60 )); then
|
|
echo "TIMEOUT: no agent response after 60s" >&2
|
|
return 1
|
|
fi
|
|
sleep 2
|
|
done
|
|
}
|
|
|
|
test_cascade_parsing() {
|
|
# Via /eval, check that *provider-cascade* contains clean keywords.
|
|
# This catches the cl-dotenv quote contamination bug.
|
|
tmux send-keys -t tui-test "/eval *provider-cascade*" Enter
|
|
sleep 3
|
|
local pane
|
|
pane=$(tmux capture-pane -t tui-test -p -S -15 2>/dev/null)
|
|
# Must contain keyword syntax :SOMETHING (not "SOMETHING with quotes)
|
|
echo "$pane" | grep -q ':DEEPSEEK\|:OPENROUTER\|:OPENAI\|:ANTHROPIC\|:GROQ\|:GEMINI\|:NVIDIA'
|
|
}
|
|
|
|
test_eval_command() {
|
|
tmux send-keys -t tui-test "/eval (+ 1 2)" Enter
|
|
sleep 3
|
|
tmux capture-pane -t tui-test -p -S -10 2>/dev/null | grep -q '=> 3'
|
|
}
|
|
|
|
test_status_bar() {
|
|
tmux capture-pane -t tui-test -p -S -20 2>/dev/null | grep -q 'msgs:'
|
|
}
|
|
|
|
test_connection_drop() {
|
|
sleep 1
|
|
tmux capture-pane -t tui-test -p -S -10 2>/dev/null | grep -qi 'connection.*lost\|ERROR.*Connection\|error.*connect' || true
|
|
return 0
|
|
}
|
|
|
|
run_test "agent-responds" test_agent_responds
|
|
run_test "cascade-parsing" test_cascade_parsing
|
|
run_test "eval-command" test_eval_command
|
|
run_test "status-bar" test_status_bar
|
|
run_test "connection-drop" test_connection_drop
|
|
|
|
# ---- Summary ----
|
|
echo ""
|
|
echo "===== $PASS passed, $FAIL failed, $WARN warnings ====="
|
|
exit $(( FAIL > 0 ? 1 : 0 ))
|