# disinto/lib/agent-session.sh

#!/usr/bin/env bash
# agent-session.sh — Shared tmux + Claude interactive session helpers
#
# Source this into agent orchestrator scripts for reusable session management.
#
# Functions:
#   agent_wait_for_claude_ready SESSION_NAME [TIMEOUT_SECS]
#   agent_inject_into_session   SESSION_NAME TEXT
#   agent_kill_session          SESSION_NAME
#   monitor_phase_loop          PHASE_FILE IDLE_TIMEOUT_SECS CALLBACK_FN [SESSION_NAME]
#   session_lock_acquire        [TIMEOUT_SECS]
#   session_lock_release

# --- Cooperative session lock (fd-based) ---
# File descriptor number of the open session lock file; empty until the lock
# file has been opened. Populated the first time create_agent_session() or
# session_lock_acquire() runs with it still empty.
# Callers can release/re-acquire via session_lock_release/session_lock_acquire
# to allow other Claude sessions during idle phases (awaiting_review/awaiting_ci).
SESSION_LOCK_FD=""

# Drop the session lock while leaving its file descriptor open, so that a
# later session_lock_acquire can take the lock again on the same fd.
# No-op (status 0) when SESSION_LOCK_FD is empty; otherwise returns the
# exit status of `flock -u`.
session_lock_release() {
  [ -n "${SESSION_LOCK_FD:-}" ] || return 0
  flock -u "$SESSION_LOCK_FD"
}

# Take the session lock, waiting at most the given number of seconds.
# When SESSION_LOCK_FD is still empty, ${HOME}/.claude/session.lock is opened
# first (append mode, directory created on demand) and the new fd number is
# stored in SESSION_LOCK_FD, so external callers need no prior setup.
# Args: [timeout_secs] (default 300)
# Returns the exit status of `flock -w`: 0 once the lock is held, non-zero
# on timeout or error.
# shellcheck disable=SC2120  # timeout arg is used by external callers
session_lock_acquire() {
  local wait_secs="${1:-300}"
  if [ -z "${SESSION_LOCK_FD:-}" ]; then
    local lock_path="${HOME}/.claude/session.lock"
    mkdir -p "${lock_path%/*}"
    exec {SESSION_LOCK_FD}>>"$lock_path"
  fi
  flock -w "$wait_secs" "$SESSION_LOCK_FD"
}

# Poll a tmux pane until the Claude ❯ prompt character shows up in it.
# The pane is captured every 2 seconds; a failing capture counts as
# "not ready yet".
# Args: session_name [timeout_secs] (default 120)
# Returns 0 as soon as the prompt is seen, 1 once the timeout has elapsed.
agent_wait_for_claude_ready() {
  local session="$1"
  local timeout="${2:-120}"
  local step=2
  local waited=0
  while [ "$waited" -lt "$timeout" ]; do
    tmux capture-pane -t "$session" -p 2>/dev/null | grep -q '❯' && return 0
    sleep "$step"
    waited=$((waited + step))
  done
  return 1
}

# Deliver TEXT to the Claude prompt running in tmux SESSION and submit it.
# The text travels through a temp file and a named tmux paste buffer so it
# arrives verbatim regardless of quoting or length, followed by Enter.
# Lock re-acquisition and the readiness wait are best-effort: the text is
# injected even if either of them fails.
# Args: session_name text
agent_inject_into_session() {
  local session="$1"
  local text="$2"
  local buffer_name="agent-inject-$$"
  local payload_file
  # Claude is about to resume work, so take the session lock back first.
  # shellcheck disable=SC2119  # using default timeout
  session_lock_acquire || true
  agent_wait_for_claude_ready "$session" 120 || true
  # New work is incoming: drop the idle marker left by the Stop hook.
  rm -f "/tmp/claude-idle-${session}.ts"
  payload_file=$(mktemp /tmp/agent-inject-XXXXXX)
  printf '%s' "$text" > "$payload_file"
  tmux load-buffer -b "$buffer_name" "$payload_file"
  tmux paste-buffer -t "$session" -b "$buffer_name"
  # Give the pane a moment to take in the paste before submitting it.
  sleep 0.5
  tmux send-keys -t "$session" "" Enter
  tmux delete-buffer -b "$buffer_name" 2>/dev/null || true
  rm -f "$payload_file"
}

# Register CMD as a "command" hook for EVENT in a Claude settings.json file.
# The file is created when missing. When it exists, a new entry is appended
# to .hooks[EVENT] unless an entry with the same command is already present,
# so repeated calls are idempotent.
# The result is staged in "<settings>.tmp" and only moved into place when jq
# succeeds; on failure the staged file is removed and the settings file is
# left exactly as it was (or absent).
# Args: settings_file event matcher command
# Returns 0 on success, jq's (or the redirection's) non-zero status otherwise.
_agent_session_install_hook() {
  local settings="$1"
  local event="$2"
  local matcher="$3"
  local cmd="$4"
  local staged="${settings}.tmp"
  local rc=0
  # One filter serves both cases: with a null input (jq -n) the assignment
  # builds {"hooks": {EVENT: [entry]}} from scratch.
  # shellcheck disable=SC2016  # $event/$matcher/$cmd are jq variables
  local filter='
    if (.hooks[$event] // [] | any(.[]; .hooks[]?.command == $cmd))
    then .
    else .hooks[$event] = (.hooks[$event] // []) + [{
      matcher: $matcher,
      hooks: [{type: "command", command: $cmd}]
    }]
    end
  '
  if [ -f "$settings" ]; then
    jq --arg event "$event" --arg matcher "$matcher" --arg cmd "$cmd" \
      "$filter" "$settings" > "$staged" || rc=$?
  else
    jq -n --arg event "$event" --arg matcher "$matcher" --arg cmd "$cmd" \
      "$filter" > "$staged" || rc=$?
  fi
  if [ "$rc" -ne 0 ]; then
    rm -f "$staged"
    return "$rc"
  fi
  mv "$staged" "$settings"
}

# Create a tmux session running Claude in the given workdir.
#
# Before starting Claude, hooks are registered in WORKDIR/.claude/settings.json
# for every hook script under ${FACTORY_ROOT}/lib/hooks that is executable:
#   Stop         on-idle-stop.sh        idle detection (see monitor_phase_loop)
#   PostToolUse  on-phase-change.sh     phase file write detection   [phase_file only]
#   StopFailure  on-stop-failure.sh     phase update on API error    [phase_file only]
#   PreToolUse   on-pretooluse-guard.sh guard for destructive Bash operations
#   SessionEnd   on-session-end.sh      exit marker for fast crash detection
#   SessionStart on-compact-reinject.sh context re-injection         [phase_file only]
# Hook installation is best-effort: a failing jq never aborts session creation.
# Stale idle/exit markers for SESSION (and the phase-changed marker, when its
# hook is installed) are removed.
#
# Globals read: FACTORY_ROOT, PRIMARY_BRANCH (default "main"), CLAUDE_MODEL,
#               HOME (via session_lock_acquire).
# Globals written: SESSION_LOCK_FD (via session_lock_acquire).
# Args: session workdir [phase_file]
# Returns 0 if session is ready, 1 otherwise (lock not obtained within 300s,
# tmux session missing after start, or Claude prompt not seen within 120s).
create_agent_session() {
  local session="$1"
  local workdir="${2:-.}"
  local phase_file="${3:-}"

  # Prepare settings directory for hooks
  mkdir -p "${workdir}/.claude"
  local settings="${workdir}/.claude/settings.json"
  local hooks_dir="${FACTORY_ROOT}/lib/hooks"

  # Marker files shared with the hook scripts and monitor_phase_loop.
  local idle_marker="/tmp/claude-idle-${session}.ts"
  local phase_marker="/tmp/phase-changed-${session}.marker"
  local exit_marker="/tmp/claude-exited-${session}.ts"

  # Stop hook for idle detection: when Claude finishes a response, the hook
  # writes a timestamp to a marker file. monitor_phase_loop checks this
  # marker instead of fragile tmux pane scraping.
  local idle_hook="${hooks_dir}/on-idle-stop.sh"
  if [ -x "$idle_hook" ]; then
    local idle_cmd="${idle_hook} ${idle_marker}"
    # When a phase file is available, pass it and the session name so the
    # hook can nudge Claude if it returns to the prompt without signalling.
    if [ -n "$phase_file" ]; then
      idle_cmd="${idle_cmd} ${phase_file} ${session}"
    fi
    _agent_session_install_hook "$settings" "Stop" "" "$idle_cmd" || true
  fi

  if [ -n "$phase_file" ]; then
    # PostToolUse hook for phase file write detection: when Claude writes to
    # the phase file via Bash or Write, the hook writes a marker so
    # monitor_phase_loop can react immediately instead of waiting for the
    # next mtime-based poll cycle.
    local phase_hook="${hooks_dir}/on-phase-change.sh"
    if [ -x "$phase_hook" ]; then
      _agent_session_install_hook "$settings" "PostToolUse" "Bash|Write" \
        "${phase_hook} ${phase_file} ${phase_marker}" || true
      rm -f "$phase_marker"
    fi

    # StopFailure hook for immediate phase file update on API error: when
    # Claude hits a rate limit, server error, billing error, or auth failure,
    # the hook writes PHASE:failed to the phase file and touches the
    # phase-changed marker so monitor_phase_loop picks it up within one poll
    # cycle instead of waiting for idle timeout (up to 2 hours).
    local stop_failure_hook="${hooks_dir}/on-stop-failure.sh"
    if [ -x "$stop_failure_hook" ]; then
      _agent_session_install_hook "$settings" "StopFailure" \
        "rate_limit|server_error|authentication_failed|billing_error" \
        "${stop_failure_hook} ${phase_file} ${phase_marker}" || true
    fi
  fi

  # PreToolUse hook for destructive operation guard: blocks force push to
  # primary branch, rm -rf outside worktree, direct API merge calls, and
  # checkout/switch to primary branch.  Claude sees the denial reason on
  # exit 2 and can self-correct.
  local guard_hook="${hooks_dir}/on-pretooluse-guard.sh"
  if [ -x "$guard_hook" ]; then
    local abs_workdir
    # cd output is silenced so a set CDPATH cannot leak into the path.
    abs_workdir=$(cd "$workdir" >/dev/null 2>&1 && pwd) || abs_workdir="$workdir"
    _agent_session_install_hook "$settings" "PreToolUse" "Bash" \
      "${guard_hook} ${PRIMARY_BRANCH:-main} ${abs_workdir} ${session}" || true
  fi

  # SessionEnd hook for guaranteed cleanup: when the Claude session exits
  # (clean or crash), write a termination marker so monitor_phase_loop
  # detects the exit faster than tmux has-session polling alone.
  local session_end_hook="${hooks_dir}/on-session-end.sh"
  if [ -x "$session_end_hook" ]; then
    _agent_session_install_hook "$settings" "SessionEnd" "" \
      "${session_end_hook} ${exit_marker}" || true
  fi
  rm -f "$exit_marker"

  # SessionStart hook for context re-injection after compaction: when Claude
  # Code compacts context during long sessions, the phase protocol
  # instructions are lost. This hook fires after each compaction and outputs
  # the content of a context file so Claude retains critical instructions.
  # The context file is written by callers via write_compact_context().
  if [ -n "$phase_file" ]; then
    local compact_hook="${hooks_dir}/on-compact-reinject.sh"
    if [ -x "$compact_hook" ]; then
      local context_file="${phase_file%.phase}.context"
      _agent_session_install_hook "$settings" "SessionStart" "compact" \
        "${compact_hook} ${context_file}" || true
    fi
  fi

  rm -f "$idle_marker"
  local model_flag=""
  if [ -n "${CLAUDE_MODEL:-}" ]; then
    model_flag="--model ${CLAUDE_MODEL}"
  fi

  # Acquire a session-level mutex via fd-based flock to prevent concurrent
  # Claude sessions from racing on OAuth token refresh.  Unlike the previous
  # command-wrapper flock, the fd approach allows callers to release the lock
  # during idle phases (awaiting_review/awaiting_ci) and re-acquire before
  # injecting the next prompt.  See #724.
  # session_lock_acquire uses ~/.claude/session.lock so the lock is shared
  # across containers when the host ~/.claude directory is bind-mounted.
  session_lock_acquire 300 || return 1

  # tmux hands the command string to a shell, so the flag is passed as text.
  local claude_cmd="claude --dangerously-skip-permissions ${model_flag}"

  tmux new-session -d -s "$session" -c "$workdir" \
    "$claude_cmd" 2>/dev/null
  sleep 1
  tmux has-session -t "$session" 2>/dev/null || return 1
  agent_wait_for_claude_ready "$session" 120 || return 1
  return 0
}

# Inject a prompt/formula into a session (alias for agent_inject_into_session).
# All arguments are forwarded unchanged; agent_inject_into_session reads only
# the first two (session name, text), so any further arguments have no effect.
# Returns whatever agent_inject_into_session returns.
inject_formula() {
  agent_inject_into_session "$@"
}

# Monitor a phase file, calling a callback on changes and handling idle timeout.
# Sets _MONITOR_LOOP_EXIT to the exit reason (idle_timeout, idle_prompt, done, crashed, PHASE:failed, PHASE:escalate).
# Sets _MONITOR_SESSION to the resolved session name (arg 4 or $SESSION_NAME).
#   Callbacks should reference _MONITOR_SESSION instead of $SESSION_NAME directly.
# Sets LAST_PHASE_MTIME to the mtime of the phase file each time a change is processed.
# Args: phase_file idle_timeout_secs callback_fn [session_name]
#   callback_fn  — invoked with the phase string as its only argument; skipped
#                  silently when no command/function of that name exists
#   session_name — tmux session to health-check; falls back to $SESSION_NAME global
# Env: PHASE_POLL_INTERVAL — seconds between polls (default 10)
# Returns: 1 when the session is gone and the callback did not bring it back
#          ("crashed"); 0 for every other exit reason.
#
# The callback receives:
#   "PHASE:crashed"  when the session ended without a terminal phase
#   "PHASE:failed"   when the session was killed for sitting idle at the prompt
#   the phase string whenever the phase file changed (terminal or not)
# On idle_timeout the session is killed and the callback is NOT invoked.
#
# Idle detection: uses a Stop hook marker file (written by lib/hooks/on-idle-stop.sh)
# to detect when Claude finishes responding without writing a phase signal.
# If the marker exists for 3 consecutive polls with no phase written, the session
# is killed and the callback invoked with "PHASE:failed".
monitor_phase_loop() {
  local phase_file="$1"
  local idle_timeout="$2"
  local callback="$3"
  local _session="${4:-${SESSION_NAME:-}}"
  # Export resolved session name so callbacks can reference it regardless of
  # which session was passed to monitor_phase_loop (analogous to _MONITOR_LOOP_EXIT).
  export _MONITOR_SESSION="$_session"
  local poll_interval="${PHASE_POLL_INTERVAL:-10}"
  # mtime of the phase file at the last processed change (0 = nothing processed yet)
  local last_mtime=0
  # seconds accumulated since the last processed phase change or crash recovery
  local idle_elapsed=0
  # consecutive polls in which the idle marker existed and the phase was empty
  local idle_pane_count=0

  while true; do
    # Sleep first: every check below happens one poll interval after the
    # previous iteration (and after the call itself on the first pass).
    sleep "$poll_interval"
    idle_elapsed=$(( idle_elapsed + poll_interval ))

    # Session health check: SessionEnd hook marker provides fast detection,
    # tmux has-session is the fallback for unclean exits (e.g. tmux crash).
    local exit_marker="/tmp/claude-exited-${_session}.ts"
    if [ -f "$exit_marker" ] || ! tmux has-session -t "${_session}" 2>/dev/null; then
      local current_phase
      current_phase=$(head -1 "$phase_file" 2>/dev/null | tr -d '[:space:]' || true)
      case "$current_phase" in
        PHASE:done|PHASE:failed|PHASE:merged|PHASE:escalate)
          ;; # terminal — fall through to phase handler
        *)
          # Call callback with "crashed" — let agent-specific code handle recovery
          if type "${callback}" &>/dev/null; then
            "$callback" "PHASE:crashed"
          fi
          # If callback didn't restart session, break
          if ! tmux has-session -t "${_session}" 2>/dev/null; then
            _MONITOR_LOOP_EXIT="crashed"
            return 1
          fi
          # Session is back: start idle accounting from scratch.
          idle_elapsed=0
          idle_pane_count=0
          continue
          ;;
      esac
    fi

    # Check phase-changed marker from PostToolUse hook — if present, the hook
    # detected a phase file write so we reset last_mtime to force processing
    # this cycle instead of waiting for the next mtime change.
    local phase_marker="/tmp/phase-changed-${_session}.marker"
    if [ -f "$phase_marker" ]; then
      rm -f "$phase_marker"
      last_mtime=0
    fi

    # Check phase file for changes (mtime falls back to 0 when stat fails,
    # e.g. the file does not exist yet)
    local phase_mtime
    phase_mtime=$(stat -c %Y "$phase_file" 2>/dev/null || echo 0)
    local current_phase
    current_phase=$(head -1 "$phase_file" 2>/dev/null | tr -d '[:space:]' || true)

    if [ -z "$current_phase" ] || [ "$phase_mtime" -le "$last_mtime" ]; then
      # No phase change — check idle timeout
      if [ "$idle_elapsed" -ge "$idle_timeout" ]; then
        _MONITOR_LOOP_EXIT="idle_timeout"
        agent_kill_session "${_session}"
        return 0
      fi
      # Idle detection via Stop hook: the on-idle-stop.sh hook writes a marker
      # file when Claude finishes a response. If the marker exists and no phase
      # has been written, Claude returned to the prompt without following the
      # phase protocol. 3 consecutive polls = confirmed idle (not mid-turn).
      local idle_marker="/tmp/claude-idle-${_session}.ts"
      if [ -z "$current_phase" ] && [ -f "$idle_marker" ]; then
        idle_pane_count=$(( idle_pane_count + 1 ))
        if [ "$idle_pane_count" -ge 3 ]; then
          _MONITOR_LOOP_EXIT="idle_prompt"
          # Session is killed before the callback is invoked.
          # Callbacks that handle PHASE:failed must not assume the session is alive.
          agent_kill_session "${_session}"
          if type "${callback}" &>/dev/null; then
            "$callback" "PHASE:failed"
          fi
          return 0
        fi
      else
        # Marker gone or a phase is present: the streak is broken.
        idle_pane_count=0
      fi
      continue
    fi

    # Phase changed
    last_mtime="$phase_mtime"
    # shellcheck disable=SC2034  # read by phase-handler.sh callback
    LAST_PHASE_MTIME="$phase_mtime"
    idle_elapsed=0
    idle_pane_count=0

    # Terminal phases: notify the callback once, then stop monitoring.
    case "$current_phase" in
      PHASE:done|PHASE:merged)
        _MONITOR_LOOP_EXIT="done"
        if type "${callback}" &>/dev/null; then
          "$callback" "$current_phase"
        fi
        return 0
        ;;
      PHASE:failed|PHASE:escalate)
        _MONITOR_LOOP_EXIT="$current_phase"
        if type "${callback}" &>/dev/null; then
          "$callback" "$current_phase"
        fi
        return 0
        ;;
    esac

    # Non-terminal phase — call callback and keep polling
    if type "${callback}" &>/dev/null; then
      "$callback" "$current_phase"
    fi
  done
}

# Store CONTENT (plus a trailing newline) in the context file that belongs to
# PHASE_FILE, for re-injection after context compaction. The context file
# path is PHASE_FILE with a trailing ".phase" stripped (if present) and
# ".context" appended; the SessionStart compact hook is given the same path.
# Args: phase_file content
write_compact_context() {
  local phase_file="$1"
  local content="$2"
  printf '%s\n' "$content" > "${phase_file%.phase}.context"
}

# Tear down a tmux session and remove the /tmp marker files tied to its name
# (idle, phase-changed, exited, nudge counter).
# tmux is only invoked for a non-empty session name, and its failure (e.g.
# session not found) is ignored; the marker files are removed either way.
# Args: [session_name]
agent_kill_session() {
  local session="${1:-}"
  local stale
  if [ -n "$session" ]; then
    tmux kill-session -t "$session" 2>/dev/null || true
  fi
  for stale in \
    "/tmp/claude-idle-${session}.ts" \
    "/tmp/phase-changed-${session}.marker" \
    "/tmp/claude-exited-${session}.ts" \
    "/tmp/claude-nudge-${session}.count"; do
    rm -f "$stale"
  done
}

# Print the first line of a phase file with all whitespace removed.
# Prints nothing when the file is missing or unreadable; the read error is
# swallowed so the pipeline still succeeds under `set -o pipefail`.
# Usage: read_phase [file]  — defaults to $PHASE_FILE
read_phase() {
  local phase_path="${1:-${PHASE_FILE:-}}"
  { head -n 1 "$phase_path" 2>/dev/null || true; } | tr -d '[:space:]'
}
-												refactor: extract lib/agent-session.sh — reusable tmux + Claude agent runtime (#158)

Move generic agent infrastructure from dev/dev-agent.sh into lib/agent-session.sh:
- log, status, notify, notify_ctx, read_phase, wait_for_claude_ready,
  inject_into_session, kill_tmux_session extracted verbatim
- create_agent_session(session_name, workdir) — new: tmux session creation
- inject_formula(session_name, formula_text, context) — new: prompt injection
- monitor_phase_loop(phase_file, idle_timeout, callback_fn) — new: phase loop
  with session health check, crash recovery, and idle timeout detection

dev-agent.sh: sources the library, implements _on_phase_change() callback,
calls monitor_phase_loop(); idle-timeout and crash-recovery-failed cleanup
handled via _MONITOR_LOOP_EXIT signal variable. Behavior unchanged.

											
										
										
											2026-03-18 14:36:36 +00:00
+								#!/usr/bin/env bash
-												fix: feat: gardener-agent.sh — tmux + Claude interactive gardener using agent-session.sh (#159) (#163)

Fixes #159

## Changes
Add gardener-agent.sh (tmux+Claude) and lib/agent-session.sh (shared helpers). gardener-poll.sh slimmed to cron wrapper; grooming delegated to new agent; recipe engine for CI escalations unchanged.

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/163
Reviewed-by: review_bot <review_bot@noreply.codeberg.org>

											
										
										
											2026-03-18 16:21:07 +01:00
+								# agent-session.sh — Shared tmux + Claude interactive session helpers
-												refactor: extract lib/agent-session.sh — reusable tmux + Claude agent runtime (#158)

Move generic agent infrastructure from dev/dev-agent.sh into lib/agent-session.sh:
- log, status, notify, notify_ctx, read_phase, wait_for_claude_ready,
  inject_into_session, kill_tmux_session extracted verbatim
- create_agent_session(session_name, workdir) — new: tmux session creation
- inject_formula(session_name, formula_text, context) — new: prompt injection
- monitor_phase_loop(phase_file, idle_timeout, callback_fn) — new: phase loop
  with session health check, crash recovery, and idle timeout detection

dev-agent.sh: sources the library, implements _on_phase_change() callback,
calls monitor_phase_loop(); idle-timeout and crash-recovery-failed cleanup
handled via _MONITOR_LOOP_EXIT signal variable. Behavior unchanged.

											
										
										
											2026-03-18 14:36:36 +00:00
+								#
-												fix: feat: gardener-agent.sh — tmux + Claude interactive gardener using agent-session.sh (#159) (#163)

Fixes #159

## Changes
Add gardener-agent.sh (tmux+Claude) and lib/agent-session.sh (shared helpers). gardener-poll.sh slimmed to cron wrapper; grooming delegated to new agent; recipe engine for CI escalations unchanged.

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/163
Reviewed-by: review_bot <review_bot@noreply.codeberg.org>

											
										
										
											2026-03-18 16:21:07 +01:00
+								# Source this into agent orchestrator scripts for reusable session management.
-												refactor: extract lib/agent-session.sh — reusable tmux + Claude agent runtime (#158)

Move generic agent infrastructure from dev/dev-agent.sh into lib/agent-session.sh:
- log, status, notify, notify_ctx, read_phase, wait_for_claude_ready,
  inject_into_session, kill_tmux_session extracted verbatim
- create_agent_session(session_name, workdir) — new: tmux session creation
- inject_formula(session_name, formula_text, context) — new: prompt injection
- monitor_phase_loop(phase_file, idle_timeout, callback_fn) — new: phase loop
  with session health check, crash recovery, and idle timeout detection

dev-agent.sh: sources the library, implements _on_phase_change() callback,
calls monitor_phase_loop(); idle-timeout and crash-recovery-failed cleanup
handled via _MONITOR_LOOP_EXIT signal variable. Behavior unchanged.

											
										
										
											2026-03-18 14:36:36 +00:00
+								#
-												fix: feat: gardener-agent.sh — tmux + Claude interactive gardener using agent-session.sh (#159) (#163)

Fixes #159

## Changes
Add gardener-agent.sh (tmux+Claude) and lib/agent-session.sh (shared helpers). gardener-poll.sh slimmed to cron wrapper; grooming delegated to new agent; recipe engine for CI escalations unchanged.

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/163
Reviewed-by: review_bot <review_bot@noreply.codeberg.org>

											
										
										
											2026-03-18 16:21:07 +01:00
+								# Functions:
 								#   agent_wait_for_claude_ready SESSION_NAME [TIMEOUT_SECS]
 								#   agent_inject_into_session   SESSION_NAME TEXT
 								#   agent_kill_session          SESSION_NAME
-												fix: agent-session.sh: monitor_phase_loop should accept SESSION_NAME as a parameter (#187)

Add optional 4th parameter to monitor_phase_loop for SESSION_NAME,
falling back to the $SESSION_NAME global for backwards-compatibility.
Document the full function signature in both the file header and inline comment.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-18 20:15:14 +00:00
+								#   monitor_phase_loop          PHASE_FILE IDLE_TIMEOUT_SECS CALLBACK_FN [SESSION_NAME]
-												fix: Session lock must not block during idle phases (awaiting_review/awaiting_ci) (#724)

Restructure session.lock from command-wrapper flock to fd-based flock so
the lock can be released when Claude is idle and re-acquired before
injecting the next prompt.

- agent-session.sh: add session_lock_acquire/release helpers, open fd in
  create_agent_session instead of wrapping claude with flock, auto-acquire
  in agent_inject_into_session before injecting
- phase-handler.sh: call session_lock_release at start of awaiting_ci and
  awaiting_review handlers (Claude is idle during CI polling / review wait)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-26 10:11:50 +00:00
+								#   session_lock_acquire        [TIMEOUT_SECS]
 								#   session_lock_release
 								# --- Cooperative session lock (fd-based) ---
 								# File descriptor for the session lock. Set by create_agent_session().
 								# Callers can release/re-acquire via session_lock_release/session_lock_acquire
 								# to allow other Claude sessions during idle phases (awaiting_review/awaiting_ci).
 								SESSION_LOCK_FD=""
 								# Release the session lock without closing the file descriptor.
 								# The fd stays open so it can be re-acquired later.
 								session_lock_release() {
 								  if [ -n "${SESSION_LOCK_FD:-}" ]; then
 								    flock -u "$SESSION_LOCK_FD"
 								  fi
 								}
 								# Re-acquire the session lock. Blocks until available or timeout.
 								# Opens the lock fd if not already open (for use by external callers).
 								# Args: [timeout_secs] (default 300)
 								# Returns 0 on success, 1 on timeout/error.
 								# shellcheck disable=SC2120  # timeout arg is used by external callers
 								session_lock_acquire() {
 								  local timeout="${1:-300}"
 								  if [ -z "${SESSION_LOCK_FD:-}" ]; then
 								    local lock_dir="${HOME}/.claude"
 								    mkdir -p "$lock_dir"
 								    exec {SESSION_LOCK_FD}>>"${lock_dir}/session.lock"
 								  fi
 								  flock -w "$timeout" "$SESSION_LOCK_FD"
 								}
-												refactor: extract lib/agent-session.sh — reusable tmux + Claude agent runtime (#158)

Move generic agent infrastructure from dev/dev-agent.sh into lib/agent-session.sh:
- log, status, notify, notify_ctx, read_phase, wait_for_claude_ready,
  inject_into_session, kill_tmux_session extracted verbatim
- create_agent_session(session_name, workdir) — new: tmux session creation
- inject_formula(session_name, formula_text, context) — new: prompt injection
- monitor_phase_loop(phase_file, idle_timeout, callback_fn) — new: phase loop
  with session health check, crash recovery, and idle timeout detection

dev-agent.sh: sources the library, implements _on_phase_change() callback,
calls monitor_phase_loop(); idle-timeout and crash-recovery-failed cleanup
handled via _MONITOR_LOOP_EXIT signal variable. Behavior unchanged.

											
										
										
											2026-03-18 14:36:36 +00:00
-												fix: feat: gardener-agent.sh — tmux + Claude interactive gardener using agent-session.sh (#159) (#163)

Fixes #159

## Changes
Add gardener-agent.sh (tmux+Claude) and lib/agent-session.sh (shared helpers). gardener-poll.sh slimmed to cron wrapper; grooming delegated to new agent; recipe engine for CI escalations unchanged.

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/163
Reviewed-by: review_bot <review_bot@noreply.codeberg.org>

											
										
										
											2026-03-18 16:21:07 +01:00
+								# Wait for the Claude ❯ ready prompt in a tmux pane.
 								# Returns 0 if ready within TIMEOUT_SECS (default 120), 1 otherwise.
 								agent_wait_for_claude_ready() {
 								  local session="$1"
 								  local timeout="${2:-120}"
-												refactor: extract lib/agent-session.sh — reusable tmux + Claude agent runtime (#158)

Move generic agent infrastructure from dev/dev-agent.sh into lib/agent-session.sh:
- log, status, notify, notify_ctx, read_phase, wait_for_claude_ready,
  inject_into_session, kill_tmux_session extracted verbatim
- create_agent_session(session_name, workdir) — new: tmux session creation
- inject_formula(session_name, formula_text, context) — new: prompt injection
- monitor_phase_loop(phase_file, idle_timeout, callback_fn) — new: phase loop
  with session health check, crash recovery, and idle timeout detection

dev-agent.sh: sources the library, implements _on_phase_change() callback,
calls monitor_phase_loop(); idle-timeout and crash-recovery-failed cleanup
handled via _MONITOR_LOOP_EXIT signal variable. Behavior unchanged.

											
										
										
											2026-03-18 14:36:36 +00:00
+								  local elapsed=0
 								  while [ "$elapsed" -lt "$timeout" ]; do
-												fix: feat: gardener-agent.sh — tmux + Claude interactive gardener using agent-session.sh (#159) (#163)

Fixes #159

## Changes
Add gardener-agent.sh (tmux+Claude) and lib/agent-session.sh (shared helpers). gardener-poll.sh slimmed to cron wrapper; grooming delegated to new agent; recipe engine for CI escalations unchanged.

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/163
Reviewed-by: review_bot <review_bot@noreply.codeberg.org>

											
										
										
											2026-03-18 16:21:07 +01:00
+								    if tmux capture-pane -t "$session" -p 2>/dev/null | grep -q '❯'; then
-												refactor: extract lib/agent-session.sh — reusable tmux + Claude agent runtime (#158)

Move generic agent infrastructure from dev/dev-agent.sh into lib/agent-session.sh:
- log, status, notify, notify_ctx, read_phase, wait_for_claude_ready,
  inject_into_session, kill_tmux_session extracted verbatim
- create_agent_session(session_name, workdir) — new: tmux session creation
- inject_formula(session_name, formula_text, context) — new: prompt injection
- monitor_phase_loop(phase_file, idle_timeout, callback_fn) — new: phase loop
  with session health check, crash recovery, and idle timeout detection

dev-agent.sh: sources the library, implements _on_phase_change() callback,
calls monitor_phase_loop(); idle-timeout and crash-recovery-failed cleanup
handled via _MONITOR_LOOP_EXIT signal variable. Behavior unchanged.

											
										
										
											2026-03-18 14:36:36 +00:00
+								      return 0
 								    fi
 								    sleep 2
 								    elapsed=$((elapsed + 2))
 								  done
 								  return 1
 								}
-												fix: feat: gardener-agent.sh — tmux + Claude interactive gardener using agent-session.sh (#159) (#163)

Fixes #159

## Changes
Add gardener-agent.sh (tmux+Claude) and lib/agent-session.sh (shared helpers). gardener-poll.sh slimmed to cron wrapper; grooming delegated to new agent; recipe engine for CI escalations unchanged.

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/163
Reviewed-by: review_bot <review_bot@noreply.codeberg.org>

											
										
										
											2026-03-18 16:21:07 +01:00
+								# Paste TEXT into SESSION (waits for Claude to be ready first), then press Enter.
 								agent_inject_into_session() {
 								  # Paste TEXT into the tmux session SESSION and submit it with Enter.
 								  #
 								  # Args:
 								  #   $1  session - tmux target session name
 								  #   $2  text    - prompt text to paste (passed through verbatim)
 								  # Returns:
 								  #   0 if the text was pasted and Enter was sent,
 								  #   1 if the temp file could not be created or any tmux step failed.
 								  # Side effects:
 								  #   - tries to re-acquire the session lock (best effort)
 								  #   - waits up to 120s for the Claude prompt (best effort)
 								  #   - removes the idle marker /tmp/claude-idle-<session>.ts
 								  local session="$1"
 								  local text="$2"
 								  local tmpfile buffer
 								  local rc=0

 								  # Re-acquire session lock before injecting — Claude will resume working.
 								  # Best effort: a lock timeout must not prevent the injection.
 								  # shellcheck disable=SC2119  # using default timeout
 								  session_lock_acquire || true
 								  agent_wait_for_claude_ready "$session" 120 || true

 								  # Clear idle marker — new work incoming
 								  rm -f "/tmp/claude-idle-${session}.ts"

 								  # Go through a temp file + tmux buffer so arbitrary text (quotes, newlines,
 								  # leading dashes) reaches the pane unmodified.
 								  tmpfile=$(mktemp /tmp/agent-inject-XXXXXX) || return 1

 								  # Name the buffer after the unique temp file. "$$" is identical for every
 								  # injection issued by the same script (and its subshells), so it cannot
 								  # keep concurrent injections apart.
 								  buffer="${tmpfile##*/}"

 								  if printf '%s' "$text" > "$tmpfile" \
 								    && tmux load-buffer -b "$buffer" "$tmpfile" \
 								    && tmux paste-buffer -t "$session" -b "$buffer"; then
 								    # Give the TUI a moment to take in the paste before submitting it.
 								    sleep 0.5
 								    tmux send-keys -t "$session" "" Enter || rc=1
 								  else
 								    # Nothing (or only part) was pasted: do not press Enter on it.
 								    rc=1
 								  fi

 								  # Always clean up, whether or not the injection succeeded.
 								  tmux delete-buffer -b "$buffer" 2>/dev/null || true
 								  rm -f "$tmpfile"
 								  return "$rc"
 								}
-												fix: add create_agent_session and inject_formula to agent-session.sh

Both dev-agent.sh and gardener-agent.sh call these functions but they
were never implemented during the #158 extraction. Adds:
- create_agent_session(session, workdir) — tmux + claude + wait for ready
- inject_formula(session, text) — alias for agent_inject_into_session

											
										
										
											2026-03-18 16:21:05 +00:00
+								# Create a tmux session running Claude in the given workdir.
-												fix: replace fragile pane grep with Stop hook for idle detection (#272)

## Summary

- Claude Code v2.1.79 permanently shows `❯` in the input area even while actively thinking, causing `monitor_phase_loop` to false-positive on idle detection and kill working sessions after 90 seconds
- Replace `tmux capture-pane | grep ❯` with a Claude Code Stop hook (`lib/hooks/on-idle-stop.sh`) that writes a marker file only when Claude actually finishes responding
- Hook is installed per-worktree in `.claude/settings.json` by `create_agent_session`; marker cleaned up on inject/kill

## Test plan

- [x] Verified hook installs correctly in fresh worktree
- [x] Verified marker file appears only after Claude finishes responding (not during active thinking)
- [x] Verified live dev-agent session picks up fix and Claude works without being killed
- [x] Verified `agent_inject_into_session` clears marker before new work

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/272

											
										
										
											2026-03-19 14:57:54 +01:00
+								# Installs a Stop hook for idle detection (see monitor_phase_loop).
-												fix: feat: PreToolUse hook guards destructive operations in dev-agent sessions (#277)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-20 00:10:27 +00:00
+								# Installs a PreToolUse hook to guard destructive Bash operations.
-												fix: feat: PostToolUse hook detects phase file writes in real-time (eliminates polling latency) (#278)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-19 17:55:06 +00:00
+								# Optionally installs a PostToolUse hook for phase file write detection.
-												fix: feat: StopFailure hook writes phase file on API error / rate limit (#275)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-20 01:43:00 +00:00
+								# Optionally installs a StopFailure hook for immediate phase file update on API error.
-												fix: feat: PostToolUse hook detects phase file writes in real-time (eliminates polling latency) (#278)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-19 17:55:06 +00:00
+								# Args: session workdir [phase_file]
-												fix: add create_agent_session and inject_formula to agent-session.sh

Both dev-agent.sh and gardener-agent.sh call these functions but they
were never implemented during the #158 extraction. Adds:
- create_agent_session(session, workdir) — tmux + claude + wait for ready
- inject_formula(session, text) — alias for agent_inject_into_session

											
										
										
											2026-03-18 16:21:05 +00:00
+								# Returns 0 if session is ready, 1 otherwise.
 								create_agent_session() {
 								  local session="$1"
 								  local workdir="${2:-.}"
-												fix: feat: PostToolUse hook detects phase file writes in real-time (eliminates polling latency) (#278)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-19 17:55:06 +00:00
+								  local phase_file="${3:-}"
 								  # Prepare settings directory for hooks
 								  mkdir -p "${workdir}/.claude"
 								  local settings="${workdir}/.claude/settings.json"
-												fix: replace fragile pane grep with Stop hook for idle detection (#272)

## Summary

- Claude Code v2.1.79 permanently shows `❯` in the input area even while actively thinking, causing `monitor_phase_loop` to false-positive on idle detection and kill working sessions after 90 seconds
- Replace `tmux capture-pane | grep ❯` with a Claude Code Stop hook (`lib/hooks/on-idle-stop.sh`) that writes a marker file only when Claude actually finishes responding
- Hook is installed per-worktree in `.claude/settings.json` by `create_agent_session`; marker cleaned up on inject/kill

## Test plan

- [x] Verified hook installs correctly in fresh worktree
- [x] Verified marker file appears only after Claude finishes responding (not during active thinking)
- [x] Verified live dev-agent session picks up fix and Claude works without being killed
- [x] Verified `agent_inject_into_session` clears marker before new work

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/272

											
										
										
											2026-03-19 14:57:54 +01:00
 								  # Install Stop hook for idle detection: when Claude finishes a response,
 								  # the hook writes a timestamp to a marker file. monitor_phase_loop checks
 								  # this marker instead of fragile tmux pane scraping.
 								  local idle_marker="/tmp/claude-idle-${session}.ts"
 								  local hook_script="${FACTORY_ROOT}/lib/hooks/on-idle-stop.sh"
 								  if [ -x "$hook_script" ]; then
 								    local hook_cmd="${hook_script} ${idle_marker}"
-												fix: stop hook should nudge Claude when PHASE file is empty — prevents silent exit without PHASE:done (#585)

When Claude finishes a response but hasn't written to the PHASE file,
the stop hook now injects a nudge into the tmux session instead of just
marking idle. This gives Claude another chance to complete the phase
protocol before the monitor loop times out.

Key changes:
- on-idle-stop.sh: check phase file emptiness, nudge via tmux (max 2)
- agent-session.sh: pass phase_file + session to stop hook, clean up
  nudge counter on session teardown

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-23 09:56:49 +00:00
+								    # When a phase file is available, pass it and the session name so the
 								    # hook can nudge Claude if it returns to the prompt without signalling.
 								    if [ -n "$phase_file" ]; then
 								      hook_cmd="${hook_script} ${idle_marker} ${phase_file} ${session}"
 								    fi
-												fix: replace fragile pane grep with Stop hook for idle detection (#272)

## Summary

- Claude Code v2.1.79 permanently shows `❯` in the input area even while actively thinking, causing `monitor_phase_loop` to false-positive on idle detection and kill working sessions after 90 seconds
- Replace `tmux capture-pane | grep ❯` with a Claude Code Stop hook (`lib/hooks/on-idle-stop.sh`) that writes a marker file only when Claude actually finishes responding
- Hook is installed per-worktree in `.claude/settings.json` by `create_agent_session`; marker cleaned up on inject/kill

## Test plan

- [x] Verified hook installs correctly in fresh worktree
- [x] Verified marker file appears only after Claude finishes responding (not during active thinking)
- [x] Verified live dev-agent session picks up fix and Claude works without being killed
- [x] Verified `agent_inject_into_session` clears marker before new work

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/272

											
										
										
											2026-03-19 14:57:54 +01:00
+								    if [ -f "$settings" ]; then
 								      # Append our Stop hook to existing project settings
 								      jq --arg cmd "$hook_cmd" '
-												fix: Deduplicate hook entries in settings.json on repeated create_agent_session calls (#299)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-19 21:19:58 +00:00
+								        if (.hooks.Stop // [] | any(.[]; .hooks[]?.command == $cmd))
 								        then .
 								        else .hooks.Stop = (.hooks.Stop // []) + [{
-												fix: replace fragile pane grep with Stop hook for idle detection (#272)

## Summary

- Claude Code v2.1.79 permanently shows `❯` in the input area even while actively thinking, causing `monitor_phase_loop` to false-positive on idle detection and kill working sessions after 90 seconds
- Replace `tmux capture-pane | grep ❯` with a Claude Code Stop hook (`lib/hooks/on-idle-stop.sh`) that writes a marker file only when Claude actually finishes responding
- Hook is installed per-worktree in `.claude/settings.json` by `create_agent_session`; marker cleaned up on inject/kill

## Test plan

- [x] Verified hook installs correctly in fresh worktree
- [x] Verified marker file appears only after Claude finishes responding (not during active thinking)
- [x] Verified live dev-agent session picks up fix and Claude works without being killed
- [x] Verified `agent_inject_into_session` clears marker before new work

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/272

											
										
										
											2026-03-19 14:57:54 +01:00
+								          matcher: "",
 								          hooks: [{type: "command", command: $cmd}]
 								        }]
-												fix: Deduplicate hook entries in settings.json on repeated create_agent_session calls (#299)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-19 21:19:58 +00:00
+								        end
-												fix: replace fragile pane grep with Stop hook for idle detection (#272)

## Summary

- Claude Code v2.1.79 permanently shows `❯` in the input area even while actively thinking, causing `monitor_phase_loop` to false-positive on idle detection and kill working sessions after 90 seconds
- Replace `tmux capture-pane | grep ❯` with a Claude Code Stop hook (`lib/hooks/on-idle-stop.sh`) that writes a marker file only when Claude actually finishes responding
- Hook is installed per-worktree in `.claude/settings.json` by `create_agent_session`; marker cleaned up on inject/kill

## Test plan

- [x] Verified hook installs correctly in fresh worktree
- [x] Verified marker file appears only after Claude finishes responding (not during active thinking)
- [x] Verified live dev-agent session picks up fix and Claude works without being killed
- [x] Verified `agent_inject_into_session` clears marker before new work

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/272

											
										
										
											2026-03-19 14:57:54 +01:00
+								      ' "$settings" > "${settings}.tmp" && mv "${settings}.tmp" "$settings"
 								    else
 								      jq -n --arg cmd "$hook_cmd" '{
 								        hooks: {
 								          Stop: [{
 								            matcher: "",
 								            hooks: [{type: "command", command: $cmd}]
 								          }]
 								        }
 								      }' > "$settings"
 								    fi
 								  fi
-												fix: feat: PostToolUse hook detects phase file writes in real-time (eliminates polling latency) (#278)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-19 17:55:06 +00:00
+								  # Install PostToolUse hook for phase file write detection: when Claude
 								  # writes to the phase file via Bash or Write, the hook writes a marker
 								  # so monitor_phase_loop can react immediately instead of waiting for
 								  # the next mtime-based poll cycle.
 								  if [ -n "$phase_file" ]; then
 								    local phase_marker="/tmp/phase-changed-${session}.marker"
 								    local phase_hook_script="${FACTORY_ROOT}/lib/hooks/on-phase-change.sh"
 								    if [ -x "$phase_hook_script" ]; then
 								      local phase_hook_cmd="${phase_hook_script} ${phase_file} ${phase_marker}"
 								      if [ -f "$settings" ]; then
 								        jq --arg cmd "$phase_hook_cmd" '
-												fix: Deduplicate hook entries in settings.json on repeated create_agent_session calls (#299)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-19 21:19:58 +00:00
+								          if (.hooks.PostToolUse // [] | any(.[]; .hooks[]?.command == $cmd))
 								          then .
 								          else .hooks.PostToolUse = (.hooks.PostToolUse // []) + [{
-												fix: feat: PostToolUse hook detects phase file writes in real-time (eliminates polling latency) (#278)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-19 17:55:06 +00:00
+								            matcher: "Bash|Write",
 								            hooks: [{type: "command", command: $cmd}]
 								          }]
-												fix: Deduplicate hook entries in settings.json on repeated create_agent_session calls (#299)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-19 21:19:58 +00:00
+								          end
-												fix: feat: PostToolUse hook detects phase file writes in real-time (eliminates polling latency) (#278)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-19 17:55:06 +00:00
+								        ' "$settings" > "${settings}.tmp" && mv "${settings}.tmp" "$settings"
 								      else
 								        jq -n --arg cmd "$phase_hook_cmd" '{
 								          hooks: {
 								            PostToolUse: [{
 								              matcher: "Bash|Write",
 								              hooks: [{type: "command", command: $cmd}]
 								            }]
 								          }
 								        }' > "$settings"
 								      fi
-												fix: distinguish phase file writes from reads in PostToolUse hook

- Parse tool_name via jq: Write tool checks file_path match,
  Bash tool checks for redirect operator (>) with phase file path
- Reads (cat, head) no longer trigger false-positive markers
- Split guard into separate statements for clarity
- Move marker cleanup inside hook-install guard
- Expand tests: 5 cases covering Bash write, Write tool, Bash read,
  unrelated Bash, and Write to different file

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-19 18:14:49 +00:00
+								      rm -f "$phase_marker"
-												fix: feat: PostToolUse hook detects phase file writes in real-time (eliminates polling latency) (#278)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-19 17:55:06 +00:00
+								    fi
 								  fi
-												fix: feat: StopFailure hook writes phase file on API error / rate limit (#275)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-20 01:43:00 +00:00
+								  # Install StopFailure hook for immediate phase file update on API error:
 								  # when Claude hits a rate limit, server error, billing error, or auth failure,
 								  # the hook writes PHASE:failed to the phase file and touches the phase-changed
 								  # marker so monitor_phase_loop picks it up within one poll cycle instead of
 								  # waiting for idle timeout (up to 2 hours).
 								  if [ -n "$phase_file" ]; then
 								    local stop_failure_hook_script="${FACTORY_ROOT}/lib/hooks/on-stop-failure.sh"
 								    if [ -x "$stop_failure_hook_script" ]; then
-												fix: address review — terminal phase guard, explicit marker var, test coverage

- Guard against overwriting terminal phases (PHASE:done, PHASE:merged)
  in on-stop-failure.sh to prevent false failures from same-turn race
- Declare sf_phase_marker explicitly in StopFailure block instead of
  relying on phase_marker from PostToolUse block
- Add authentication_failed test (10c) and terminal phase guard tests
  (10g, 10h)
- Fix fragile nested command substitution in test 10f fail() message

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-20 01:52:46 +00:00
+								      # phase_marker is defined in the PostToolUse block above; redeclare so
 								      # this block is self-contained if that block is ever removed.
 								      local sf_phase_marker="/tmp/phase-changed-${session}.marker"
 								      local stop_failure_hook_cmd="${stop_failure_hook_script} ${phase_file} ${sf_phase_marker}"
-												fix: feat: StopFailure hook writes phase file on API error / rate limit (#275)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-20 01:43:00 +00:00
+								      if [ -f "$settings" ]; then
 								        jq --arg cmd "$stop_failure_hook_cmd" '
 								          if (.hooks.StopFailure // [] | any(.[]; .hooks[]?.command == $cmd))
 								          then .
 								          else .hooks.StopFailure = (.hooks.StopFailure // []) + [{
 								            matcher: "rate_limit|server_error|authentication_failed|billing_error",
 								            hooks: [{type: "command", command: $cmd}]
 								          }]
 								          end
 								        ' "$settings" > "${settings}.tmp" && mv "${settings}.tmp" "$settings"
 								      else
 								        jq -n --arg cmd "$stop_failure_hook_cmd" '{
 								          hooks: {
 								            StopFailure: [{
 								              matcher: "rate_limit|server_error|authentication_failed|billing_error",
 								              hooks: [{type: "command", command: $cmd}]
 								            }]
 								          }
 								        }' > "$settings"
 								      fi
 								    fi
 								  fi
-												fix: feat: PreToolUse hook guards destructive operations in dev-agent sessions (#277)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-20 00:10:27 +00:00
+								  # Install PreToolUse hook for destructive operation guard: blocks force push
 								  # to primary branch, rm -rf outside worktree, direct API merge calls, and
 								  # checkout/switch to primary branch.  Claude sees the denial reason on exit 2
 								  # and can self-correct.
 								  local guard_hook_script="${FACTORY_ROOT}/lib/hooks/on-pretooluse-guard.sh"
 								  if [ -x "$guard_hook_script" ]; then
 								    local abs_workdir
 								    abs_workdir=$(cd "$workdir" 2>/dev/null && pwd) || abs_workdir="$workdir"
-												fix: PreToolUse guard — allow formula agents to access FACTORY_ROOT from worktrees (#487)

- Add session name as third arg to guard hook (passed from agent-session.sh)
- Detect formula sessions (supervisor-*, gardener-*, planner-*, predictor-*)
- Guard 6: block filesystem access to factory root from worktrees, exempt formulas
- Guard 7: restrict system commands (kill, docker, tmux) to supervisor only
- Guard 2: allow formula agents rm -rf within factory root

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-21 18:09:28 +00:00
+								    local guard_hook_cmd="${guard_hook_script} ${PRIMARY_BRANCH:-main} ${abs_workdir} ${session}"
-												fix: feat: PreToolUse hook guards destructive operations in dev-agent sessions (#277)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-20 00:10:27 +00:00
+								    if [ -f "$settings" ]; then
 								      jq --arg cmd "$guard_hook_cmd" '
 								        if (.hooks.PreToolUse // [] | any(.[]; .hooks[]?.command == $cmd))
 								        then .
 								        else .hooks.PreToolUse = (.hooks.PreToolUse // []) + [{
 								          matcher: "Bash",
 								          hooks: [{type: "command", command: $cmd}]
 								        }]
 								        end
 								      ' "$settings" > "${settings}.tmp" && mv "${settings}.tmp" "$settings"
 								    else
 								      jq -n --arg cmd "$guard_hook_cmd" '{
 								        hooks: {
 								          PreToolUse: [{
 								            matcher: "Bash",
 								            hooks: [{type: "command", command: $cmd}]
 								          }]
 								        }
 								      }' > "$settings"
 								    fi
 								  fi
-												fix: feat: SessionEnd hook for guaranteed cleanup on session exit (#276)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-20 01:11:26 +00:00
+								  # Install SessionEnd hook for guaranteed cleanup: when the Claude session
 								  # exits (clean or crash), write a termination marker so monitor_phase_loop
 								  # detects the exit faster than tmux has-session polling alone.
 								  local exit_marker="/tmp/claude-exited-${session}.ts"
 								  local session_end_hook_script="${FACTORY_ROOT}/lib/hooks/on-session-end.sh"
 								  if [ -x "$session_end_hook_script" ]; then
 								    local session_end_hook_cmd="${session_end_hook_script} ${exit_marker}"
 								    if [ -f "$settings" ]; then
 								      jq --arg cmd "$session_end_hook_cmd" '
 								        if (.hooks.SessionEnd // [] | any(.[]; .hooks[]?.command == $cmd))
 								        then .
 								        else .hooks.SessionEnd = (.hooks.SessionEnd // []) + [{
 								          matcher: "",
 								          hooks: [{type: "command", command: $cmd}]
 								        }]
 								        end
 								      ' "$settings" > "${settings}.tmp" && mv "${settings}.tmp" "$settings"
 								    else
 								      jq -n --arg cmd "$session_end_hook_cmd" '{
 								        hooks: {
 								          SessionEnd: [{
 								            matcher: "",
 								            hooks: [{type: "command", command: $cmd}]
 								          }]
 								        }
 								      }' > "$settings"
 								    fi
 								  fi
 								  rm -f "$exit_marker"
-												fix: feat: SessionStart compact hook re-injects phase protocol after context compaction (#274)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-20 23:27:32 +00:00
+								  # Install SessionStart hook for context re-injection after compaction:
 								  # when Claude Code compacts context during long sessions, the phase protocol
 								  # instructions are lost. This hook fires after each compaction and outputs
 								  # the content of a context file so Claude retains critical instructions.
 								  # The context file is written by callers via write_compact_context().
 								  if [ -n "$phase_file" ]; then
 								    local compact_hook_script="${FACTORY_ROOT}/lib/hooks/on-compact-reinject.sh"
 								    if [ -x "$compact_hook_script" ]; then
 								      local context_file="${phase_file%.phase}.context"
 								      local compact_hook_cmd="${compact_hook_script} ${context_file}"
 								      if [ -f "$settings" ]; then
 								        jq --arg cmd "$compact_hook_cmd" '
 								          if (.hooks.SessionStart // [] | any(.[]; .hooks[]?.command == $cmd))
 								          then .
 								          else .hooks.SessionStart = (.hooks.SessionStart // []) + [{
 								            matcher: "compact",
 								            hooks: [{type: "command", command: $cmd}]
 								          }]
 								          end
 								        ' "$settings" > "${settings}.tmp" && mv "${settings}.tmp" "$settings"
 								      else
 								        jq -n --arg cmd "$compact_hook_cmd" '{
 								          hooks: {
 								            SessionStart: [{
 								              matcher: "compact",
 								              hooks: [{type: "command", command: $cmd}]
 								            }]
 								          }
 								        }' > "$settings"
 								      fi
 								    fi
 								  fi
-												fix: replace fragile pane grep with Stop hook for idle detection (#272)

## Summary

- Claude Code v2.1.79 permanently shows `❯` in the input area even while actively thinking, causing `monitor_phase_loop` to false-positive on idle detection and kill working sessions after 90 seconds
- Replace `tmux capture-pane | grep ❯` with a Claude Code Stop hook (`lib/hooks/on-idle-stop.sh`) that writes a marker file only when Claude actually finishes responding
- Hook is installed per-worktree in `.claude/settings.json` by `create_agent_session`; marker cleaned up on inject/kill

## Test plan

- [x] Verified hook installs correctly in fresh worktree
- [x] Verified marker file appears only after Claude finishes responding (not during active thinking)
- [x] Verified live dev-agent session picks up fix and Claude works without being killed
- [x] Verified `agent_inject_into_session` clears marker before new work

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/272

											
										
										
											2026-03-19 14:57:54 +01:00
+								  rm -f "$idle_marker"
-												fix: add model=opus to run-planner formula and wire through action-agent

TOML declares model = "opus". planner-poll.sh includes model: opus in
the issue YAML front matter. action-agent.sh extracts it and exports
CLAUDE_MODEL. create_agent_session passes --model to claude if set.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-20 09:08:17 +00:00
+								  local model_flag=""
 								  if [ -n "${CLAUDE_MODEL:-}" ]; then
 								    model_flag="--model ${CLAUDE_MODEL}"
 								  fi
-												fix: shared Claude OAuth credentials in containers — mount + flock to prevent token rotation race (#693)

- Make ~/.claude volume mount read-write (was :ro) so containers can
  write back refreshed OAuth tokens
- Wrap Claude CLI in flock(1) inside tmux sessions using
  ~/.claude/session.lock — prevents concurrent token refresh races
  across agents sharing the same credentials
- Add ANTHROPIC_API_KEY detection in entrypoint.sh: when set, skips
  OAuth entirely (no rotation issues, metered billing)
- Log active auth method (API key vs OAuth vs missing) at container
  startup for easier 401 debugging
- Document 'claude auth login' requirement in disinto init output

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-25 17:48:21 +00:00
-												fix: Session lock must not block during idle phases (awaiting_review/awaiting_ci) (#724)

Restructure session.lock from command-wrapper flock to fd-based flock so
the lock can be released when Claude is idle and re-acquired before
injecting the next prompt.

- agent-session.sh: add session_lock_acquire/release helpers, open fd in
  create_agent_session instead of wrapping claude with flock, auto-acquire
  in agent_inject_into_session before injecting
- phase-handler.sh: call session_lock_release at start of awaiting_ci and
  awaiting_review handlers (Claude is idle during CI polling / review wait)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-26 10:11:50 +00:00
+								  # Acquire a session-level mutex via fd-based flock to prevent concurrent
 								  # Claude sessions from racing on OAuth token refresh.  Unlike the previous
 								  # command-wrapper flock, the fd approach allows callers to release the lock
 								  # during idle phases (awaiting_review/awaiting_ci) and re-acquire before
 								  # injecting the next prompt.  See #724.
-												fix: shared Claude OAuth credentials in containers — mount + flock to prevent token rotation race (#693)

- Make ~/.claude volume mount read-write (was :ro) so containers can
  write back refreshed OAuth tokens
- Wrap Claude CLI in flock(1) inside tmux sessions using
  ~/.claude/session.lock — prevents concurrent token refresh races
  across agents sharing the same credentials
- Add ANTHROPIC_API_KEY detection in entrypoint.sh: when set, skips
  OAuth entirely (no rotation issues, metered billing)
- Log active auth method (API key vs OAuth vs missing) at container
  startup for easier 401 debugging
- Document 'claude auth login' requirement in disinto init output

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-25 17:48:21 +00:00
+								  # Use ~/.claude/session.lock so the lock is shared across containers when
 								  # the host ~/.claude directory is bind-mounted.
 								  local lock_dir="${HOME}/.claude"
 								  mkdir -p "$lock_dir"
 								  local claude_lock="${lock_dir}/session.lock"
-												fix: Session lock must not block during idle phases (awaiting_review/awaiting_ci) (#724)

Restructure session.lock from command-wrapper flock to fd-based flock so
the lock can be released when Claude is idle and re-acquired before
injecting the next prompt.

- agent-session.sh: add session_lock_acquire/release helpers, open fd in
  create_agent_session instead of wrapping claude with flock, auto-acquire
  in agent_inject_into_session before injecting
- phase-handler.sh: call session_lock_release at start of awaiting_ci and
  awaiting_review handlers (Claude is idle during CI polling / review wait)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-26 10:11:50 +00:00
+								  if [ -z "${SESSION_LOCK_FD:-}" ]; then
 								    exec {SESSION_LOCK_FD}>>"${claude_lock}"
 								  fi
 								  if ! flock -w 300 "$SESSION_LOCK_FD"; then
 								    return 1
 								  fi
 								  local claude_cmd="claude --dangerously-skip-permissions ${model_flag}"
-												fix: shared Claude OAuth credentials in containers — mount + flock to prevent token rotation race (#693)

- Make ~/.claude volume mount read-write (was :ro) so containers can
  write back refreshed OAuth tokens
- Wrap Claude CLI in flock(1) inside tmux sessions using
  ~/.claude/session.lock — prevents concurrent token refresh races
  across agents sharing the same credentials
- Add ANTHROPIC_API_KEY detection in entrypoint.sh: when set, skips
  OAuth entirely (no rotation issues, metered billing)
- Log active auth method (API key vs OAuth vs missing) at container
  startup for easier 401 debugging
- Document 'claude auth login' requirement in disinto init output

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-25 17:48:21 +00:00
-												fix: add create_agent_session and inject_formula to agent-session.sh

Both dev-agent.sh and gardener-agent.sh call these functions but they
were never implemented during the #158 extraction. Adds:
- create_agent_session(session, workdir) — tmux + claude + wait for ready
- inject_formula(session, text) — alias for agent_inject_into_session

											
										
										
											2026-03-18 16:21:05 +00:00
+								  tmux new-session -d -s "$session" -c "$workdir" \
-												fix: shared Claude OAuth credentials in containers — mount + flock to prevent token rotation race (#693)

- Make ~/.claude volume mount read-write (was :ro) so containers can
  write back refreshed OAuth tokens
- Wrap Claude CLI in flock(1) inside tmux sessions using
  ~/.claude/session.lock — prevents concurrent token refresh races
  across agents sharing the same credentials
- Add ANTHROPIC_API_KEY detection in entrypoint.sh: when set, skips
  OAuth entirely (no rotation issues, metered billing)
- Log active auth method (API key vs OAuth vs missing) at container
  startup for easier 401 debugging
- Document 'claude auth login' requirement in disinto init output

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-25 17:48:21 +00:00
+								    "$claude_cmd" 2>/dev/null
-												fix: add create_agent_session and inject_formula to agent-session.sh

Both dev-agent.sh and gardener-agent.sh call these functions but they
were never implemented during the #158 extraction. Adds:
- create_agent_session(session, workdir) — tmux + claude + wait for ready
- inject_formula(session, text) — alias for agent_inject_into_session

											
										
										
											2026-03-18 16:21:05 +00:00
+								  sleep 1
 								  tmux has-session -t "$session" 2>/dev/null || return 1
 								  agent_wait_for_claude_ready "$session" 120 || return 1
 								  return 0
 								}
 								# inject_formula SESSION_NAME TEXT
 								#   Convenience name for agent_inject_into_session: every argument is passed
 								#   through untouched, and the exit status is whatever that call returns.
 								inject_formula() { agent_inject_into_session "$@"; }
-												fix: implement monitor_phase_loop in agent-session.sh

Generic phase monitoring loop with callback for agent-specific handling.
Handles: idle timeout, session crash detection, terminal phases (done,
failed, needs_human, merged). Sets _MONITOR_LOOP_EXIT for the caller.

											
										
										
											2026-03-18 16:40:51 +00:00
+								# Monitor a phase file, calling a callback on changes and handling idle timeout.
-												fix: monitor_phase_loop docstring lists 'break' as a possible _MONITOR_LOOP_EXIT value but it is never set (#435)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-23 09:39:48 +00:00
+								# Sets _MONITOR_LOOP_EXIT to the exit reason (idle_timeout, idle_prompt, done, crashed, PHASE:failed, PHASE:escalate).
-												fix: Callbacks can't see the resolved _session from monitor_phase_loop (#200)

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-19 01:05:21 +00:00
+								# Sets _MONITOR_SESSION to the resolved session name (arg 4 or $SESSION_NAME).
 								#   Callbacks should reference _MONITOR_SESSION instead of $SESSION_NAME directly.
-												fix: agent-session.sh: monitor_phase_loop should accept SESSION_NAME as a parameter (#187)

Add optional 4th parameter to monitor_phase_loop for SESSION_NAME,
falling back to the $SESSION_NAME global for backwards-compatibility.
Document the full function signature in both the file header and inline comment.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-18 20:15:14 +00:00
+								# Args: phase_file idle_timeout_secs callback_fn [session_name]
 								#   session_name — tmux session to health-check; falls back to $SESSION_NAME global
-												fix: bug: gardener hangs forever when Claude finishes without writing phase file (#261) (#263)

Fixes #261

## Changes
Fixed gardener hanging forever when Claude skips phase protocol. Three changes: (1) gardener-agent.sh: replaced 999999s timeout with 7200s (2h, matching dev-agent); (2) lib/agent-session.sh: added idle-prompt detection to monitor_phase_loop — if Claude returns to the ❯ prompt for 3 consecutive polls with no phase file written, exits immediately with _MONITOR_LOOP_EXIT=idle_prompt (only fires when phase file is empty, so awaiting_ci/review waits are unaffected); (3) gardener prompt: removed 'no time limit' wording, replaced with explicit phase-write requirement.

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/263
Reviewed-by: Disinto_bot <disinto_bot@noreply.codeberg.org>

											
										
										
											2026-03-19 13:47:10 +01:00
+								#
-												fix: replace fragile pane grep with Stop hook for idle detection (#272)

## Summary

- Claude Code v2.1.79 permanently shows `❯` in the input area even while actively thinking, causing `monitor_phase_loop` to false-positive on idle detection and kill working sessions after 90 seconds
- Replace `tmux capture-pane | grep ❯` with a Claude Code Stop hook (`lib/hooks/on-idle-stop.sh`) that writes a marker file only when Claude actually finishes responding
- Hook is installed per-worktree in `.claude/settings.json` by `create_agent_session`; marker cleaned up on inject/kill

## Test plan

- [x] Verified hook installs correctly in fresh worktree
- [x] Verified marker file appears only after Claude finishes responding (not during active thinking)
- [x] Verified live dev-agent session picks up fix and Claude works without being killed
- [x] Verified `agent_inject_into_session` clears marker before new work

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/272

											
										
										
											2026-03-19 14:57:54 +01:00
+								# Idle detection: uses a Stop hook marker file (written by lib/hooks/on-idle-stop.sh)
 								# to detect when Claude finishes responding without writing a phase signal.
 								# If the marker exists for 3 consecutive polls with no phase written, the session
 								# is killed, _MONITOR_LOOP_EXIT is set to "idle_prompt", and the callback is
 								# invoked with "PHASE:failed".
-												fix: implement monitor_phase_loop in agent-session.sh

Generic phase monitoring loop with callback for agent-specific handling.
Handles: idle timeout, session crash detection, terminal phases (done,
failed, needs_human, merged). Sets _MONITOR_LOOP_EXIT for the caller.

											
										
										
											2026-03-18 16:40:51 +00:00
+								monitor_phase_loop() {
 								  local phase_file="$1"
 								  local idle_timeout="$2"
 								  local callback="$3"
-												fix: agent-session.sh: monitor_phase_loop should accept SESSION_NAME as a parameter (#187)

Add optional 4th parameter to monitor_phase_loop for SESSION_NAME,
falling back to the $SESSION_NAME global for backwards-compatibility.
Document the full function signature in both the file header and inline comment.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-18 20:15:14 +00:00
+								  local _session="${4:-${SESSION_NAME:-}}"
-												fix: Callbacks can't see the resolved _session from monitor_phase_loop (#200)

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-19 01:05:21 +00:00
+								  # Export resolved session name so callbacks can reference it regardless of
 								  # which session was passed to monitor_phase_loop (analogous to _MONITOR_LOOP_EXIT).
 								  export _MONITOR_SESSION="$_session"
-												fix: implement monitor_phase_loop in agent-session.sh

Generic phase monitoring loop with callback for agent-specific handling.
Handles: idle timeout, session crash detection, terminal phases (done,
failed, needs_human, merged). Sets _MONITOR_LOOP_EXIT for the caller.

											
										
										
											2026-03-18 16:40:51 +00:00
+								  local poll_interval="${PHASE_POLL_INTERVAL:-10}"
 								  local last_mtime=0
 								  local idle_elapsed=0
-												fix: bug: gardener hangs forever when Claude finishes without writing phase file (#261) (#263)

Fixes #261

## Changes
Fixed gardener hanging forever when Claude skips phase protocol. Three changes: (1) gardener-agent.sh: replaced 999999s timeout with 7200s (2h, matching dev-agent); (2) lib/agent-session.sh: added idle-prompt detection to monitor_phase_loop — if Claude returns to the ❯ prompt for 3 consecutive polls with no phase file written, exits immediately with _MONITOR_LOOP_EXIT=idle_prompt (only fires when phase file is empty, so awaiting_ci/review waits are unaffected); (3) gardener prompt: removed 'no time limit' wording, replaced with explicit phase-write requirement.

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/263
Reviewed-by: Disinto_bot <disinto_bot@noreply.codeberg.org>

											
										
										
											2026-03-19 13:47:10 +01:00
+								  local idle_pane_count=0
-												fix: implement monitor_phase_loop in agent-session.sh

Generic phase monitoring loop with callback for agent-specific handling.
Handles: idle timeout, session crash detection, terminal phases (done,
failed, needs_human, merged). Sets _MONITOR_LOOP_EXIT for the caller.

											
										
										
											2026-03-18 16:40:51 +00:00
 								  while true; do
 								    sleep "$poll_interval"
 								    idle_elapsed=$(( idle_elapsed + poll_interval ))
-												fix: feat: SessionEnd hook for guaranteed cleanup on session exit (#276)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-20 01:11:26 +00:00
+								    # Session health check: SessionEnd hook marker provides fast detection,
 								    # tmux has-session is the fallback for unclean exits (e.g. tmux crash).
 								    local exit_marker="/tmp/claude-exited-${_session}.ts"
 								    if [ -f "$exit_marker" ] || ! tmux has-session -t "${_session}" 2>/dev/null; then
-												fix: implement monitor_phase_loop in agent-session.sh

Generic phase monitoring loop with callback for agent-specific handling.
Handles: idle timeout, session crash detection, terminal phases (done,
failed, needs_human, merged). Sets _MONITOR_LOOP_EXIT for the caller.

											
										
										
											2026-03-18 16:40:51 +00:00
+								      local current_phase
 								      current_phase=$(head -1 "$phase_file" 2>/dev/null | tr -d '[:space:]' || true)
 								      case "$current_phase" in
-												fix: feat: unified escalation — single PHASE:escalate path for all agents (#510)

Replace PHASE:needs_human with PHASE:escalate across all agent types.
Consolidates 6 overlapping escalation mechanisms into one unified path:
detect → notify via Matrix → session stays alive → human reply injected → resume.

Key changes:
- PHASE:escalate replaces PHASE:needs_human everywhere (16 files)
- CI exhausted now escalates instead of immediately marking blocked
- Matrix listener routes free-text replies to vault tmux sessions
- Vault agent writes PHASE:escalate files for procurement requests
- Supervisor monitors PHASE:escalate sessions in health checks
- 24h timeout on escalation → blocked label + session killed
- All 38 phase protocol tests updated and passing

Supersedes #462, #458, #465.

											
										
										
											2026-03-21 19:39:04 +00:00
+								        PHASE:done|PHASE:failed|PHASE:merged|PHASE:escalate)
-												fix: implement monitor_phase_loop in agent-session.sh

Generic phase monitoring loop with callback for agent-specific handling.
Handles: idle timeout, session crash detection, terminal phases (done,
failed, needs_human, merged). Sets _MONITOR_LOOP_EXIT for the caller.

											
										
										
											2026-03-18 16:40:51 +00:00
+								          ;; # terminal — fall through to phase handler
 								        *)
 								          # Call callback with "crashed" — let agent-specific code handle recovery
 								          if type "${callback}" &>/dev/null; then
 								            "$callback" "PHASE:crashed"
 								          fi
 								          # If callback didn't restart session, break
-												fix: agent-session.sh: monitor_phase_loop should accept SESSION_NAME as a parameter (#187)

Add optional 4th parameter to monitor_phase_loop for SESSION_NAME,
falling back to the $SESSION_NAME global for backwards-compatibility.
Document the full function signature in both the file header and inline comment.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-18 20:15:14 +00:00
+								          if ! tmux has-session -t "${_session}" 2>/dev/null; then
-												fix: implement monitor_phase_loop in agent-session.sh

Generic phase monitoring loop with callback for agent-specific handling.
Handles: idle timeout, session crash detection, terminal phases (done,
failed, needs_human, merged). Sets _MONITOR_LOOP_EXIT for the caller.

											
										
										
											2026-03-18 16:40:51 +00:00
+								            _MONITOR_LOOP_EXIT="crashed"
 								            return 1
 								          fi
 								          idle_elapsed=0
-												fix: bug: gardener hangs forever when Claude finishes without writing phase file (#261) (#263)

Fixes #261

## Changes
Fixed gardener hanging forever when Claude skips phase protocol. Three changes: (1) gardener-agent.sh: replaced 999999s timeout with 7200s (2h, matching dev-agent); (2) lib/agent-session.sh: added idle-prompt detection to monitor_phase_loop — if Claude returns to the ❯ prompt for 3 consecutive polls with no phase file written, exits immediately with _MONITOR_LOOP_EXIT=idle_prompt (only fires when phase file is empty, so awaiting_ci/review waits are unaffected); (3) gardener prompt: removed 'no time limit' wording, replaced with explicit phase-write requirement.

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/263
Reviewed-by: Disinto_bot <disinto_bot@noreply.codeberg.org>

											
										
										
											2026-03-19 13:47:10 +01:00
+								          idle_pane_count=0
-												fix: implement monitor_phase_loop in agent-session.sh

Generic phase monitoring loop with callback for agent-specific handling.
Handles: idle timeout, session crash detection, terminal phases (done,
failed, needs_human, merged). Sets _MONITOR_LOOP_EXIT for the caller.

											
										
										
											2026-03-18 16:40:51 +00:00
+								          continue
 								          ;;
 								      esac
 								    fi
-												fix: feat: PostToolUse hook detects phase file writes in real-time (eliminates polling latency) (#278)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-19 17:55:06 +00:00
+								    # Check phase-changed marker from PostToolUse hook — if present, the hook
 								    # detected a phase file write so we reset last_mtime to force processing
 								    # this cycle instead of waiting for the next mtime change.
 								    local phase_marker="/tmp/phase-changed-${_session}.marker"
 								    if [ -f "$phase_marker" ]; then
 								      rm -f "$phase_marker"
 								      last_mtime=0
 								    fi
-												fix: implement monitor_phase_loop in agent-session.sh

Generic phase monitoring loop with callback for agent-specific handling.
Handles: idle timeout, session crash detection, terminal phases (done,
failed, needs_human, merged). Sets _MONITOR_LOOP_EXIT for the caller.

											
										
										
											2026-03-18 16:40:51 +00:00
+								    # Check phase file for changes
 								    local phase_mtime
 								    phase_mtime=$(stat -c %Y "$phase_file" 2>/dev/null || echo 0)
 								    local current_phase
 								    current_phase=$(head -1 "$phase_file" 2>/dev/null | tr -d '[:space:]' || true)
 								    if [ -z "$current_phase" ] || [ "$phase_mtime" -le "$last_mtime" ]; then
 								      # No phase change — check idle timeout
 								      if [ "$idle_elapsed" -ge "$idle_timeout" ]; then
 								        _MONITOR_LOOP_EXIT="idle_timeout"
-												fix: agent-session.sh: monitor_phase_loop should accept SESSION_NAME as a parameter (#187)

Add optional 4th parameter to monitor_phase_loop for SESSION_NAME,
falling back to the $SESSION_NAME global for backwards-compatibility.
Document the full function signature in both the file header and inline comment.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-18 20:15:14 +00:00
+								        agent_kill_session "${_session}"
-												fix: implement monitor_phase_loop in agent-session.sh

Generic phase monitoring loop with callback for agent-specific handling.
Handles: idle timeout, session crash detection, terminal phases (done,
failed, needs_human, merged). Sets _MONITOR_LOOP_EXIT for the caller.

											
										
										
											2026-03-18 16:40:51 +00:00
+								        return 0
 								      fi
-												fix: replace fragile pane grep with Stop hook for idle detection (#272)

## Summary

- Claude Code v2.1.79 permanently shows `❯` in the input area even while actively thinking, causing `monitor_phase_loop` to false-positive on idle detection and kill working sessions after 90 seconds
- Replace `tmux capture-pane | grep ❯` with a Claude Code Stop hook (`lib/hooks/on-idle-stop.sh`) that writes a marker file only when Claude actually finishes responding
- Hook is installed per-worktree in `.claude/settings.json` by `create_agent_session`; marker cleaned up on inject/kill

## Test plan

- [x] Verified hook installs correctly in fresh worktree
- [x] Verified marker file appears only after Claude finishes responding (not during active thinking)
- [x] Verified live dev-agent session picks up fix and Claude works without being killed
- [x] Verified `agent_inject_into_session` clears marker before new work

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/272

											
										
										
											2026-03-19 14:57:54 +01:00
+								      # Idle detection via Stop hook: the on-idle-stop.sh hook writes a marker
 								      # file when Claude finishes a response. If the marker exists and no phase
 								      # has been written, Claude returned to the prompt without following the
 								      # phase protocol. 3 consecutive polls = confirmed idle (not mid-turn).
 								      local idle_marker="/tmp/claude-idle-${_session}.ts"
 								      if [ -z "$current_phase" ] && [ -f "$idle_marker" ]; then
-												fix: bug: gardener hangs forever when Claude finishes without writing phase file (#261) (#263)

Fixes #261

## Changes
Fixed gardener hanging forever when Claude skips phase protocol. Three changes: (1) gardener-agent.sh: replaced 999999s timeout with 7200s (2h, matching dev-agent); (2) lib/agent-session.sh: added idle-prompt detection to monitor_phase_loop — if Claude returns to the ❯ prompt for 3 consecutive polls with no phase file written, exits immediately with _MONITOR_LOOP_EXIT=idle_prompt (only fires when phase file is empty, so awaiting_ci/review waits are unaffected); (3) gardener prompt: removed 'no time limit' wording, replaced with explicit phase-write requirement.

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/263
Reviewed-by: Disinto_bot <disinto_bot@noreply.codeberg.org>

											
										
										
											2026-03-19 13:47:10 +01:00
+								        idle_pane_count=$(( idle_pane_count + 1 ))
 								        if [ "$idle_pane_count" -ge 3 ]; then
 								          _MONITOR_LOOP_EXIT="idle_prompt"
-												fix: replace fragile pane grep with Stop hook for idle detection (#272)

## Summary

- Claude Code v2.1.79 permanently shows `❯` in the input area even while actively thinking, causing `monitor_phase_loop` to false-positive on idle detection and kill working sessions after 90 seconds
- Replace `tmux capture-pane | grep ❯` with a Claude Code Stop hook (`lib/hooks/on-idle-stop.sh`) that writes a marker file only when Claude actually finishes responding
- Hook is installed per-worktree in `.claude/settings.json` by `create_agent_session`; marker cleaned up on inject/kill

## Test plan

- [x] Verified hook installs correctly in fresh worktree
- [x] Verified marker file appears only after Claude finishes responding (not during active thinking)
- [x] Verified live dev-agent session picks up fix and Claude works without being killed
- [x] Verified `agent_inject_into_session` clears marker before new work

🤖 Generated with [Claude Code](https://claude.com/claude-code)

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/272

											
										
										
											2026-03-19 14:57:54 +01:00
+								          # Session is killed before the callback is invoked.
-												fix: bug: gardener hangs forever when Claude finishes without writing phase file (#261) (#263)

Fixes #261

## Changes
Fixed gardener hanging forever when Claude skips phase protocol. Three changes: (1) gardener-agent.sh: replaced 999999s timeout with 7200s (2h, matching dev-agent); (2) lib/agent-session.sh: added idle-prompt detection to monitor_phase_loop — if Claude returns to the ❯ prompt for 3 consecutive polls with no phase file written, exits immediately with _MONITOR_LOOP_EXIT=idle_prompt (only fires when phase file is empty, so awaiting_ci/review waits are unaffected); (3) gardener prompt: removed 'no time limit' wording, replaced with explicit phase-write requirement.

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/263
Reviewed-by: Disinto_bot <disinto_bot@noreply.codeberg.org>

											
										
										
											2026-03-19 13:47:10 +01:00
+								          # Callbacks that handle PHASE:failed must not assume the session is alive.
 								          agent_kill_session "${_session}"
 								          if type "${callback}" &>/dev/null; then
 								            "$callback" "PHASE:failed"
 								          fi
 								          return 0
 								        fi
 								      else
 								        idle_pane_count=0
 								      fi
-												fix: implement monitor_phase_loop in agent-session.sh

Generic phase monitoring loop with callback for agent-specific handling.
Handles: idle timeout, session crash detection, terminal phases (done,
failed, needs_human, merged). Sets _MONITOR_LOOP_EXIT for the caller.

											
										
										
											2026-03-18 16:40:51 +00:00
+								      continue
 								    fi
 								    # Phase changed
 								    last_mtime="$phase_mtime"
-												fix: fix: phase-handler.sh references LAST_PHASE_MTIME which is now internal to monitor_phase_loop (#181)

Export LAST_PHASE_MTIME from monitor_phase_loop before invoking the callback
so that phase-handler.sh can compare phase file mtimes inside the awaiting_review
inner poll loop without hitting an unbound variable error under set -u.

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-18 17:26:54 +00:00
+								    # shellcheck disable=SC2034  # read by phase-handler.sh callback
 								    LAST_PHASE_MTIME="$phase_mtime"
-												fix: implement monitor_phase_loop in agent-session.sh

Generic phase monitoring loop with callback for agent-specific handling.
Handles: idle timeout, session crash detection, terminal phases (done,
failed, needs_human, merged). Sets _MONITOR_LOOP_EXIT for the caller.

											
										
										
											2026-03-18 16:40:51 +00:00
+								    idle_elapsed=0
-												fix: `idle_pane_count` not reset in phase-changed branch of monitor_phase_loop (#436)

When a phase change is detected (mtime changes), idle_elapsed was reset
but idle_pane_count was not. This meant idle counts accumulated before a
phase write carried into subsequent polls, so N consecutive idle polls
could be reached with fewer than N actual consecutive idle polls.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-21 17:14:54 +00:00
+								    idle_pane_count=0
-												fix: implement monitor_phase_loop in agent-session.sh

Generic phase monitoring loop with callback for agent-specific handling.
Handles: idle timeout, session crash detection, terminal phases (done,
failed, needs_human, merged). Sets _MONITOR_LOOP_EXIT for the caller.

											
										
										
											2026-03-18 16:40:51 +00:00
 								    # Terminal phases
 								    case "$current_phase" in
 								      PHASE:done|PHASE:merged)
 								        _MONITOR_LOOP_EXIT="done"
 								        if type "${callback}" &>/dev/null; then
 								          "$callback" "$current_phase"
 								        fi
 								        return 0
 								        ;;
-												fix: feat: unified escalation — single PHASE:escalate path for all agents (#510)

Replace PHASE:needs_human with PHASE:escalate across all agent types.
Consolidates 6 overlapping escalation mechanisms into one unified path:
detect → notify via Matrix → session stays alive → human reply injected → resume.

Key changes:
- PHASE:escalate replaces PHASE:needs_human everywhere (16 files)
- CI exhausted now escalates instead of immediately marking blocked
- Matrix listener routes free-text replies to vault tmux sessions
- Vault agent writes PHASE:escalate files for procurement requests
- Supervisor monitors PHASE:escalate sessions in health checks
- 24h timeout on escalation → blocked label + session killed
- All 38 phase protocol tests updated and passing

Supersedes #462, #458, #465.

											
										
										
											2026-03-21 19:39:04 +00:00
+								      PHASE:failed|PHASE:escalate)
-												fix: implement monitor_phase_loop in agent-session.sh

Generic phase monitoring loop with callback for agent-specific handling.
Handles: idle timeout, session crash detection, terminal phases (done,
failed, needs_human, merged). Sets _MONITOR_LOOP_EXIT for the caller.

											
										
										
											2026-03-18 16:40:51 +00:00
+								        _MONITOR_LOOP_EXIT="$current_phase"
 								        if type "${callback}" &>/dev/null; then
 								          "$callback" "$current_phase"
 								        fi
 								        return 0
 								        ;;
 								    esac
 								    # Non-terminal phase — call callback
 								    if type "${callback}" &>/dev/null; then
 								      "$callback" "$current_phase"
 								    fi
 								  done
 								}
-												fix: feat: SessionStart compact hook re-injects phase protocol after context compaction (#274)

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>

											
										
										
											2026-03-20 23:27:32 +00:00
+								# Write context to a file for re-injection after context compaction.
 								# The SessionStart compact hook reads this file and outputs it to stdout.
 								# Args: phase_file content
 								write_compact_context() {
 								  # $1: path of the phase file; $2: text to persist for later re-injection.
 								  local phase_path="$1" payload="$2"
 								  # The context file sits next to the phase file: a trailing ".phase" is
 								  # swapped for ".context"; any other name simply gets ".context" appended.
 								  # Any previous context is overwritten.
 								  printf '%s\n' "$payload" > "${phase_path%.phase}.context"
 								}
-												fix: feat: gardener-agent.sh — tmux + Claude interactive gardener using agent-session.sh (#159) (#163)

Fixes #159

## Changes
Add gardener-agent.sh (tmux+Claude) and lib/agent-session.sh (shared helpers). gardener-poll.sh slimmed to cron wrapper; grooming delegated to new agent; recipe engine for CI escalations unchanged.

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/disinto/pulls/163
Reviewed-by: review_bot <review_bot@noreply.codeberg.org>

											
										
										
											2026-03-18 16:21:07 +01:00
+								# Kill a tmux session gracefully (no-op if not found).
 								agent_kill_session() {
 								  # Args: session_name
 								  # Returns 0 when no session name is given; otherwise the status of the
 								  # final marker cleanup.
 								  local session="${1:-}"
 								  # Defensive guard: callers must pass the session name explicitly. Without
 								  # one there is nothing to kill and no per-session file to clean up, so do
 								  # not touch malformed paths such as /tmp/claude-idle-.ts.
 								  if [ -z "$session" ]; then
 								    return 0
 								  fi
 								  # Best effort: a session that is already gone is not an error.
 								  tmux kill-session -t "$session" 2>/dev/null || true
 								  # Remove the per-session state files kept in /tmp:
 								  #   claude-idle-*.ts       idle marker written by the Stop hook
 								  #   phase-changed-*.marker phase-write marker from the PostToolUse hook
 								  #   claude-exited-*.ts     exit marker from the SessionEnd hook
 								  #   claude-nudge-*.count   nudge counter used by the Stop hook
 								  rm -f \
 								    "/tmp/claude-idle-${session}.ts" \
 								    "/tmp/phase-changed-${session}.marker" \
 								    "/tmp/claude-exited-${session}.ts" \
 								    "/tmp/claude-nudge-${session}.count"
 								}
-												feat: CI smoke test — syntax check + function resolution for all agent scripts (#177)

Co-Authored-By: Claude Sonnet 4.6 <noreply@anthropic.com>

											
										
										
											2026-03-18 17:11:02 +00:00
 								# Print the first line of a phase file with every whitespace character
 								# removed. A missing or unreadable file yields empty output, not an error.
 								# Usage: read_phase [file]  — falls back to $PHASE_FILE when no file is given
 								read_phase() {
 								  local phase_path="${1:-${PHASE_FILE:-}}"
 								  {
 								    # Read failures are swallowed on purpose so callers just see "".
 								    head -n 1 "$phase_path" 2>/dev/null || true
 								  } | tr -d '[:space:]'
 								}