#!/usr/bin/env bash
# formula-session.sh — Shared helpers for formula-driven cron agents
#
# Provides reusable functions for the common cron-wrapper + tmux-session
# pattern used by planner-run.sh and gardener-agent.sh.
#
# Functions:
#   acquire_cron_lock LOCK_FILE                      — PID lock with stale cleanup
#   check_memory [MIN_MB]                            — skip if available RAM too low
#   load_formula FORMULA_FILE                        — sets FORMULA_CONTENT
#   build_context_block FILE [FILE ...]              — sets CONTEXT_BLOCK
#   start_formula_session SESSION WORKDIR PHASE_FILE — create tmux + claude
#   build_scratch_instruction SCRATCH_FILE           — prints scratch-file prompt block
#   read_scratch_context SCRATCH_FILE                — prints previous scratch context
#   build_prompt_footer [EXTRA_API]                  — sets PROMPT_FOOTER (API ref + env + phase)
#   run_formula_and_monitor AGENT [TIMEOUT]          — session start, inject, monitor, log
#   formula_phase_callback PHASE                     — standard crash-recovery callback
#
# Requires: lib/agent-session.sh sourced first (for create_agent_session,
# agent_kill_session, agent_inject_into_session).
# Globals used by formula_phase_callback: SESSION_NAME, PHASE_FILE,
# PROJECT_REPO_ROOT, PROMPT (set by the calling script).

# ── Cron guards ──────────────────────────────────────────────────────────

# acquire_cron_lock LOCK_FILE
# Acquires a PID lock. Exits 0 if another instance is running.
# Sets an EXIT trap to clean up the lock file.
#
# Arguments: $1 - path of the lock file (stored in the global _CRON_LOCK_FILE
#                 so the EXIT trap can still see it after the function returns)
# Calls:     log (must already be defined by the calling script)
# Note:      installing the EXIT trap replaces any EXIT trap set earlier.
acquire_cron_lock() {
  _CRON_LOCK_FILE="$1"
  if [ -f "$_CRON_LOCK_FILE" ]; then
    local lock_pid
    lock_pid=$(cat "$_CRON_LOCK_FILE" 2>/dev/null || true)
    # Only a positive integer is a usable PID. "0" or a negative value would
    # make `kill -0` probe a process group (which succeeds) and block every
    # future run, so such content is treated as a stale lock.
    if [[ "$lock_pid" =~ ^[1-9][0-9]*$ ]] && kill -0 "$lock_pid" 2>/dev/null; then
      log "run: already running (PID $lock_pid)"
      exit 0
    fi
    # Stale or corrupt lock: the recorded process is gone.
    rm -f "$_CRON_LOCK_FILE"
  fi
  echo $$ > "$_CRON_LOCK_FILE"
  # Single quotes: the path is resolved when the trap fires, via the global.
  trap 'rm -f "$_CRON_LOCK_FILE"' EXIT
}

# check_memory [MIN_MB]
# Exits 0 (skip) if available memory is below MIN_MB (default 2000).
check_memory() {
  # $1 - minimum available memory in MB (default 2000).
  # Calls log (must already be defined by the calling script).
  local min_mb="${1:-2000}"
  local avail_mb
  # LC_ALL=C keeps the "Mem:" row label untranslated; column 7 is the
  # "available" column of `free -m`.
  avail_mb=$(LC_ALL=C free -m | awk '/^Mem:/{print $7}')
  # Column 7 is missing or non-numeric when `free` is absent or prints a
  # different layout. Keep skipping the run in that case, but say why.
  if ! [[ "$avail_mb" =~ ^[0-9]+$ ]]; then
    log "run: skipping — could not determine available memory (need ${min_mb}MB)"
    exit 0
  fi
  if [ "$avail_mb" -lt "$min_mb" ]; then
    log "run: skipping — only ${avail_mb}MB available (need ${min_mb})"
    exit 0
  fi
}

# ── Formula loading ──────────────────────────────────────────────────────

# load_formula FORMULA_FILE
# Reads formula TOML into FORMULA_CONTENT. Exits 1 if missing.
load_formula() {
  local formula_file="$1"
  if [ ! -f "$formula_file" ]; then
    log "ERROR: formula not found: $formula_file"
    exit 1
  fi
  # shellcheck disable=SC2034  # consumed by the calling script
  FORMULA_CONTENT=$(<"$formula_file")
}

# build_context_block FILE [FILE ...]
# Reads each file from $PROJECT_REPO_ROOT and builds CONTEXT_BLOCK.
# Each existing file contributes a "### <relative path>" heading followed by
# its content; paths that are not regular files are silently skipped.
build_context_block() {
  CONTEXT_BLOCK=""
  local ctx ctx_path
  for ctx in "$@"; do
    ctx_path="${PROJECT_REPO_ROOT}/${ctx}"
    if [ -f "$ctx_path" ]; then
      CONTEXT_BLOCK="${CONTEXT_BLOCK}
### ${ctx}
$(<"$ctx_path")
"
    fi
  done
}

# ── Session management ───────────────────────────────────────────────────

# start_formula_session SESSION WORKDIR PHASE_FILE
# Kills stale session, resets phase file, creates new tmux + claude session.
# Returns 0 on success, 1 on failure.
start_formula_session() {
  local session="$1" workdir="$2" phase_file="$3"
  agent_kill_session "$session"
  # Remove the old phase file so a previous run's phase is not picked up.
  rm -f "$phase_file"
  log "Creating tmux session: ${session}"
  if ! create_agent_session "$session" "$workdir" "$phase_file"; then
    log "ERROR: failed to create tmux session ${session}"
    return 1
  fi
}

# formula_phase_callback PHASE
# Standard crash-recovery phase callback for formula sessions.
# Requires globals: SESSION_NAME, PHASE_FILE, PROJECT_REPO_ROOT, PROMPT.
# Uses _FORMULA_CRASH_COUNT (auto-initialized) for single-retry limit.
# shellcheck disable=SC2154  # SESSION_NAME, PHASE_FILE, PROJECT_REPO_ROOT, PROMPT set by caller
formula_phase_callback() {
  # $1 - phase string to react to (e.g. PHASE:crashed, PHASE:done).
  # The target session is _MONITOR_SESSION when set, else SESSION_NAME.
  local phase="$1"
  log "phase: ${phase}"
  case "$phase" in
    PHASE:crashed)
      # Only one recovery attempt per run: a second crash is reported and
      # left alone.
      if [ "${_FORMULA_CRASH_COUNT:-0}" -gt 0 ]; then
        log "ERROR: session crashed again after recovery — giving up"
        return 0
      fi
      _FORMULA_CRASH_COUNT=$(( ${_FORMULA_CRASH_COUNT:-0} + 1 ))
      log "WARNING: tmux session died unexpectedly — attempting recovery"
      if create_agent_session "${_MONITOR_SESSION:-$SESSION_NAME}" "$PROJECT_REPO_ROOT" "$PHASE_FILE" 2>/dev/null; then
        # Re-send the original prompt to the fresh session.
        agent_inject_into_session "${_MONITOR_SESSION:-$SESSION_NAME}" "$PROMPT"
        log "Recovery session started"
      else
        log "ERROR: could not restart session after crash"
      fi
      ;;
    PHASE:done|PHASE:failed|PHASE:needs_human|PHASE:merged)
      # Terminal phases: tear the session down.
      agent_kill_session "${_MONITOR_SESSION:-$SESSION_NAME}"
      ;;
  esac
}

# ── Scratch file helpers (compaction survival) ────────────────────────────

# build_scratch_instruction SCRATCH_FILE
# Returns a prompt block instructing Claude to periodically flush context
# to a scratch file so understanding survives context compaction.
# The block is written to stdout; SCRATCH_FILE is interpolated into it.
build_scratch_instruction() {
  local scratch_file="$1"
  cat <<_SCRATCH_EOF_
## Context scratch file (compaction survival)

Periodically (every 10-15 tool calls), write a summary of:
- What you have discovered so far
- Decisions made and why
- What remains to do

to: ${scratch_file}

If you find this file exists when you start, read it first — it is your previous context.
This file is ephemeral — not evidence or permanent memory, just a compaction survival mechanism.
_SCRATCH_EOF_
}

# read_scratch_context SCRATCH_FILE
# If the scratch file exists, returns a context block for prompt injection.
# Returns empty string if the file does not exist.
read_scratch_context() {
  # $1 - path of the scratch file; output goes to stdout.
  local scratch_file="$1"
  if [ -f "$scratch_file" ]; then
    printf '## Previous context (from scratch file)\n%s\n' "$(cat "$scratch_file")"
  fi
}

# ── Prompt + monitor helpers ──────────────────────────────────────────────

# build_prompt_footer [EXTRA_API_LINES]
# Assembles the common Codeberg API reference + environment + phase protocol
# block for formula prompts. Sets PROMPT_FOOTER.
# Pass additional API endpoint lines (pre-formatted, newline-prefixed) via $1.
# Requires globals: CODEBERG_API, FACTORY_ROOT, PROJECT_REPO_ROOT,
#   PRIMARY_BRANCH, PHASE_FILE.
build_prompt_footer() {
  local extra_api="${1:-}"
  # \$CODEBERG_TOKEN is escaped on purpose: the prompt must carry the variable
  # name, never the token value.
  # shellcheck disable=SC2034  # consumed by the calling script's PROMPT
  PROMPT_FOOTER="## Codeberg API reference
Base URL: ${CODEBERG_API}
Auth header: -H \"Authorization: token \$CODEBERG_TOKEN\"
  Read issue:  curl -sf -H \"Authorization: token \$CODEBERG_TOKEN\" '${CODEBERG_API}/issues/{number}' | jq '.body'
  Create issue: curl -sf -X POST -H \"Authorization: token \$CODEBERG_TOKEN\" -H 'Content-Type: application/json' '${CODEBERG_API}/issues' -d '{\"title\":\"...\",\"body\":\"...\",\"labels\":[LABEL_ID]}'${extra_api}
  List labels: curl -sf -H \"Authorization: token \$CODEBERG_TOKEN\" '${CODEBERG_API}/labels'
NEVER echo or include the actual token value in output — always reference \$CODEBERG_TOKEN.

## Environment
FACTORY_ROOT=${FACTORY_ROOT}
PROJECT_REPO_ROOT=${PROJECT_REPO_ROOT}
PRIMARY_BRANCH=${PRIMARY_BRANCH}
PHASE_FILE=${PHASE_FILE}

## Phase protocol (REQUIRED)
When all work is done:
  echo 'PHASE:done' > '${PHASE_FILE}'
On unrecoverable error:
  printf 'PHASE:failed\nReason: %s\n' 'describe error' > '${PHASE_FILE}'"
}

# run_formula_and_monitor AGENT_NAME [TIMEOUT]
# Starts the formula session, injects PROMPT, monitors phase, and logs result.
# Requires globals: SESSION_NAME, PHASE_FILE, PROJECT_REPO_ROOT, PROMPT,
#   CODEBERG_REPO, CLAUDE_MODEL (exported).
# shellcheck disable=SC2154  # SESSION_NAME, PHASE_FILE, PROJECT_REPO_ROOT, PROMPT set by caller
run_formula_and_monitor() {
  # $1 - agent name, used in log lines and matrix messages
  # $2 - timeout passed to monitor_phase_loop (default 7200)
  # Sets the globals _FORMULA_CRASH_COUNT and FINAL_PHASE.
  # Exits 1 if the session cannot be started.
  local agent_name="$1"
  local timeout="${2:-7200}"

  if ! start_formula_session "$SESSION_NAME" "$PROJECT_REPO_ROOT" "$PHASE_FILE"; then
    exit 1
  fi

  agent_inject_into_session "$SESSION_NAME" "$PROMPT"
  log "Prompt sent to tmux session"
  # Notifications are best-effort: a failing matrix_send must not stop the run.
  matrix_send "$agent_name" "${agent_name^} session started for ${CODEBERG_REPO}" 2>/dev/null || true

  log "Monitoring phase file: ${PHASE_FILE}"
  # Reset the retry budget consumed by formula_phase_callback.
  _FORMULA_CRASH_COUNT=0
  monitor_phase_loop "$PHASE_FILE" "$timeout" "formula_phase_callback"

  FINAL_PHASE=$(read_phase "$PHASE_FILE")
  log "Final phase: ${FINAL_PHASE:-none}"

  if [ "$FINAL_PHASE" != "PHASE:done" ]; then
    # _MONITOR_LOOP_EXIT is read here but never set in this function;
    # presumably monitor_phase_loop sets it — confirm against that helper.
    case "${_MONITOR_LOOP_EXIT:-}" in
      idle_prompt)
        log "${agent_name}: Claude returned to prompt without writing phase signal"
        ;;
      idle_timeout)
        log "${agent_name}: timed out with no phase signal"
        ;;
      *)
        log "${agent_name} finished without PHASE:done (phase: ${FINAL_PHASE:-none}, exit: ${_MONITOR_LOOP_EXIT:-})"
        ;;
    esac
  fi

  matrix_send "$agent_name" "${agent_name^} session finished (${FINAL_PHASE:-no phase})" 2>/dev/null || true
  log "--- ${agent_name^} run done ---"
}