refactor: planner maintains AGENTS.md instead of STATE.md
STATE.md was a machine-generated system description that was always worse than the human-curated AGENTS.md. Killed STATE.md entirely. Phase 1: Reviews recent git history against AGENTS.md, suggests updates via PR to keep the file tree, conventions, and architecture descriptions current. Phase 2: Gap analysis — compares AGENTS.md + VISION.md + open issues, creates backlog issues for missing capabilities.
This commit is contained in:
parent
e1101894d6
commit
679c62e7cb
1 changed files with 95 additions and 118 deletions
|
|
@ -1,10 +1,10 @@
|
|||
#!/usr/bin/env bash
|
||||
# =============================================================================
|
||||
# planner-agent.sh — Rebuild STATE.md from git history, then gap-analyse
|
||||
# planner-agent.sh — Keep AGENTS.md current, then gap-analyse against VISION.md
|
||||
#
|
||||
# Two-phase planner run:
|
||||
# Phase 1: Rebuild STATE.md from git log + closed issues (compact snapshot)
|
||||
# Phase 2: Compare STATE.md vs VISION.md, create backlog issues for gaps
|
||||
# Phase 1: Review recent git history, suggest AGENTS.md updates via PR
|
||||
# Phase 2: Compare AGENTS.md vs VISION.md, create backlog issues for gaps
|
||||
#
|
||||
# Usage: planner-agent.sh (no args — uses env vars from .env / env.sh)
|
||||
# =============================================================================
|
||||
|
|
@ -19,7 +19,7 @@ source "$FACTORY_ROOT/lib/env.sh"
|
|||
LOG_FILE="$SCRIPT_DIR/planner.log"
|
||||
CLAUDE_TIMEOUT="${CLAUDE_TIMEOUT:-3600}"
|
||||
MARKER_FILE="${PROJECT_REPO_ROOT}/.last-planner-sha"
|
||||
STATE_FILE="${PROJECT_REPO_ROOT}/STATE.md"
|
||||
AGENTS_FILE="${PROJECT_REPO_ROOT}/AGENTS.md"
|
||||
VISION_FILE="${PROJECT_REPO_ROOT}/VISION.md"
|
||||
|
||||
log() { echo "[$(date -u +%Y-%m-%dT%H:%M:%S)Z] $*" >> "$LOG_FILE"; }
|
||||
|
|
@ -39,139 +39,127 @@ if [ -f "$MARKER_FILE" ]; then
|
|||
if git cat-file -e "$LAST_SHA" 2>/dev/null; then
|
||||
GIT_RANGE="${LAST_SHA}..HEAD"
|
||||
else
|
||||
log "WARNING: marker SHA ${LAST_SHA:0:7} not found, using 30-day window"
|
||||
first_sha=""
|
||||
first_sha=$(git log --format=%H --after='30 days ago' --reverse 2>/dev/null | head -1) || true
|
||||
GIT_RANGE="${first_sha:-HEAD~30}..HEAD"
|
||||
log "WARNING: marker SHA ${LAST_SHA:0:7} not found, using 7-day window"
|
||||
first_sha=$(git log --format=%H --after='7 days ago' --reverse 2>/dev/null | head -1) || true
|
||||
GIT_RANGE="${first_sha:-HEAD~20}..HEAD"
|
||||
fi
|
||||
else
|
||||
log "No marker file, using 30-day window"
|
||||
first_sha=$(git log --format=%H --after='30 days ago' --reverse 2>/dev/null | head -1) || true
|
||||
GIT_RANGE="${first_sha:-HEAD~30}..HEAD"
|
||||
log "No marker file, using 7-day window"
|
||||
first_sha=$(git log --format=%H --after='7 days ago' --reverse 2>/dev/null | head -1) || true
|
||||
GIT_RANGE="${first_sha:-HEAD~20}..HEAD"
|
||||
fi
|
||||
|
||||
GIT_LOG=$(git log "$GIT_RANGE" --oneline --no-merges 2>/dev/null || true)
|
||||
MERGE_LOG=$(git log "$GIT_RANGE" --oneline --merges 2>/dev/null || true)
|
||||
COMMIT_COUNT=$(echo "$GIT_LOG" | grep -c '.' || true)
|
||||
log "Range: $GIT_RANGE ($COMMIT_COUNT commits)"
|
||||
|
||||
if [ "$COMMIT_COUNT" -eq 0 ] && [ -f "$STATE_FILE" ]; then
|
||||
log "No new commits since last run — skipping STATE.md rebuild"
|
||||
# Still run gap analysis (vision or issues may have changed)
|
||||
# ── File tree (for context on what exists) ───────────────────────────────
|
||||
FILE_TREE=$(find . -maxdepth 3 -type f \( -name '*.sol' -o -name '*.ts' -o -name '*.sh' -o -name '*.md' -o -name '*.json' \) \
|
||||
! -path '*/node_modules/*' ! -path '*/.git/*' ! -path '*/out/*' ! -path '*/cache/*' ! -path '*/dist/*' \
|
||||
2>/dev/null | sort | head -200)
|
||||
|
||||
# ── Phase 1: AGENTS.md maintenance ──────────────────────────────────────
|
||||
if [ "$COMMIT_COUNT" -eq 0 ]; then
|
||||
log "No new commits since last run — skipping AGENTS.md review"
|
||||
else
|
||||
# ── Phase 1: Rebuild STATE.md ──────────────────────────────────────────
|
||||
log "Phase 1: rebuilding STATE.md"
|
||||
log "Phase 1: reviewing AGENTS.md against recent changes"
|
||||
|
||||
CURRENT_STATE=""
|
||||
[ -f "$STATE_FILE" ] && CURRENT_STATE=$(cat "$STATE_FILE")
|
||||
CURRENT_AGENTS=""
|
||||
[ -f "$AGENTS_FILE" ] && CURRENT_AGENTS=$(cat "$AGENTS_FILE")
|
||||
|
||||
# Read project docs for high-level understanding
|
||||
PROJECT_DOCS=""
|
||||
for doc in AGENTS.md docs/PRODUCT-TRUTH.md docs/ARCHITECTURE.md docs/UX-DECISIONS.md; do
|
||||
[ -f "${PROJECT_REPO_ROOT}/${doc}" ] && \
|
||||
PROJECT_DOCS="${PROJECT_DOCS}
|
||||
### ${doc}
|
||||
$(cat "${PROJECT_REPO_ROOT}/${doc}")
|
||||
"
|
||||
done
|
||||
if [ -z "$CURRENT_AGENTS" ]; then
|
||||
log "No AGENTS.md found — skipping phase 1"
|
||||
else
|
||||
# Files changed in this range
|
||||
FILES_CHANGED=$(git diff --name-only "$GIT_RANGE" 2>/dev/null | sort -u || true)
|
||||
|
||||
# Fetch recently closed issues for context
|
||||
CLOSED_ISSUES=$(codeberg_api GET "/issues?state=closed&type=issues&limit=30&sort=updated&direction=desc" 2>/dev/null | \
|
||||
jq -r '.[] | "#\(.number) \(.title)"' 2>/dev/null || true)
|
||||
PHASE1_PROMPT="You maintain AGENTS.md for the ${PROJECT_NAME} repository. AGENTS.md is the primary onboarding document — it describes the project's architecture, file layout, conventions, and how to work in the codebase.
|
||||
|
||||
PHASE1_PROMPT="You are maintaining STATE.md — a compact factual snapshot of what ${PROJECT_NAME} currently is and does.
|
||||
## Current AGENTS.md
|
||||
${CURRENT_AGENTS}
|
||||
|
||||
## Project Documentation (read for context — understand the system before writing)
|
||||
${PROJECT_DOCS:-"(no docs found)"}
|
||||
## Recent commits (since last review)
|
||||
${GIT_LOG}
|
||||
|
||||
## Current STATE.md
|
||||
${CURRENT_STATE:-"(empty — create from scratch)"}
|
||||
## Files changed
|
||||
${FILES_CHANGED}
|
||||
|
||||
## New commits since last snapshot
|
||||
${GIT_LOG:-"(none)"}
|
||||
|
||||
## Merge commits
|
||||
${MERGE_LOG:-"(none)"}
|
||||
|
||||
## Recently closed issues
|
||||
${CLOSED_ISSUES:-"(none)"}
|
||||
## Repository file tree (top 3 levels)
|
||||
${FILE_TREE}
|
||||
|
||||
## Task
|
||||
Update STATE.md to describe what the project IS right now — its architecture, capabilities, and current state.
|
||||
Review AGENTS.md against the recent changes. Output an UPDATED version of AGENTS.md that:
|
||||
- Reflects any new directories, scripts, tools, or conventions introduced by the recent commits
|
||||
- Removes or updates references to things that were deleted or renamed
|
||||
- Keeps the existing structure, voice, and level of detail — this is a human-curated document, preserve its character
|
||||
- Does NOT add issue/PR references — AGENTS.md is timeless documentation, not a changelog
|
||||
- Does NOT rewrite sections that haven't changed — preserve the original text where possible
|
||||
|
||||
### Writing style
|
||||
- Describe the SYSTEM, not the changes. Think: 'What would a new developer need to know?'
|
||||
- Lead with what the project does at a high level, then drill into subsystems
|
||||
- Group related capabilities together (e.g. all evolution stuff in one bullet)
|
||||
- Issue/PR references (#42) are good for traceability but should SUPPORT descriptions, not replace them
|
||||
- Bad: 'evolve.sh: auto-incrementing results directory (#752), cleans stale tmpdirs (#750)'
|
||||
- Good: 'Evolution pipeline runs perpetually on a dedicated VPS, breeding Push3 optimizer bytecode through mutation, crossover, and elitism against a revm fitness evaluator'
|
||||
- No dates, no changelog framing, no 'fixed X' or 'added Y' language
|
||||
- No more than 25 bullet points — be concise and architectural
|
||||
- First bullet should be a one-line project description
|
||||
If AGENTS.md is already fully up to date and no changes are needed, output exactly: NO_CHANGES
|
||||
|
||||
Your response must start with '- ' on the very first character. No summary, no meta-commentary, no preamble, no markdown fences, no 'Here is...' or 'I have...'. ONLY the bullet list. Any response not starting with '- ' will be rejected."
|
||||
Otherwise, output the complete updated AGENTS.md content (not a diff, the full file).
|
||||
Do NOT wrap the output in markdown fences. Start directly with the file content."
|
||||
|
||||
PHASE1_OUTPUT=$(timeout "$CLAUDE_TIMEOUT" claude -p "$PHASE1_PROMPT" \
|
||||
--model sonnet \
|
||||
2>/dev/null) || {
|
||||
log "ERROR: claude exited with code $? during phase 1"
|
||||
exit 1
|
||||
}
|
||||
PHASE1_OUTPUT=$(timeout "$CLAUDE_TIMEOUT" claude -p "$PHASE1_PROMPT" \
|
||||
--model sonnet \
|
||||
--dangerously-skip-permissions \
|
||||
2>/dev/null) || {
|
||||
log "ERROR: claude exited with code $? during phase 1"
|
||||
# Update marker even on failure to avoid re-processing same range
|
||||
echo "$HEAD_SHA" > "$MARKER_FILE"
|
||||
exit 1
|
||||
}
|
||||
|
||||
if [ -z "$PHASE1_OUTPUT" ]; then
|
||||
log "ERROR: empty output from phase 1"
|
||||
exit 1
|
||||
fi
|
||||
if echo "$PHASE1_OUTPUT" | grep -q "^NO_CHANGES$"; then
|
||||
log "AGENTS.md is up to date — no changes needed"
|
||||
elif [ -n "$PHASE1_OUTPUT" ]; then
|
||||
# Write updated AGENTS.md and create PR
|
||||
TEMP_FILE=$(mktemp "${AGENTS_FILE}.XXXXXX")
|
||||
printf '%s\n' "$PHASE1_OUTPUT" > "$TEMP_FILE"
|
||||
mv "$TEMP_FILE" "$AGENTS_FILE"
|
||||
|
||||
# Strip any non-bullet preamble (Sonnet sometimes narrates before the bullets)
|
||||
PHASE1_OUTPUT=$(echo "$PHASE1_OUTPUT" | sed -n '/^- /,$p')
|
||||
if ! git diff --quiet "$AGENTS_FILE" 2>/dev/null; then
|
||||
branch_name="chore/planner-agents-$(date -u +%Y%m%d)"
|
||||
git checkout -B "$branch_name" 2>/dev/null
|
||||
git add "$AGENTS_FILE"
|
||||
git commit -m "chore: planner update AGENTS.md" --quiet 2>/dev/null
|
||||
git push -f origin "$branch_name" --quiet 2>/dev/null || { log "ERROR: failed to push $branch_name"; git checkout "${PRIMARY_BRANCH}" 2>/dev/null; }
|
||||
git checkout "${PRIMARY_BRANCH}" 2>/dev/null
|
||||
# Restore AGENTS.md to master version after branch push
|
||||
git checkout "$AGENTS_FILE" 2>/dev/null || true
|
||||
|
||||
# Validate output has bullet points
|
||||
if [ -z "$PHASE1_OUTPUT" ] || ! echo "$PHASE1_OUTPUT" | head -1 | grep -q '^- '; then
|
||||
log "ERROR: phase 1 output contains no bullet list"
|
||||
exit 1
|
||||
fi
|
||||
|
||||
# Atomic write
|
||||
TEMP_STATE=$(mktemp "${STATE_FILE}.XXXXXX")
|
||||
printf '%s\n' "$PHASE1_OUTPUT" > "$TEMP_STATE"
|
||||
mv "$TEMP_STATE" "$STATE_FILE"
|
||||
|
||||
# Commit STATE.md via PR (master is protected)
|
||||
if ! git diff --quiet "$STATE_FILE" 2>/dev/null; then
|
||||
branch_name="chore/planner-state-$(date -u +%Y%m%d)"
|
||||
git checkout -B "$branch_name" 2>/dev/null
|
||||
git add "$STATE_FILE"
|
||||
git commit -m "chore: planner rebuild STATE.md" --quiet 2>/dev/null
|
||||
git push -f origin "$branch_name" --quiet 2>/dev/null || { log "ERROR: failed to push $branch_name"; git checkout "${PRIMARY_BRANCH}" 2>/dev/null; return 1; }
|
||||
git checkout "${PRIMARY_BRANCH}" 2>/dev/null
|
||||
|
||||
# Create or update PR (filter by head ref — Codeberg's head param is unreliable)
|
||||
EXISTING_PR=$(codeberg_api GET "/pulls?state=open&limit=50" 2>/dev/null | jq -r --arg branch "$branch_name" '.[] | select(.head.ref == $branch) | .number' | head -1)
|
||||
if [ -z "$EXISTING_PR" ]; then
|
||||
PR_RESPONSE=$(codeberg_api POST "/pulls" "{\"title\":\"chore: planner rebuild STATE.md\",\"head\":\"${branch_name}\",\"base\":\"${PRIMARY_BRANCH}\",\"body\":\"Automated STATE.md rebuild from git history + closed issues.\"}" 2>/dev/null)
|
||||
PR_NUM=$(echo "$PR_RESPONSE" | jq -r '.number // empty')
|
||||
if [ -n "$PR_NUM" ]; then
|
||||
log "Created PR #${PR_NUM} for STATE.md update"
|
||||
matrix_send "planner" "📋 PR #${PR_NUM}: planner rebuild STATE.md" 2>/dev/null || true
|
||||
# Create or update PR
|
||||
EXISTING_PR=$(codeberg_api GET "/pulls?state=open&limit=50" 2>/dev/null | \
|
||||
jq -r --arg branch "$branch_name" '.[] | select(.head.ref == $branch) | .number' | head -1)
|
||||
if [ -z "$EXISTING_PR" ]; then
|
||||
PR_RESPONSE=$(codeberg_api POST "/pulls" \
|
||||
"{\"title\":\"chore: planner update AGENTS.md\",\"head\":\"${branch_name}\",\"base\":\"${PRIMARY_BRANCH}\",\"body\":\"Automated AGENTS.md update based on recent commits (${COMMIT_COUNT} changes since last review).\"}" \
|
||||
2>/dev/null)
|
||||
PR_NUM=$(echo "$PR_RESPONSE" | jq -r '.number // empty')
|
||||
if [ -n "$PR_NUM" ]; then
|
||||
log "Created PR #${PR_NUM} for AGENTS.md update"
|
||||
matrix_send "planner" "📋 PR #${PR_NUM}: planner update AGENTS.md (${COMMIT_COUNT} commits reviewed)" 2>/dev/null || true
|
||||
else
|
||||
log "ERROR: failed to create PR"
|
||||
fi
|
||||
else
|
||||
log "Updated existing PR #${EXISTING_PR}"
|
||||
fi
|
||||
else
|
||||
log "ERROR: failed to create PR"
|
||||
log "AGENTS.md diff was empty after write — no PR needed"
|
||||
fi
|
||||
else
|
||||
log "Updated existing PR #${EXISTING_PR}"
|
||||
fi
|
||||
fi
|
||||
|
||||
# Update marker
|
||||
echo "$HEAD_SHA" > "$MARKER_FILE"
|
||||
log "Phase 1 done — STATE.md rebuilt ($(wc -l < "$STATE_FILE") lines)"
|
||||
log "Phase 1 done"
|
||||
fi
|
||||
|
||||
# ── Phase 2: Gap analysis ───────────────────────────────────────────────
|
||||
log "Phase 2: gap analysis"
|
||||
|
||||
CURRENT_STATE=$(cat "$STATE_FILE" 2>/dev/null || true)
|
||||
AGENTS_CONTENT=$(cat "$AGENTS_FILE" 2>/dev/null || true)
|
||||
VISION=""
|
||||
[ -f "$VISION_FILE" ] && VISION=$(cat "$VISION_FILE")
|
||||
|
||||
|
|
@ -190,34 +178,27 @@ fi
|
|||
|
||||
OPEN_SUMMARY=$(echo "$OPEN_ISSUES" | jq -r '.[] | "#\(.number) [\(.labels | map(.name) | join(","))] \(.title)"' 2>/dev/null || true)
|
||||
|
||||
# Fetch vision-labeled issues specifically
|
||||
VISION_ISSUES=$(echo "$OPEN_ISSUES" | jq -r '.[] | select(.labels | map(.name) | index("vision")) | "#\(.number) \(.title)\n\(.body)"' 2>/dev/null || true)
|
||||
|
||||
PHASE2_PROMPT="You are the planner for ${CODEBERG_REPO}. Your job: find gaps between the project vision and current reality.
|
||||
|
||||
## VISION.md (human-maintained goals)
|
||||
${VISION}
|
||||
|
||||
## STATE.md (current project snapshot)
|
||||
${CURRENT_STATE}
|
||||
|
||||
## Vision-labeled issues (goal anchors)
|
||||
${VISION_ISSUES:-"(none)"}
|
||||
## AGENTS.md (current project state — the ground truth)
|
||||
${AGENTS_CONTENT}
|
||||
|
||||
## All open issues
|
||||
${OPEN_SUMMARY}
|
||||
|
||||
## Task
|
||||
Identify gaps — things implied by VISION.md that are neither reflected in STATE.md nor covered by an existing open issue.
|
||||
Identify gaps — things implied by VISION.md that are neither reflected in AGENTS.md nor covered by an existing open issue.
|
||||
|
||||
For each gap, output a JSON object (one per line, no array wrapper):
|
||||
{\"title\": \"action-oriented title\", \"body\": \"problem statement + why it matters + rough approach\", \"depends\": [list of blocking issue numbers or empty]}
|
||||
|
||||
## Rules
|
||||
- Max 5 new issues — focus on highest-leverage gaps only
|
||||
- Do NOT create issues for things already in STATE.md (already done)
|
||||
- Do NOT create issues for things already described in AGENTS.md (already done)
|
||||
- Do NOT create issues that overlap with ANY existing open issue, even partially
|
||||
- Do NOT create issues about vision items, tech-debt, or in-progress work
|
||||
- Each title should be a plain, action-oriented sentence
|
||||
- Each body should explain: what's missing, why it matters for the vision, rough approach
|
||||
- Reference blocking issues by number in depends array
|
||||
|
|
@ -228,6 +209,7 @@ Output ONLY the JSON lines (or NO_GAPS) — no preamble, no markdown fences."
|
|||
|
||||
PHASE2_OUTPUT=$(timeout "$CLAUDE_TIMEOUT" claude -p "$PHASE2_PROMPT" \
|
||||
--model sonnet \
|
||||
--dangerously-skip-permissions \
|
||||
2>/dev/null) || {
|
||||
log "ERROR: claude exited with code $? during phase 2"
|
||||
exit 1
|
||||
|
|
@ -240,21 +222,18 @@ if echo "$PHASE2_OUTPUT" | grep -q "NO_GAPS"; then
|
|||
fi
|
||||
|
||||
# ── Create issues from gap analysis ──────────────────────────────────────
|
||||
# Find backlog label ID
|
||||
BACKLOG_LABEL_ID=$(codeberg_api GET "/labels" 2>/dev/null | \
|
||||
jq -r '.[] | select(.name == "backlog") | .id' 2>/dev/null || true)
|
||||
|
||||
CREATED=0
|
||||
while IFS= read -r line; do
|
||||
[ -z "$line" ] && continue
|
||||
# Skip non-JSON lines
|
||||
echo "$line" | jq -e . >/dev/null 2>&1 || continue
|
||||
|
||||
TITLE=$(echo "$line" | jq -r '.title')
|
||||
BODY=$(echo "$line" | jq -r '.body')
|
||||
DEPS=$(echo "$line" | jq -r '.depends // [] | map("#\(.)") | join(", ")')
|
||||
|
||||
# Add dependency section if present
|
||||
if [ -n "$DEPS" ] && [ "$DEPS" != "" ]; then
|
||||
BODY="${BODY}
|
||||
|
||||
|
|
@ -262,10 +241,7 @@ while IFS= read -r line; do
|
|||
${DEPS}"
|
||||
fi
|
||||
|
||||
# Create issue
|
||||
CREATE_PAYLOAD=$(jq -nc --arg t "$TITLE" --arg b "$BODY" '{title:$t, body:$b}')
|
||||
|
||||
# Add label if we found the backlog label ID
|
||||
if [ -n "$BACKLOG_LABEL_ID" ]; then
|
||||
CREATE_PAYLOAD=$(echo "$CREATE_PAYLOAD" | jq --argjson lid "$BACKLOG_LABEL_ID" '.labels = [$lid]')
|
||||
fi
|
||||
|
|
@ -273,6 +249,7 @@ ${DEPS}"
|
|||
RESULT=$(codeberg_api POST "/issues" -d "$CREATE_PAYLOAD" 2>/dev/null || true)
|
||||
ISSUE_NUM=$(echo "$RESULT" | jq -r '.number // "?"' 2>/dev/null || echo "?")
|
||||
log "Created #${ISSUE_NUM}: ${TITLE}"
|
||||
matrix_send "planner" "📋 Gap issue #${ISSUE_NUM}: ${TITLE}" 2>/dev/null || true
|
||||
CREATED=$((CREATED + 1))
|
||||
|
||||
[ "$CREATED" -ge 5 ] && break
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue