Phase 1: auditor (audit-task.sh + Gitea Actions workflow); runner crash-loop fix documented

2026-05-12 07:02:55 +00:00
parent f3c38f1017
commit a296b87065
2 changed files with 223 additions and 0 deletions
--- a/agents/audit-task.sh
+++ b/agents/audit-task.sh
@@ -0,0 +1,176 @@
+#!/usr/bin/env bash
+# audit-task.sh <owner>/<repo> <pr-number>
+#
+# Reads a Gitea PR, finds the linked issue (via "Resolves #N" in the PR body),
+# asks claude to audit the diff against the issue's done criteria, and posts
+# a structured review comment on the PR.
+#
+# Env knobs:
+#   MODEL          default sonnet  (the auditor's model)
+#   MAX_WALLCLOCK  default 10m
+#   GITEA_URL      default https://gitea.dannyhaslund.dk
+#   GITEA_TOKEN_FILE  default /etc/agent/gitea-token
+
+set -euo pipefail
+
+REPO="${1:-}"
+PR_NUM="${2:-}"
+[[ -z "$REPO" || -z "$PR_NUM" ]] && { echo "usage: $0 <owner>/<repo> <pr-number>" >&2; exit 64; }
+
+MODEL="${MODEL:-sonnet}"
+MAX_WALLCLOCK="${MAX_WALLCLOCK:-10m}"
+GITEA_URL="${GITEA_URL:-https://gitea.dannyhaslund.dk}"
+GITEA_TOKEN_FILE="${GITEA_TOKEN_FILE:-/etc/agent/gitea-token}"
+LOG_ROOT="${LOG_ROOT:-/var/agent/logs}"
+
+[[ -r "$GITEA_TOKEN_FILE" ]] || { echo "missing $GITEA_TOKEN_FILE" >&2; exit 65; }
+GITEA_TOKEN="$(cat "$GITEA_TOKEN_FILE")"
+
+mkdir -p "$LOG_ROOT"
+LOG_FILE="$LOG_ROOT/audit-pr${PR_NUM}-$(date -u +%Y%m%dT%H%M%S).log"
+log() { printf '[%s] %s\n' "$(date -u +%H:%M:%S)" "$*" | tee -a "$LOG_FILE"; }
+
+# ---------- 1. Fetch PR ----------
+log "Fetching PR $REPO#$PR_NUM"
+pr="$(curl -fsS -H "Authorization: token $GITEA_TOKEN" "$GITEA_URL/api/v1/repos/$REPO/pulls/$PR_NUM")"
+pr_title="$(jq -r .title  <<<"$pr")"
+pr_body="$(jq -r .body   <<<"$pr")"
+pr_head="$(jq -r .head.ref <<<"$pr")"
+pr_base="$(jq -r .base.ref <<<"$pr")"
+
+# ---------- 2. Find linked issue ----------
+issue_num="$(grep -oiE '(resolves|closes|fixes)\s+#[0-9]+' <<<"$pr_body" | head -1 | grep -oE '[0-9]+' || true)"
+if [[ -n "$issue_num" ]]; then
+  log "Linked issue: #$issue_num"
+  issue_body="$(curl -fsS -H "Authorization: token $GITEA_TOKEN" \
+    "$GITEA_URL/api/v1/repos/$REPO/issues/$issue_num" | jq -r .body)"
+else
+  log "WARN: no linked issue found in PR body; auditing against PR description only"
+  issue_body="(no linked issue; audit against PR description and general code quality)"
+fi
+
+# ---------- 3. Get diff ----------
+DIFF_FILE="$(mktemp)"
+trap 'rm -f "$DIFF_FILE" "$AUDIT_OUT" 2>/dev/null' EXIT
+
+curl -fsS -H "Authorization: token $GITEA_TOKEN" \
+  "$GITEA_URL/api/v1/repos/$REPO/pulls/$PR_NUM.diff" > "$DIFF_FILE"
+
+diff_size="$(wc -c < "$DIFF_FILE")"
+log "Diff size: $diff_size bytes"
+
+# Truncate to 32 KB if too large
+if [[ $diff_size -gt 32768 ]]; then
+  log "Truncating diff to 32 KB for claude"
+  head -c 32768 "$DIFF_FILE" > "${DIFF_FILE}.trim"
+  echo -e "\n\n[... diff truncated at 32KB ...]" >> "${DIFF_FILE}.trim"
+  mv "${DIFF_FILE}.trim" "$DIFF_FILE"
+fi
+
+# ---------- 4. Audit via claude ----------
+SCHEMA='{
+  "type": "object",
+  "required": ["verdict", "summary", "criteria"],
+  "properties": {
+    "verdict": { "type": "string", "enum": ["approve", "request_changes", "comment"] },
+    "summary": { "type": "string", "minLength": 10 },
+    "criteria": {
+      "type": "array",
+      "items": {
+        "type": "object",
+        "required": ["criterion", "status"],
+        "properties": {
+          "criterion": { "type": "string" },
+          "status":    { "type": "string", "enum": ["pass", "fail", "unclear"] },
+          "note":      { "type": "string" }
+        }
+      }
+    },
+    "issues_found": { "type": "array", "items": { "type": "string" } }
+  }
+}'
+
+PROMPT="You are the auditor agent in an autonomous coding pipeline. Review the pull request against the linked issue's Done criteria.
+
+Be strict but fair:
+  - pass = the diff clearly satisfies the criterion
+  - fail = the diff clearly does not, or contradicts it
+  - unclear = cannot determine from the diff alone (e.g. requires running tests)
+
+Set verdict:
+  - approve         = all criteria pass, no significant issues
+  - comment         = mostly fine but some criteria are unclear or minor issues
+  - request_changes = at least one criterion fails, or critical issues
+
+issues_found is for code-quality concerns the issue did NOT specify but that
+matter for merge: security holes, broken syntax, obvious bugs, dependency
+problems. Do NOT bikeshed style.
+
+Do not call any tools. Produce the JSON from the prompt text alone.
+
+# Linked issue body
+
+$issue_body
+
+# PR title
+
+$pr_title
+
+# PR body
+
+$pr_body
+
+# Diff ($pr_head into $pr_base)
+
+$(cat "$DIFF_FILE")
+
+Return only the JSON matching the schema."
+
+AUDIT_OUT="$(mktemp)"
+log "Invoking claude (model=$MODEL, timeout=$MAX_WALLCLOCK)"
+set +e
+timeout --signal=INT --kill-after=30s "$MAX_WALLCLOCK" \
+  claude -p "$PROMPT" \
+    --model "$MODEL" \
+    --output-format json \
+    --json-schema "$SCHEMA" \
+    --allowedTools "" \
+    < /dev/null > "$AUDIT_OUT" 2>>"$LOG_FILE"
+rc=$?
+set -e
+log "claude exited rc=$rc"
+
+if [[ $rc -ne 0 ]]; then
+  log "ERROR — auditor failed; posting fallback comment"
+  curl -fsS -X POST -H "Authorization: token $GITEA_TOKEN" -H "Content-Type: application/json" \
+    -d "$(jq -nc --arg b "agent auditor: failed to produce an audit (claude rc=$rc). Log: \`$LOG_FILE\`" '{body:$b}')" \
+    "$GITEA_URL/api/v1/repos/$REPO/issues/$PR_NUM/comments" > /dev/null
+  exit 1
+fi
+
+# ---------- 5. Render review comment ----------
+audit="$(jq -c '.structured_output' "$AUDIT_OUT")"
+verdict="$(jq -r .verdict <<<"$audit")"
+summary="$(jq -r .summary <<<"$audit")"
+criteria_md="$(jq -r '.criteria // [] | map("- **" + (.status|ascii_upcase) + "** — " + .criterion + (if .note then "  _" + .note + "_" else "" end)) | join("\n")' <<<"$audit")"
+issues_md="$(jq -r '.issues_found // [] | if length == 0 then "_none_" else map("- " + .) | join("\n") end' <<<"$audit")"
+
+# Verdict badge
+case "$verdict" in
+  approve)         badge=":white_check_mark: APPROVE" ;;
+  comment)         badge=":speech_balloon: COMMENT" ;;
+  request_changes) badge=":no_entry: REQUEST_CHANGES" ;;
+  *)               badge=":grey_question: $verdict" ;;
+esac
+
+review_body="$(printf '## Auditor review — %s\n\n%s\n\n### Criteria\n\n%s\n\n### Other issues found\n\n%s\n\n---\n_model: %s · log: `%s`_\n' \
+  "$badge" "$summary" "$criteria_md" "$issues_md" "$MODEL" "$LOG_FILE")"
+
+# ---------- 6. Post comment ----------
+log "Posting review (verdict=$verdict)"
+curl -fsS -X POST -H "Authorization: token $GITEA_TOKEN" -H "Content-Type: application/json" \
+  -d "$(jq -nc --arg b "$review_body" '{body:$b}')" \
+  "$GITEA_URL/api/v1/repos/$REPO/issues/$PR_NUM/comments" > /dev/null
+
+log "Done. verdict=$verdict"
+echo "$verdict"
--- a/auditor/workflow-template.yml
+++ b/auditor/workflow-template.yml
@@ -0,0 +1,47 @@
+# Drop into each agent-managed project repo as .gitea/workflows/auditor.yml.
+# Requires the project to have these Gitea Actions secrets configured:
+#   AUDITOR_SSH_KEY  — private ed25519 key whose public counterpart is in
+#                      agent@dev-01:~/.ssh/authorized_keys
+#
+# The workflow SSH's into dev-01 (192.168.1.29) and runs audit-task.sh, which
+# uses claude headless to review the PR against its linked issue's Done
+# criteria, then posts the audit as a PR comment.
+
+name: Auditor
+
+on:
+  pull_request:
+    types: [opened, synchronize, reopened]
+
+jobs:
+  audit:
+    runs-on: ubuntu-latest
+    container:
+      image: debian:bookworm-slim
+    steps:
+      - name: Install ssh + curl
+        run: |
+          apt-get update -qq
+          apt-get install -y -qq openssh-client curl jq ca-certificates
+
+      - name: Audit PR via dev-01
+        env:
+          AUDITOR_KEY: ${{ secrets.AUDITOR_SSH_KEY }}
+          REPO: ${{ github.repository }}
+          PR_NUM: ${{ github.event.pull_request.number }}
+        run: |
+          set -e
+          [ -n "$AUDITOR_KEY" ] || { echo "ERROR: AUDITOR_SSH_KEY secret not set"; exit 1; }
+
+          mkdir -p ~/.ssh
+          printf '%s\n' "$AUDITOR_KEY" > ~/.ssh/id_ed25519
+          chmod 600 ~/.ssh/id_ed25519
+
+          # Trust dev-01's host key — collected at runtime; LAN-only path
+          ssh-keyscan -H 192.168.1.29 >> ~/.ssh/known_hosts 2>/dev/null
+
+          ssh -i ~/.ssh/id_ed25519 \
+              -o BatchMode=yes \
+              -o StrictHostKeyChecking=yes \
+              agent@192.168.1.29 \
+              "PATH=\$HOME/.local/bin:/usr/local/bin:\$PATH MAX_WALLCLOCK=10m /usr/local/bin/audit-task.sh '$REPO' '$PR_NUM'"