Files
agency-agents/scripts/check-divisions.sh
Michael Sitarzewski 04e95b875f Exclude integrations/ from the source-agent scan (it's convert.sh output)
#592 added `integrations` to AGENT_DIRS in convert.sh and lint-agents.sh and to
the lint workflow paths, to make those lists match divisions.json. That was
wrong: integrations/ is not a source-agent category — it's where convert.sh
WRITES per-tool conversions (e.g. openclaw output → integrations/openclaw/<agent>/SOUL.md).
It holds 957 conversion outputs across openclaw/opencode/qwen/antigravity, vs
248 real source agents in the 17 genuine categories.

Scanning integrations/ as source made the toolchain re-convert its own outputs:
the same agent appears under every tool (brand-guardian ×5), output slugs
collide, and convert.sh's last-writer-wins corrupts the catalog — which broke
downstream parity checks. convert.sh originally omitted integrations on purpose;
#592 misread that deliberate exclusion as drift.

Fix: drop integrations from convert.sh / lint-agents.sh AGENT_DIRS and the lint
workflow, remove it from divisions.json (it's not a division), and add it to
NON_DIVISION_DIRS in check-divisions.sh so the guard's canonical set is the real
17 source categories. The `strategy` additions from #592 were correct and stay.

check-divisions.sh now PASSES at 17 divisions consistent across divisions.json,
directories, scripts, and CI.

Note: integrations/mcp-memory holds 2 real source agents stranded in the output
tree; relocating them to a real category is left as separate follow-up.

Co-Authored-By: Claude Opus 4.8 (1M context) <noreply@anthropic.com>
2026-06-15 19:29:02 -05:00

116 lines
4.2 KiB
Bash
Executable File

#!/usr/bin/env bash
#
# check-divisions.sh — enforce a single source of truth for the division set.
#
# divisions.json (repo root) is canonical. This script fails if any of the
# following disagree with it:
# 1. The actual top-level agent directories on disk
# 2. AGENT_DIRS in scripts/convert.sh
# 3. AGENT_DIRS in scripts/lint-agents.sh
# 4. The path filters in .github/workflows/lint-agents.yml
# 5. Every divisions.json entry has label, icon, and color
#
# Add a division: create its directory, add an entry to divisions.json, then
# this script tells you every other place that must be updated. No deps beyond
# bash 3.2 + coreutils (no jq) so it runs the same on macOS and CI.
#
# Usage: ./scripts/check-divisions.sh
set -euo pipefail
cd "$(dirname "$0")/.."
JSON="divisions.json"
# Top-level directories that are NOT divisions. Everything else at the repo
# root that is a directory is treated as a division (so a new division dir is
# caught even if nobody remembered to register it).
# integrations/ is convert.sh's OUTPUT tree (per-tool conversions written back
# into the repo), not a source-agent category — it must never be scanned as one.
NON_DIVISION_DIRS=(examples scripts integrations)
errors=0
fail() { echo "ERROR $*"; errors=$((errors + 1)); }
# --- sorted, newline-delimited helpers -------------------------------------
# Canonical set: object-valued keys inside the "divisions" object. Scoping to
# lines after the `"divisions": {` opener excludes both the wrapper key itself
# and the string-valued "_note" key.
canonical() {
awk '/"divisions"[[:space:]]*:[[:space:]]*\{/{f=1; next} f' "$JSON" \
| grep -oE '"[a-z0-9-]+"[[:space:]]*:[[:space:]]*\{' \
| sed -E 's/"([a-z0-9-]+)".*/\1/' | sort -u
}
# Actual division directories on disk (top-level dirs minus the excludes and
# anything dot-prefixed).
actual_dirs() {
local d base
for d in */; do
base="${d%/}"
[[ "$base" == .* ]] && continue
case " ${NON_DIVISION_DIRS[*]} " in *" $base "*) continue ;; esac
echo "$base"
done | sort -u
}
# Contents of a bash AGENT_DIRS=( ... ) array in the given file, one per line.
agent_dirs_array() {
awk '/AGENT_DIRS=\(/{f=1; next} f && /^\)/{exit} f{print}' "$1" \
| tr ' \t' '\n\n' | grep -E '^[a-z0-9-]+$' | sort -u
}
# Compare canonical vs a candidate set; report both directions.
compare() {
local label="$1" candidate="$2" canon
canon="$(canonical)"
local missing extra
missing="$(comm -23 <(echo "$canon") <(echo "$candidate"))"
extra="$(comm -13 <(echo "$canon") <(echo "$candidate"))"
if [[ -n "$missing" ]]; then
fail "$label is missing division(s) present in $JSON: $(echo "$missing" | tr '\n' ' ')"
fi
if [[ -n "$extra" ]]; then
fail "$label has division(s) not in $JSON: $(echo "$extra" | tr '\n' ' ')"
fi
}
# --- checks ----------------------------------------------------------------
[[ -f "$JSON" ]] || { echo "ERROR $JSON not found at repo root"; exit 1; }
compare "the agent directories on disk" "$(actual_dirs)"
compare "scripts/convert.sh AGENT_DIRS" "$(agent_dirs_array scripts/convert.sh)"
compare "scripts/lint-agents.sh AGENT_DIRS" "$(agent_dirs_array scripts/lint-agents.sh)"
# Workflow path filters: every canonical division must appear as `<div>/` in
# the lint workflow, or new divisions silently skip CI.
WF=".github/workflows/lint-agents.yml"
if [[ -f "$WF" ]]; then
while IFS= read -r div; do
grep -qE "\b${div}/" "$WF" || fail "$WF has no path filter for division '$div'"
done < <(canonical)
else
fail "$WF not found"
fi
# Every entry must have label, icon, and color.
while IFS= read -r div; do
block="$(awk -v d="\"$div\"" '$0 ~ d"[[:space:]]*:[[:space:]]*\\{" {print; found=1; next} found && /\}/ {print; exit} found {print}' "$JSON")"
for field in label icon color; do
echo "$block" | grep -qE "\"$field\"[[:space:]]*:" \
|| fail "division '$div' in $JSON is missing \"$field\""
done
done < <(canonical)
# --- result ----------------------------------------------------------------
count="$(canonical | wc -l | tr -d ' ')"
if [[ $errors -gt 0 ]]; then
echo ""
echo "FAILED: $errors divisions consistency error(s). $JSON is the source of truth."
exit 1
fi
echo "PASSED: $count divisions consistent across $JSON, directories, scripts, and CI."