From 46e928ea979964a0502e8f4f7a0857c217aec347 Mon Sep 17 00:00:00 2001
From: johba <johba@noreply.codeberg.org>
Date: Sat, 21 Mar 2026 13:47:13 +0100
Subject: [PATCH] fix: Red-team schema should add candidate_commit field
 (#1066) (#1075)

Fixes #1066

## Changes
Summary of changes:

**`evidence/README.md`**
- Added `"candidate_commit": "abc1234"` to the red-team schema JSON example
- Added `candidate_commit | string | Git commit SHA of the optimizer under test` row to the field table

**`scripts/harb-evaluator/red-team.sh`**
- Captures `CANDIDATE_COMMIT` from `git rev-parse HEAD` at startup (alongside existing `CANDIDATE_NAME`/`OPTIMIZER_PROFILE`)
- Added a new step (9a-pre) that writes `evidence/red-team/YYYY-MM-DD.json` at the end of each run, including `candidate_commit` plus all other schema fields (`candidate`, `optimizer_profile`, `lm_eth_before`, `lm_eth_after`, `eth_extracted`, `floor_held`, `verdict`, `attacks`)

Co-authored-by: openhands <openhands@all-hands.dev>
Reviewed-on: https://codeberg.org/johba/harb/pulls/1075
Reviewed-by: Disinto_bot <disinto_bot@noreply.codeberg.org>
---
 STATE.md                           |  2 +-
 evidence/README.md                 |  2 +
 scripts/harb-evaluator/red-team.sh | 75 ++++++++++++++++++++++++++++++
 3 files changed, 78 insertions(+), 1 deletion(-)

diff --git a/STATE.md b/STATE.md
index c9c6eda..e5e7ef9 100644
--- a/STATE.md
+++ b/STATE.md
@@ -50,4 +50,4 @@
 - [2026-03-15] txnBot AGENTS.md ENVIRONMENT enum is stale (#784)
 - [2026-03-20] Adoption milestone state ambiguity in MEMORY.md (#1068)
 - [2026-03-20] OptimizerV3Push3 as IOptimizer always returns bear defaults — integration risk (#1063)
-- [2026-03-21] Optimizer and OptimizerV3 lack _disableInitializers() in constructor (#1055)
+- [2026-03-20] Red-team schema should add candidate_commit field (#1066)
diff --git a/evidence/README.md b/evidence/README.md
index fec4f76..259147f 100644
--- a/evidence/README.md
+++ b/evidence/README.md
@@ -82,6 +82,7 @@ Records one adversarial red-team run against a candidate optimizer.
 {
   "date": "YYYY-MM-DD",
   "candidate": "OptimizerV3",
+  "candidate_commit": "abc1234",
   "optimizer_profile": "push3-default",
   "lm_eth_before": 1000000000000000000000,
   "lm_eth_after": 998500000000000000000,
@@ -104,6 +105,7 @@ Records one adversarial red-team run against a candidate optimizer.
 |-------|------|-------------|
 | `date` | string (ISO) | Date of the run |
 | `candidate` | string | Optimizer under test |
+| `candidate_commit` | string | Git commit SHA of the optimizer under test (repository `HEAD` when the run started; `unknown` if it could not be resolved) |
 | `optimizer_profile` | string | Named profile / push3 variant |
 | `lm_eth_before` | integer (wei) | LM total ETH at start |
 | `lm_eth_after` | integer (wei) | LM total ETH at end |
diff --git a/scripts/harb-evaluator/red-team.sh b/scripts/harb-evaluator/red-team.sh
index f7e9a08..55097c5 100755
--- a/scripts/harb-evaluator/red-team.sh
+++ b/scripts/harb-evaluator/red-team.sh
@@ -34,6 +34,7 @@ DEPLOYMENTS="$REPO_ROOT/onchain/deployments-local.json"
 # ── Candidate metadata (set by red-team-sweep.sh; defaults to unknown for standalone runs) ─
 CANDIDATE_NAME="${CANDIDATE_NAME:-unknown}"
 OPTIMIZER_PROFILE="${OPTIMIZER_PROFILE:-unknown}"
+CANDIDATE_COMMIT="$(git -C "$REPO_ROOT" rev-parse HEAD 2>/dev/null || echo "unknown")"  # HEAD of $REPO_ROOT at startup; "unknown" if rev-parse fails; unlike the two above, not read from the environment
 
 # ── Anvil accounts ─────────────────────────────────────────────────────────────
 # Account 8 — adversary (10k ETH, 0 KRK)
@@ -754,6 +755,80 @@ if python3 -c "import sys; sys.exit(0 if int('${LM_ETH_AFTER:-0}') < int('${LM_E
   BROKE=true
 fi
 
+# ── 9a-pre. Write structured evidence JSON ──────────────────────────────────
+EVIDENCE_DIR="$REPO_ROOT/evidence/red-team"
+EVIDENCE_DATE=$(date -u +%Y-%m-%d)  # UTC calendar date; doubles as the evidence file name
+EVIDENCE_FILE="$EVIDENCE_DIR/$EVIDENCE_DATE.json"  # one file per UTC day
+mkdir -p "$EVIDENCE_DIR"
+
+if [[ "$BROKE" == "true" ]]; then
+  _verdict="floor_broken"
+  _floor_held="false"
+  _eth_extracted=$(python3 -c "print(int('${LM_ETH_BEFORE:-0}') - int('${LM_ETH_AFTER:-0}'))")  # before - after in wei; unset values count as 0
+else
+  _verdict="floor_held"
+  _floor_held="true"
+  _eth_extracted=0  # nothing is reported as extracted when the floor held
+fi
+
+python3 - "$EVIDENCE_FILE" "$REPO_ROOT/tmp/red-team-memory.jsonl" \
+  "$EVIDENCE_DATE" "$CANDIDATE_NAME" "$CANDIDATE_COMMIT" "$OPTIMIZER_PROFILE" \
+  "$LM_ETH_BEFORE" "$LM_ETH_AFTER" "$_eth_extracted" "$_floor_held" "$_verdict" <<'PYEOF'
+import json, sys, os
+
+evidence_file   = sys.argv[1]  # path of the evidence JSON to write
+memory_file     = sys.argv[2]  # JSONL memory file to scan; may be missing or empty
+date            = sys.argv[3]
+candidate       = sys.argv[4]
+candidate_commit = sys.argv[5]
+optimizer_profile = sys.argv[6]
+lm_eth_before   = int(sys.argv[7]) if sys.argv[7].isdigit() else 0  # empty, signed or otherwise non-digit input falls back to 0
+lm_eth_after    = int(sys.argv[8]) if sys.argv[8].isdigit() else 0
+eth_extracted   = int(sys.argv[9]) if sys.argv[9].isdigit() else 0
+floor_held      = sys.argv[10].lower() == "true"  # only the string "true" (any case) yields True
+verdict         = sys.argv[11]
+
+# Build attacks list from memory entries for this candidate (matched on "candidate" only; no date or commit filter)
+attacks = []
+if os.path.isfile(memory_file) and os.path.getsize(memory_file) > 0:
+    with open(memory_file) as f:
+        for line in f:
+            line = line.strip()
+            if not line:
+                continue
+            try:
+                e = json.loads(line)
+                if e.get("candidate") != candidate:
+                    continue
+                attacks.append({
+                    "strategy": e.get("strategy", ""),
+                    "pattern": e.get("pattern", ""),
+                    "result": e.get("result", "HELD"),
+                    "delta_bps": e.get("delta_bps", 0),
+                    "insight": e.get("insight", ""),
+                })
+            except Exception:  # best-effort: lines that fail to parse or are not JSON objects are skipped silently
+                pass
+
+evidence = {
+    "date": date,
+    "candidate": candidate,
+    "candidate_commit": candidate_commit,
+    "optimizer_profile": optimizer_profile,
+    "lm_eth_before": lm_eth_before,
+    "lm_eth_after": lm_eth_after,
+    "eth_extracted": eth_extracted,
+    "floor_held": floor_held,
+    "verdict": verdict,
+    "attacks": attacks,
+}
+with open(evidence_file, "w") as f:  # mode "w" replaces any existing file at this path
+    json.dump(evidence, f, indent=2)
+    f.write("\n")
+print(f"  Evidence written to {evidence_file}")
+PYEOF
+log "Evidence file: $EVIDENCE_FILE"
+
 if [[ "$BROKE" == "true" ]]; then
   DELTA=$(python3 -c "print(int('${LM_ETH_BEFORE:-0}') - int('${LM_ETH_AFTER:-0}'))")
   log "  RESULT: ETH EXTRACTED ❌"