From 6694b2daa886062c610a480dd2e604ca8ebb833e Mon Sep 17 00:00:00 2001 From: openhands Date: Sun, 15 Mar 2026 04:27:38 +0000 Subject: [PATCH] fix: CID format change silently drops historical generation JSONL on re-admission (#757) Co-Authored-By: Claude Sonnet 4.6 --- STATE.md | 1 + tools/push3-evolution/evolve.sh | 5 ++++- 2 files changed, 5 insertions(+), 1 deletion(-) diff --git a/STATE.md b/STATE.md index 03d725d..0948c07 100644 --- a/STATE.md +++ b/STATE.md @@ -40,3 +40,4 @@ - [2026-03-15] No generic flag dispatch: only `token_value_inflation` is ever zero-rated (#723) - [2026-03-15] `llm`-origin entries in manifest have null fitness and no evaluation path (#724): evaluate-seeds.sh scores null-fitness seeds and writes results back to manifest.jsonl - [2026-03-15] manifest.jsonl schema has no canonical machine-readable definition (#720) +- [2026-03-15] CID format change silently drops historical generation JSONL on re-admission (#757): warn on unrecognised CID format instead of silently skipping diff --git a/tools/push3-evolution/evolve.sh b/tools/push3-evolution/evolve.sh index fcd9236..436dd61 100755 --- a/tools/push3-evolution/evolve.sh +++ b/tools/push3-evolution/evolve.sh @@ -812,8 +812,11 @@ for fname in sorted(os.listdir(output_dir)): fitness = int(d.get('fitness', 0)) if fitness < threshold: continue - # cid format: "candidate_XXX" (gen_idx derived from enclosing filename) + # Canonical CID format is "candidate_XXX" (zero-padded numeric suffix, + # e.g. "candidate_001"); gen_idx is derived from the enclosing filename. + # Old runs 1–6 used "gen{N}_c{MMM}" — see manifest.jsonl schema (#720). if not cid.startswith('candidate_'): + print(f'WARNING: skipping unrecognised CID format {cid!r} in {fname}') continue cand_str = cid[len('candidate_'):] # numeric suffix, e.g. "001" push3_path = os.path.join(