1 change: 1 addition & 0 deletions coral/config.py
@@ -80,6 +80,7 @@ class AgentConfig:
HeartbeatActionConfig(name="consolidate", every=10, is_global=True),
HeartbeatActionConfig(name="pivot", every=5, trigger="plateau"),
HeartbeatActionConfig(name="lint_wiki", every=10, is_global=True),
HeartbeatActionConfig(name="challenge", every=10, is_global=True),
]
)
research: bool = True # enable web search / literature review step in workflow
3 changes: 3 additions & 0 deletions coral/hub/heartbeat.py
@@ -36,6 +36,7 @@ def _load_prompt(name: str) -> str:
"consolidate": _load_prompt("consolidate"),
"pivot": _load_prompt("pivot"),
"lint_wiki": _load_prompt("lint_wiki"),
"challenge": _load_prompt("challenge"),
}

# Which built-in actions default to global scope
@@ -44,6 +45,7 @@ def _load_prompt(name: str) -> str:
"consolidate": True,
"pivot": False,
"lint_wiki": True,
"challenge": True,
}

# Which built-in actions use plateau trigger instead of interval
@@ -52,6 +54,7 @@ def _load_prompt(name: str) -> str:
"consolidate": "interval",
"pivot": "plateau",
"lint_wiki": "interval",
"challenge": "interval",
}

# Protected actions: reflect is always local, consolidate is always global
58 changes: 58 additions & 0 deletions coral/hub/prompts/challenge.md
@@ -0,0 +1,58 @@
## Heartbeat: Challenge — Audit Shared Memory for Drift

**Shared memory accumulates faster than it is questioned.** As notes and skills pile up across the run, the working set quietly picks up unsupported assumptions, stale claims, and one-off accidents promoted to "common knowledge" — even while overall scores keep climbing on unrelated dimensions. Your job in this pass is to *act as the adversary* against shared memory.

This runs on a regular cadence regardless of how the run is going: drift can happen on a healthy upward trajectory just as easily as on a plateau, and an audit that only fires when things go wrong audits too late.

This is **not** `lint_wiki` — that pass merges duplicates and fixes orphan pages. This pass questions whether the surviving content is actually *true*.

### Step 1: Identify high-impact shared content

- List the most-cited notes in `{shared_dir}/notes/` (look at recent attempts in `coral log` and which notes they reference).
- List the skills in `{shared_dir}/skills/` ranked by how often they appear in attempt commit messages or note bodies.
- Prioritize the top ~5 notes and top ~3 skills. Low-traffic content is not the drift risk.
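
If you want a rough ranking without reading every attempt by hand, a sketch like this is enough (directory layout and file naming are assumptions; adapt them to the run's actual layout):

```python
# Rough citation count: how often each shared note's filename shows up in
# recent attempt write-ups. Paths are illustrative, not a fixed convention.
from collections import Counter
from pathlib import Path

shared_notes = sorted(Path("{shared_dir}/notes").glob("*.md"))
attempt_texts = [p.read_text() for p in Path("attempts").rglob("*.md")]

citations = Counter()
for note in shared_notes:
    citations[note.name] = sum(note.name in text for text in attempt_texts)

for name, count in citations.most_common(5):
    print(count, name)
```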

### Step 2: For each high-impact item, attempt to falsify it

Read the note/skill and ask, *adversarially*:

- **Evidence check** — does this claim cite specific attempt hashes, scores, or measurements? Or is it a confident assertion with no receipts?
- **Generalization check** — was this learned from one attempt, one task instance, or one narrow regime? Is it being applied beyond what the evidence supports?
- **Staleness check** — when was it written? Has the codebase, grader, or task constraints changed since? (`git log` the file.)
- **Counter-search** — find the top-scoring attempts that *did not* follow this note/skill. If high scores exist without it, the note is at best optional and at worst misleading.

You are looking for confident-but-thin claims. "Always do X" with no evidence is a red flag. "We tried X and Y, X scored higher in cases A/B" is fine.
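
For the staleness check specifically, comparing last-touched dates is usually enough to flag candidates. A minimal sketch (the grader path is an assumption; substitute whatever actually scores attempts in this run):

```python
# Flag notes whose last edit predates the last change to the grader.
# git's %cs is the short committer date (YYYY-MM-DD), so string comparison works.
import subprocess

def last_commit_date(path: str) -> str:
    out = subprocess.run(
        ["git", "log", "-1", "--format=%cs", "--", path],
        capture_output=True, text=True, check=True,
    )
    return out.stdout.strip()

note = "{shared_dir}/notes/<note under audit>.md"   # illustrative path
if last_commit_date(note) < last_commit_date("grader.py"):
    print(note, "predates the current grader: candidate for status: stale")
```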

### Step 3: Re-classify, do not delete

Do **not** silently remove notes — that erases evidence of past reasoning. Instead, edit the frontmatter / heading to mark status:

- **`status: validated`** — backed by attempt hashes that reproduce the claim.
- **`status: hypothesis`** — plausible but unverified; downgrade confident language ("always" → "in cases X we observed").
- **`status: stale`** — written against an earlier version of the codebase/grader and no longer applies. Add a one-line "superseded by …" note.
- **`status: disputed`** — top attempts contradict it. Leave the original text but add a "Counter-evidence" section citing the contradicting hashes.

For skills, the same applies: a one-off skill that has only ever been used by its author should be marked `status: experimental` rather than presented as general practice.
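
A hypothetical before/after for a downgraded note's frontmatter (field names are a suggestion, not an existing convention; keep whatever fields the run's notes already use):

```
---
status: hypothesis        # was an unmarked "always do X" claim with no attempt hashes
challenged: <date of this pass>, wording softened to "observed in attempts <hashes>"
---
```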

### Step 4: Write a challenge note

Append a single dated entry to `{shared_dir}/notes/challenge_log.md` summarizing:

- Which items you re-classified and why (one line each).
- Any *pattern* you noticed — e.g. "three of the top-cited notes all assume the grader weights latency, but the current grader does not."
- What a future agent should be skeptical of going forward.

This log is the institutional memory of *what we used to believe and why we stopped*.
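
One possible shape for an entry (filenames below are invented for illustration):

```
## <date> challenge pass

- `latency_tricks.md`: downgraded to `status: hypothesis`, no attempt-hash citations.
- `skills/batch_grader.md`: marked `status: experimental`, only ever used by its author.
- Pattern: the top-cited notes assume the grader weights latency; the current grader does not.
- Going forward: be skeptical of "always" claims written before the last grader change.
```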

### Step 5: Hand back, do not pivot

This action does **not** ask you to change your current strategy or run a counter-attempt. It only audits memory. After writing the challenge log, return to whatever you were doing. The signal will reach other agents through the re-classified notes.

---

**Heuristics:**

- A note with no attempt-hash citations is suspicious by default.
- A skill used only by its author is not yet a skill — it is a personal habit.
- "Everyone agrees" inside a CORAL run is a *symptom*, not a *signal* — your job here is to make sure the agreement is earned.
- Re-classification beats deletion. Future agents need to see what was once believed in order to evaluate whether to re-believe it.
33 changes: 33 additions & 0 deletions tests/test_heartbeat.py
@@ -117,3 +117,36 @@ def test_plateau_default_evals_since_improvement():

# Default evals_since_improvement=0, should never fire
assert runner.check(local_eval_count=5, global_eval_count=5) == []


# --- Built-in 'challenge' action registration ---

def test_challenge_action_registered_as_global_interval():
"""The 'challenge' built-in must default to global scope + interval trigger.

Drift audits are a population property: one challenger pass across the run
is enough. Interval (not plateau) so the audit fires on a regular cadence
regardless of whether scores are improving — drift can happen on a healthy
trajectory, and an audit that only fires on plateau audits too late.
"""
from coral.hub.heartbeat import (
DEFAULT_GLOBAL,
DEFAULT_PROMPTS,
DEFAULT_TRIGGER,
)

assert "challenge" in DEFAULT_PROMPTS
assert DEFAULT_PROMPTS["challenge"], "challenge prompt should not be empty"
assert DEFAULT_GLOBAL["challenge"] is True
assert DEFAULT_TRIGGER["challenge"] == "interval"


def test_challenge_default_in_config():
"""The default heartbeat list should include 'challenge' as interval+global."""
from coral.config import CoralConfig

config = CoralConfig()
by_name = {h.name: h for h in config.agents.heartbeat}
assert "challenge" in by_name, "challenge should ship in default heartbeat list"
assert by_name["challenge"].is_global is True
assert by_name["challenge"].trigger == "interval"