Shared memory and context tools for agentic work.
Code Rooms
{"command": null, "event_source": "harness", "event_type": "lane_assigned", "exit_code": null, "files": ["lane-prompts/judge-1.md", "lane-results/judge-1.json"], "lane_id": "judge-1", "m1nd_tool": null, "notes": "Agents should append JSONL events with event_source=agent.", "proof_ref": null, "repo_id": null, "round_id": "real-world-v2-20260513T231822Z", "schema": "m1nd-real-world-agent-event-v0", "summary": "Lane prompt, result template, and event stream were created.", "task_id": null, "timestamp": "2026-05-13T23:18:27.913328+00:00"}
{"command": "python3 /Users/kle1nz/.codex/skills/m1nd-operator/scripts/probe_m1nd.py ...", "event_source": "agent", "event_type": "m1nd_call", "exit_code": null, "files": ["scripts/benchmark/real_world_agent_round.py"], "lane_id": "judge-1", "m1nd_tool": "trust_selftest/search/view", "notes": "Used probe_m1nd.py tools/trust/search/view; final truth still came from answer-key and file evidence.", "proof_ref": null, "repo_id": null, "round_id": "real-world-v2-20260513T231822Z", "schema": "m1nd-real-world-agent-event-v0", "summary": "Confirmed the live m1nd probe surface and harness event vocabulary before adjudication.", "task_id": null, "timestamp": "2026-05-13T23:43:31.400717+00:00"}
{"command": null, "event_source": "agent", "event_type": "file_read", "exit_code": null, "files": ["/Users/kle1nz/m1nd/docs/benchmarks/real-world-rounds/real-world-v2-20260513T231822Z/operator-only/judge-input.json", "/Users/kle1nz/m1nd/docs/benchmarks/real-world-rounds/real-world-v2-20260513T231822Z/operator-only/answer-key.json", "/Users/kle1nz/m1nd/docs/benchmarks/real-world-rounds/real-world-v2-20260513T231822Z/report-prejudge.json"], "lane_id": "judge-1", "m1nd_tool": null, "notes": "Primary result count was 6 lanes x 10 tasks; answer-key task count was 10.", "proof_ref": null, "repo_id": null, "round_id": "real-world-v2-20260513T231822Z", "schema": "m1nd-real-world-agent-event-v0", "summary": "Read judge inputs, answer key, prejudge report, all primary lane results, and all primary event streams.", "task_id": null, "timestamp": "2026-05-13T23:43:31.400722+00:00"}
{"command": null, "event_source": "agent", "event_type": "shell_command", "exit_code": null, "files": [".m1nd-benchmark-fixtures/real-world-lanes"], "lane_id": "judge-1", "m1nd_tool": null, "notes": "All patch lanes kept code changes scoped to src/click/types.py or src/metadata.rs.", "proof_ref": null, "repo_id": null, "round_id": "real-world-v2-20260513T231822Z", "schema": "m1nd-real-world-agent-event-v0", "summary": "Verified primary patch-task fixture diffs for Click and human-panic across all six primary lanes.", "task_id": null, "timestamp": "2026-05-13T23:43:31.400725+00:00"}
{"command": null, "event_source": "agent", "event_type": "finding", "exit_code": null, "files": ["/Users/kle1nz/m1nd/docs/benchmarks/real-world-rounds/real-world-v2-20260513T231822Z/lane-results/judge-1.json"], "lane_id": "judge-1", "m1nd_tool": null, "notes": "m1nd_available had one adjudicated partial for missing parser coverage in m1nd-2 architecture audit; no_m1nd had all tasks adjudicated success.", "proof_ref": null, "repo_id": null, "round_id": "real-world-v2-20260513T231822Z", "schema": "m1nd-real-world-agent-event-v0", "summary": "Adjudicated 60 primary lane/task entries with all entries comparable and no exclusions.", "task_id": null, "timestamp": "2026-05-13T23:43:31.400726+00:00"}
{"command": null, "event_source": "agent", "event_type": "finding", "exit_code": null, "files": ["/Users/kle1nz/m1nd/docs/benchmarks/real-world-rounds/real-world-v2-20260513T231822Z/event-streams"], "lane_id": "judge-1", "m1nd_tool": null, "notes": "The judge event stream itself uses only harness-valid event types.", "proof_ref": null, "repo_id": null, "round_id": "real-world-v2-20260513T231822Z", "schema": "m1nd-real-world-agent-event-v0", "summary": "Recorded event-stream provenance risk from invalid primary event types.", "task_id": null, "timestamp": "2026-05-13T23:43:31.400735+00:00"}
{"command": null, "event_source": "agent", "event_type": "handoff", "exit_code": null, "files": ["/Users/kle1nz/m1nd/docs/benchmarks/real-world-rounds/real-world-v2-20260513T231822Z/lane-results/judge-1.json", "/Users/kle1nz/m1nd/docs/benchmarks/real-world-rounds/real-world-v2-20260513T231822Z/event-streams/judge-1.jsonl"], "lane_id": "judge-1", "m1nd_tool": null, "notes": "Te was not externally measured for this judge pass.", "proof_ref": null, "repo_id": null, "round_id": "real-world-v2-20260513T231822Z", "schema": "m1nd-real-world-agent-event-v0", "summary": "Wrote Judge-1 result JSON and finalized the Judge-1 event stream.", "task_id": null, "timestamp": "2026-05-13T23:43:31.400737+00:00"}
{"command": "python3 correction rewrite for judge-1 lane-result schema", "event_source": "agent", "event_type": "handoff", "exit_code": 0, "files": ["/Users/kle1nz/m1nd/docs/benchmarks/real-world-rounds/real-world-v2-20260513T231822Z/lane-results/judge-1.json", "/Users/kle1nz/m1nd/docs/benchmarks/real-world-rounds/real-world-v2-20260513T231822Z/event-streams/judge-1.jsonl"], "lane_id": "judge-1", "m1nd_tool": null, "notes": "Preserved 60 adjudications, mapped judge_score_detail into harness adjudicated_scores, and kept task_results empty.", "proof_ref": null, "repo_id": null, "round_id": "real-world-v2-20260513T231822Z", "schema": "m1nd-real-world-agent-event-v0", "summary": "Corrected judge-1.json to the harness lane-result schema so the scorer includes adjudications.", "task_id": null, "timestamp": "2026-05-13T23:46:07.291422+00:00"}