---
# Submission metadata for one benchmark run.
# NOTE(review): the nesting under `harness`, `model` and `intervention` was
# reconstructed; the flattened form had duplicate `name`/`notes` keys, which
# cannot coexist in a single mapping. Confirm against the consumer's schema.

submission_id: 2026-04-29__001_synthetic_mine_throughput__claude-code__claude-opus-4-7__plan-mode
# Plain ISO date: YAML 1.1 loaders resolve this to a date/timestamp value,
# not a string. Quote it if the consumer expects a string - TODO confirm.
date: 2026-04-29
benchmark_id: 001_synthetic_mine_throughput

harness:
  name: claude-code
  # NOTE(review): `tbc` looks like a placeholder - fill in when known.
  version: tbc
  notes: vanilla, plan mode enabled

model:
  name: claude-opus-4-7
  vendor: anthropic
  notes: 1M context, max thinking budget

# NOTE(review): presumably top-level run attributes rather than `model`
# fields - verify.
run_tag: plan-mode
operator: harry
status: complete

intervention:
  category: autonomous
  notes: "Single autonomous run; plan reviewed before exit-plan-mode, then executed end-to-end without nudges."

# NOTE(review): the two lines below are not YAML; they look like page text
# captured along with the file. Kept as comments so the document parses.
# submission.yaml
# ← Back to submission · View raw on GitHub