submission.yaml

← Back to submission · View raw on GitHub

# Metadata record describing a single benchmark submission (one run).
# In this file the id equals the date, benchmark_id, harness name, model name
# and run_tag values joined with "__"; presumably that is the required
# convention - verify against the submission schema before editing any of them.
submission_id: 2026-04-29__001_synthetic_mine_throughput__claude-code__claude-opus-4-7__plan-mode
# NOTE(review): unquoted ISO date. YAML 1.1 loaders resolve this to a date
# object rather than a string - confirm which type the consumer expects.
date: 2026-04-29
# Must stay in sync with the benchmark segment embedded in submission_id.
benchmark_id: 001_synthetic_mine_throughput
# Harness (agent tooling) the run was executed with.
harness:
  name: claude-code
  # NOTE(review): "tbc" looks like a placeholder - TODO record the actual
  # harness version once known.
  version: tbc
  notes: vanilla, plan mode enabled
# Model the harness was driving.
model:
  name: claude-opus-4-7
  vendor: anthropic
  notes: 1M context, max thinking budget
# Free-form label for this run; also the final segment of submission_id.
run_tag: plan-mode
operator: harry
status: complete
# Degree of human involvement during the run; the notes field holds the
# free-text justification for the chosen category.
intervention:
  category: autonomous
  notes: "Single autonomous run; plan reviewed before exit-plan-mode, then executed end-to-end without nudges."