metric,value
input_path,results/execution/state_reconstruction_direct_sample500_k5.jsonl
dataset_path,data/mathlib_subset_s4_submission_main_steps_checked.jsonl
dataset_rows,3723
seed,42
sample_size,500
max_k,5
lean_version,Lean 4.28.0
runtime,Lean 4.28 direct checking with cached build artifacts
job_id,redacted
walltime,redacted
n_queries,500
n_candidates,12500
executed_candidates,12255
candidate_execution_coverage,0.9804
executed_accept,4910
executed_reject,7345
reconstruction_unknown_identifier,198
reconstruction_elaboration,47
parse_error,0
timeout,0
infrastructure_error,0
best_accept_at_5_all,unguided
