# Run header.
# NOTE(review): `script` presumably names the entry-point script that consumes
# the remaining keys in this file — confirm with the launcher that reads it.
script: run_mcts.py
# YAML null (not the string "null"); presumably means "no starting algorithm".
# TODO confirm how the consumer treats a null here.
initial-algorithm: null
default-algorithm: "gradient descent"
# NOTE(review): the meaning of "new steps" is not visible from this file.
new-steps: 3

# Search configuration
# NOTE(review): key names (and the script name run_mcts.py) suggest tree-search
# settings; exact semantics must be confirmed against the consumer.
n-playouts: 1000000
# presumably the exploration constant used by the `uct` score function —
# TODO confirm
c: 1.0
score-fn: uct
temperature: 0.0
tree-reuse: true
# `stopping-factor` presumably only matters while `early-stopping` is true —
# verify against the consumer.
early-stopping: true
stopping-factor: 1.0
use-lucb: true
# presumably selects the statistic used to pick the final action — TODO confirm
best-action-metric: "q_value"

# Environment configuration
# NOTE(review): presumably describes the problem instance (a num-rows x
# num-cols system) — confirm against the environment code.
system-type: MID_COND
num-rows: 10000
num-cols: 50
condition-number: 2.0
prop-range: 1.0
# `lev` and `vt-dis` are abbreviated keys; their expansions and accepted
# values are not visible from this file — TODO confirm.
lev: low
vt-dis: gauss

# Loop configuration
# Three boolean switches; only `setup-loop` is enabled in this configuration.
# NOTE(review): what each loop covers is not visible from this file — confirm.
setup-loop: true
forward-loop: false
update-loop: false

# Solver configuration
# NOTE(review): meanings below are inferred from key names only — confirm.
max-iterations: 10
learning-rate: 0.5
# How these two integers relate to num-rows / num-cols is not visible here —
# TODO confirm.
sampling-factor: 8
batch-size: 100

# Reward configuration
# Four float weights followed by the reward mode switches.
# NOTE(review): with `condition-reward-only: true` below, some of these weights
# (e.g. decay/complexity) may be unused — confirm against the reward code.
base-weight: 1.0
decay-weight: 10.0
complexity-weight: 8.0
condition-weight: 1.0
reward-type: log
iterative-sketch: false
condition-reward-only: true

# Output configuration
# Both paths are YAML null; presumably the consumer falls back to a default
# location or skips that output — TODO confirm.
log-dir: null
db-path: null
# Fixed integer seed, presumably for reproducible runs — confirm which RNGs
# are actually seeded from it.
random-seed: 42

# Experiment tracking
target-algorithm: "preconditioner R1"
# A single comma-separated string, not a YAML sequence.
# NOTE(review): presumably split on "," by the consumer — confirm before
# converting this to a list.
focus-operator: "HHQR,MAT_INV,MAT_MAT_TRANS_MUL"
