# MRP config
# Settings for the MRP (presumably "Markov reward process") used by the run.
# NOTE(review): key meanings in this stanza are inferred from their names
# only; confirm against the code that loads this file.
# Identifier of the MRP variant to use.
mrp: boyan
# Presumably the number of states in the MRP - TODO confirm.
num_states: 5
# NOTE(review): the name looks cartpole-specific; presumably ignored when
# `mrp` is `boyan` - verify before relying on it.
num_cartpole_bins: 2
# Presumably the discount factor - TODO confirm.
gamma: 0.9

# feature config
# Presumably the dimension of each state's feature vector - TODO confirm.
# Currently the same value as `num_states` (5).
feature_dim: 5
# Feature construction mode, given as a plain string.
feature_mode: one-hot
# NOTE(review): presumably states whether the value function is exactly
# representable by the features. It is `false` here even though the features
# are one-hot with feature_dim == num_states - confirm this is intended.
representable: false
# Boolean flag; semantics are not visible from this file - see the loader.
expected_feature: true

# model config
# NOTE(review): key meanings in this stanza are inferred from their names
# only; confirm against the model-construction code.
# Presumably the number of layers in the model - TODO confirm.
layer_num: 30
# Presumably the context length used for training; it equals
# `val_ctxt_start` (5) in the evaluation stanza.
context_len: 5
# Activation selector, given as a plain string.
activation: identity
# Mode selector for the model; what `auto` stands for is not visible here.
tf_mode: auto
# Boolean flag; presumably restricts the model's parameters to a
# constrained form - verify against the model code.
constrained: true

# training config
# NOTE(review): key meanings in this stanza are inferred from their names
# only; confirm against the training script.
# Boolean flag; semantics are not visible from this file.
enumerated_context: true
# Presumably the optimizer learning rate. Kept in plain decimal notation:
# exponent forms such as 1e-3 are not read as floats by every YAML loader.
lr: 0.001
# Presumably the optimizer weight decay; 0.0 here.
weight_decay: 0.0
# Presumably the number of samples per training batch - TODO confirm.
batch_size: 64
# Training target selector, given as a plain string.
target: TD
# NOTE(review): presumably only relevant for a Monte Carlo target rather
# than `target: TD` - verify whether it is read in this configuration.
MC_steps: 200
# Presumably the total number of training steps - TODO confirm.
steps: 20000
# Presumably the logging period in steps; if so, 20000 / 1000 gives 20
# log points per run - TODO confirm.
log_interval: 1000

# evaluation config for msve vs. context length
# NOTE(review): "msve" is presumably the mean squared value error; key
# meanings below are inferred from their names only.
# Presumably the number of validation instances evaluated - TODO confirm.
val_instances: 10
# Start, end and step of the evaluated context lengths. Presumably a sweep
# from 5 to 100 in increments of 5; whether the end value is inclusive is
# not visible here - TODO confirm.
val_ctxt_start: 5
val_ctxt_end: 100
val_ctxt_step: 5
# Boolean flag; presumably switches the evaluation plot to a log scale.
val_plot_log_scale: true