# MRP config: which reward process to run and its basic parameters.
# NOTE(review): the notes in this stanza are inferred from key names only;
# confirm them against the code that loads this file.
# Presumably selects the Boyan-chain MRP - verify the accepted values.
mrp: boyan
num_states: 5
# Presumably only consulted for a cartpole MRP and ignored when mrp is
# boyan - TODO confirm.
num_cartpole_bins: 2
# Presumably the discount factor - confirm.
gamma: 0.9

# Feature config: how states are mapped to feature vectors.
# NOTE(review): the notes in this stanza are inferred from key names only;
# confirm them against the code that loads this file.
# Same value as num_states in this file; whether the two must match when
# feature_mode is one-hot is not visible here - TODO confirm.
feature_dim: 5
feature_mode: one-hot
# Presumably whether the true value function is exactly representable by
# the features - confirm.
representable: false
# Exact meaning is not evident from this file - verify against the loader.
expected_feature: true

# Model config: architecture settings for the model being trained.
# NOTE(review): the notes in this stanza are inferred from key names only;
# confirm them against the code that loads this file.
# Presumably the number of layers - confirm.
layer_num: 2
# Same value as val_ctxt_start in the evaluation stanza of this file.
context_len: 5
# Presumably means no nonlinearity is applied - confirm.
activation: identity
# The meaning of "auto" is not evident from this file - verify the accepted
# values in the consumer.
tf_mode: auto
# Which constraint this enables is not visible here - TODO confirm.
constrained: true

# Training config: optimizer settings, training target, and run length.
# NOTE(review): the notes in this stanza are inferred from key names only;
# confirm them against the code that loads this file.
# Exact meaning is not evident from this file - verify against the loader.
enumerated_context: true
# Presumably the learning rate - confirm.
lr: 0.001
weight_decay: 0.0
batch_size: 16
# Presumably selects a temporal-difference training target - verify the
# accepted values.
target: TD
# Presumably a Monte Carlo step count; whether it is used when target is TD
# is not visible here - TODO confirm.
# NOTE(review): this is the only key in the file that is not
# lower_snake_case; it is left unchanged because the consumer reads it by name.
MC_steps: 100
# Presumably the total number of training steps - confirm.
steps: 1000
# Presumably logs every 100 steps, i.e. 10 times over the 1000 steps above -
# confirm.
log_interval: 100

# Evaluation config for MSVE vs. context length.
# NOTE(review): the notes in this stanza are inferred from key names only;
# confirm them against the code that loads this file.
# Presumably the number of validation instances evaluated - confirm.
val_instances: 2
# Context-length sweep: start 5, end 50, step 5. Whether the end value is
# included in the sweep depends on the consumer - TODO confirm.
val_ctxt_start: 5
val_ctxt_end: 50
val_ctxt_step: 5
# Presumably draws the plot on a logarithmic scale; which axis is affected
# is not visible here - confirm.
val_plot_log_scale: true