---
# Flat key/value settings for one run. Keys are kept in alphabetical order.
# NOTE(review): the per-key remarks below are read off the key names and
# values only; confirm each against the code that loads this file.

ACT: EPS_GREEDY
ALPHA: 1.3
BATCH_SIZE: 5
BOARD_SIZE: 6
BUCKET_SPACE: 4
COLOR_SPACE: 4
# EPS_*: presumably the epsilon schedule used when ACT is EPS_GREEDY - verify.
EPS_DECAY: 200
EPS_END: 0.001
EPS_START: 0.9
FEATURIZATION: ONE_STEP_UNARY_BINARY_WITHOUT_INDEX
FINITE: true
FIX_CGS_SEED: false
GAMMA: 1
GRAD_BATCH_SIZE: 128
INIT_OBJ_COUNT: 5
LEARNER: DQN
LR: 0.01
NORMALIZE: false
OBJECT_SPACE: 16
OPTIMIZER: ADAM
# Relative path; what it is resolved against is not visible here.
OUTPUT_DIR: outputs/B_t_T
RECORD: 1
REPEAT: 5
REPLAY_BUFFER_SIZE: 1000
RULE_NAME: bottom_then_top
RUN_MODE: TRIAL
R_ACCEPT: 0
R_REJECT: -1
# -1 is presumably a sentinel for "no fixed seed" - TODO confirm.
SEED: -1
SHAPE_SPACE: 4
SHAPING: false
# List of free-form strings (the third entry repeats RULE_NAME's value).
TAG:
  - 'last summer rule'
  - 'DQN'
  - 'bottom_then_top'
  - 'full random'
TARGET_UPDATE_FREQ: 200
TEST_EPISODES: 40
TEST_FREQ: 30
TRAIN_EPISODES: 200
TRAIN_HORIZON: 100
# Value carries a .csv extension; presumably used as a file name - confirm.
TRIAL_NAME: broad_clock_shape.csv
VERBOSE: 0
WEIGHT_SAVE_FREQ: 100
