---
  # Recording / logging section. Every path-valued option below is commented
  # out, so record_recycle is the only key this file actually sets here.
  record:
    # record_rollouts: ""
    # NOTE(review): -1 looks like a "disabled / no limit" sentinel — confirm
    # against the code that consumes this config.
    record_recycle: -1
    # log_filename: /nfs/data//object_data/all/randomdist/default/attn/log/inter.log
    # load_dir: /nfs/data//object_data/all/breakout/attn/testrun/
    # save_dir: /nfs/data//object_data/all/randomdist/attn/default/
    # load_intermediate: /hdd/datasets/ac_data/null/1innull
    # save_intermediate: /hdd/datasets/ac_data/null/1innull
  # Environment selection: the environment name and the variant of it to use.
  environment:
    env: Box2D
    variant: default-all
    # load_environment: /work/pi__umass_edu//object_data/RandomDAG/1_in/
    # Capitalized `True` is loaded as a YAML boolean, not a string.
    load_trace: True
  # Compute-device settings.
  torch:
    # NOTE(review): presumably the CUDA device index — confirm with the loader.
    gpu: 0
    # Boolean false; by its name this leaves CUDA enabled — TODO confirm.
    no_cuda: False
  # Pretraining section; only the iteration count is set in this file.
  pretrain:
    # NOTE(review): 0 presumably means the pretraining phase is skipped —
    # confirm against the training script.
    num_iters: 0
  # Main training section: data source, batch size, logging cadence and
  # iteration budget.
  train:
    train: True
    num_frames: 500000
    train_test_order: time
    # load_rollouts: /work/pi__umass_edu//object_data/RandomDAG/1_in/
    load_rollouts: /data//object_data/box2d/default_all/
    batch_size: 256
    log_interval: 1000
    # num_iters used to be defined twice in this mapping (0, then 40000).
    # Duplicate mapping keys are invalid YAML: strict loaders reject the file
    # and last-wins loaders silently used 40000, so only that value is kept.
    num_iters: 40000
    param_update_frequency: 10000
  # Settings for the multi-interaction component. The `evaluate` switch is
  # commented out, so it is not set by this file.
  multi_inter:
    # evaluate: True
    max_combination: 1
    # NOTE(review): presumably a distance tolerance/threshold — confirm units
    # and meaning with the consumer.
    dist_epsilon: 0.1
  # Settings for the "active" component.
  active:
    # Plain scalar containing a space: YAML loads this as the single string
    # "1 -1", not as a list of two numbers. Presumably the consumer splits it
    # on whitespace — TODO confirm.
    full_weighting: 1 -1
  # Interaction-model training options: which name(s) to train, the forms
  # used for pretraining and training, and the weighting scheme.
  inter:
    train_names: Target
    pretrain_forms: full
    train_forms: full
    predict_dynamics: True
    # NOTE(review): "trace" presumably relates to environment.load_trace being
    # enabled — confirm against the loader.
    weighting_type: trace
  # Inference options: inference type, how often it runs, the target name(s),
  # and the weighting modes for training vs. evaluation.
  infer:
    infer_types: gradient
    # NOTE(review): interval is presumably counted in training iterations
    # (same value as train.log_interval) — confirm.
    infer_interval: 1000
    infer_names: Target
    train_weight_infer: sample_active_full_weights
    eval_weight_infer: trace_weights
    train_mask_mode: full
    # Sub-options for the "gradient" inference type selected in infer_types.
    gradient:
      select_ideal: True
  # Network definition: top-level sizes and type, followed by per-component
  # sub-sections (factor_net, mask_attn) and optimizer hyperparameters.
  interaction_net:
    # Plain scalar with spaces: loaded as the single string "512 512 512",
    # not a list. Presumably split into per-layer sizes by the consumer —
    # TODO confirm.
    hidden_sizes: 512 512 512
    net_type: keypair
    init_form: xnorm
    embed_dim: 512
    activation: leakyrelu
    # Options for the factor sub-network; the two layer-size overrides below
    # are commented out and therefore not set by this file.
    factor_net:
      repeat_layers: False
      reduce_function: sum
      num_pair_layers: 1
      # embed_layers: 512
      # final_layers: 512
    # Options for the masked-attention sub-network.
    mask_attn:
      model_dim: 256
      num_heads: 16
      num_layers: 2
      cluster: False
      num_clusters: 0
      attention_dropout: 0.1
      merge_function: sum
      mask_mode: query
      # NOTE(review): -1 looks like a "disabled" sentinel — confirm.
      gumbel_attention: -1
      append_keys: True
      no_hidden: True
    # Optimizer hyperparameters.
    # NOTE(review): both `alpha` and `betas` are present; presumably which
    # ones are read depends on the optimizer chosen elsewhere — confirm.
    optimizer:
      lr: .0001
      alt_lr: .00009
      eps: .00001
      alpha: 0.99
      # Loaded as the single string "0.9 0.999", not a list of two floats.
      betas: 0.9 0.999
      weight_decay: 0.0000
...