# Top-level run settings.
# NOTE(review): key meanings are inferred from their names only; confirm
# against the code that consumes this config.
log_dir: tb-large-rm
device: auto

# `tb` matches the name of the top-level `tb:` section in this file;
# presumably this key selects that section (verify against the loader).
algo: tb
training_steps: 300000
eval_every: 2000
print_every: 100
save_at_valid: true
seed: 42
lr: 0.0005
compute_automorphism: false
scale_reward: false

# Environment selection. `name` matches the nested `graphenv` key, which holds
# that environment's settings (presumably looked up by name; verify).
env:
  name: graphenv
  graphenv:
    num_node_types: 1
    num_edge_types: 1
    # Size limits; note that max_edges is max_nodes - 1 in this config.
    max_nodes: 10
    max_edges: 9
    max_degree: 4
    remove_duplicates: true
    # Reward settings. NOTE(review): min_reward looks like a lower bound on
    # the reward named by reward_name; confirm in the environment code.
    min_reward: 0.1
    reward_name: num_cycles

# Featurizer options.
# NOTE(review): presumably these toggle node features (random-walk based,
# degree, clustering coefficient); confirm against the featurizer code.
featurizer:
  random_walk_length: 4
  add_degree: true
  add_clustering_coef: true

# Model size hyperparameters.
# NOTE(review): if embed_dim is split evenly across num_heads, that is
# 256 / 4 = 64 per head; confirm how the model uses these values.
model:
  embed_dim: 256
  num_layers: 5
  num_heads: 4


# Settings for the `tb` algorithm (the top-level `algo` key is set to `tb`).
# NOTE(review): key meanings are inferred from their names only; confirm
# against the training code.
tb:
  algo:
    grad_norm_clip: 1.0
    learn_backward: false
  dataset:
    # 32 online + 32 buffer samples are configured here; presumably they are
    # combined into one training batch (verify in the dataset code).
    num_online_samples: 32
    num_buffer_samples: 32
    buffer_size: 2000
    exploration_epsilon: 0.1
  dataloader:
    num_workers: 64
    prefetch_factor: 2
    persistent_workers: true
    # Explicit null replaces a bare empty value, which YAML also parses as
    # null, so the loaded value is unchanged.
    # NOTE(review): confirm null (rather than a missing number) is intended;
    # presumably the dataset yields ready-made batches.
    batch_size: null