# Run-level settings: every scalar that sits outside the nested sections below.
# desc holds the literal string "noDesc".
desc: noDesc
# Both directories are written as relative paths; what they are resolved
# against is not visible in this file.
log_dir: logs/synflow_64_1
env_dir: ./data/envs/synflow_64
device: cpu
seed: 0
validate_every: 1000
# null: no checkpoint interval is set.
checkpoint_every: null
store_all_checkpoints: false
print_every: 1
start_at_step: 0
num_final_gen_steps: 100
num_training_steps: 5000
num_workers: 0
num_workers_retrosynthesis: 8
# NOTE(review): hostname and git_hash look like provenance recorded for this
# run rather than tunable settings - confirm against the code that writes them.
hostname: piotr-gainski2.laptop.matinf.uj.edu.pl
pickle_mp_messages: false
# Quoted so the abbreviated hash is always read as a string; an all-digit
# abbreviation would otherwise load as an integer.
git_hash: '38176b9'
overwrite_existing_exp: false
# Algorithm section: general trajectory/sampling settings first, then one
# nested mapping per parameter group (tb, action_sampling, moql, a2c, fm, sql).
algo:
  # NOTE(review): with method TB, presumably only the `tb` group below drives
  # the loss and moql/a2c/fm/sql are carried along unused - confirm.
  method: TB
  global_batch_size: 64
  min_len: 2
  max_len: 5
  max_nodes: 9
  max_edges: 128
  illegal_action_logreward: -75.0
  # Both offline ratios are 0.0.
  offline_ratio: 0.0
  valid_offline_ratio: 0.0
  # Random-action probability is 0.05 for training and 0.0 for validation.
  train_random_action_prob: 0.05
  # null: no value is set.
  train_det_after: null
  valid_random_action_prob: 0.0
  sampling_tau: 0.9
  tb:
    bootstrap_own_reward: false
    # null: no value is set.
    epsilon: null
    reward_loss_multiplier: 1.0
    # Same value as algo.method above.
    variant: TB
    # Every do_* switch in this group is false.
    do_correct_idempotent: false
    do_parameterize_p_b: false
    do_predict_n: false
    do_sample_p_b: false
    do_length_normalize: false
    subtb_max_len: 128
    # These differ from opt.learning_rate (0.0001) and opt.lr_decay (20000.0).
    # NOTE(review): presumably applied to a separately optimized Z term - confirm.
    Z_learning_rate: 0.001
    Z_lr_decay: 50000.0
    cum_subtb: true
  action_sampling:
    num_mc_sampling: 1
    # Same value (629) as max_sampling_reactbi below.
    num_sampling_add_first_reactant: 629
    # NOTE(review): presumably a ratio whose result is bounded by
    # min_sampling_reactbi / max_sampling_reactbi (100 and 629) - confirm.
    sampling_ratio_reactbi: 0.01
    max_sampling_reactbi: 629
    min_sampling_reactbi: 100
    onpolicy_temp: 1.0
  # moql, a2c and sql all carry gamma 1.0 and penalty -10.0.
  moql:
    gamma: 1.0
    num_omega_samples: 32
    # Matches cond.moo.num_objectives (2) and the two entries of
    # task.moo.objectives.
    num_objectives: 2
    lambda_decay: 10000
    penalty: -10.0
  a2c:
    entropy: 0.01
    gamma: 1.0
    penalty: -10.0
  fm:
    # Keep the dot and the signed exponent: some YAML 1.1 loaders read shorter
    # spellings such as 1e-38 as a string instead of a float.
    epsilon: 1.0e-38
    balanced_loss: false
    leaf_coef: 10.0
    correct_idempotent: false
  sql:
    alpha: 0.01
    gamma: 1.0
    penalty: -10.0
# Model section: general sizes first, then the *_building_block settings and
# one nested mapping per transformer type.
model:
  num_layers: 4
  num_emb: 128
  dropout: 0.0
  # NOTE(review): fp_radius / fp_nbits look like fingerprint parameters for
  # building blocks - confirm against the model code.
  fp_radius_building_block: 2
  fp_nbits_building_block: 1024
  # Zero layers are configured for the building-block part.
  num_layers_building_block: 0
  num_emb_building_block: 64
  # Both transformer groups use num_heads 2.
  graph_transformer:
    num_heads: 2
    ln_type: pre
    num_mlp_layers: 0
  seq_transformer:
    num_heads: 2
    posenc: Rotary
# Optimizer section; the nested `opt` key names the optimizer (adam).
opt:
  opt: adam
  learning_rate: 0.0001
  lr_decay: 20000.0
  # Keep the dot and the signed exponent in the 1.0e-08 values: some YAML 1.1
  # loaders read shorter spellings such as 1e-8 as a string.
  weight_decay: 1.0e-08
  # NOTE(review): momentum is set although opt is adam; presumably only read
  # by a momentum-based optimizer - confirm.
  momentum: 0.9
  # NOTE(review): clip_grad_param is presumably the threshold used by the
  # `norm` clipping type - confirm.
  clip_grad_type: norm
  clip_grad_param: 10.0
  adam_eps: 1.0e-08
# Replay section; `use` is false in this run.
# NOTE(review): the remaining keys are presumably ignored while `use` is
# false - confirm against the consumer.
replay:
  use: false
  capacity: 10000
  warmup: 0
  hindsight_ratio: 0.0
# Task section: one nested mapping per task group (moo, sbdd, docking).
task:
  moo:
    n_valid: 15
    n_valid_repeats: 128
    # Two objectives, in their original order; the count matches
    # cond.moo.num_objectives and algo.moql.num_objectives (both 2).
    objectives: [vina, qed]
    log_topk: false
    online_pareto_front: true
  # Every `???` below is a value left unfilled in this file.
  # NOTE(review): presumably OmegaConf's mandatory-missing marker - confirm
  # against the loader before relying on these keys.
  sbdd:
    proxy: ???
    pocket_db: ???
    pocket_dim: 128
  docking:
    protein_path: ???
    center: ???
# Conditioning section: one nested mapping per conditioning type
# (temperature, moo, weighted_prefs, focus_region).
cond:
  valid_sample_cond_info: true
  temperature:
    sample_dist: uniform
    # NOTE(review): presumably the two bounds of the uniform distribution
    # named above - confirm.
    dist_params: [16, 64]
    num_thermometer_dim: 32
  moo:
    # Matches algo.moql.num_objectives (2) and the two entries of
    # task.moo.objectives.
    num_objectives: 2
    num_thermometer_dim: 16
  weighted_prefs:
    preference_type: dirichlet
    preference_param: 1.5
  focus_region:
    focus_type: centered
    # The key is spelled "thermomether" here; keep it as is unless the
    # consuming code is renamed in the same change.
    use_steer_thermomether: false
    focus_cosim: 0.98
    focus_limit_coef: 0.1
    focus_model_training_limits: [0.25, 0.75]
    focus_model_state_space_res: 30
    max_train_it: 20000
