# Model settings
type: discrete
# Accepted values: 'uniform' or 'marginal'.
transition: marginal
model: graph_tf
diffusion_steps: 500
# Known options: 'cosine', 'polynomial_2'.
diffusion_noise_schedule: cosine
n_layers: 5

# Accepted values: 'all', 'cycles', 'eigenvalues' or null.
extra_features: null

# Do not set the edge widths too high (the 'E' entry of hidden_mlp_dims and
# 'dim_ffE' in hidden_dims): computing large tensors on the edges is costly.
# At the moment (03/08), y contains quite little information.
hidden_mlp_dims:
  'X': 256
  'E': 128
  'y': 128
  'pos': 64
  's': 256
hidden_dims:
  'dx': 256
  'de': 64
  'dy': 64
  'n_head': 8
  'dim_ffX': 256
  'dim_ffE': 128
  'dim_ffy': 128

# Previous setting, kept for reference:
# lambda_train: [0.4, 2, 0, 1, 5]
# Component order note: old order was p,x,c,e,y; new order is x,e,y,c,p.
# NOTE(review): this file does not state which ordering the active list below
# follows - confirm against the code that consumes lambda_train.
lambda_train: [1, 2, 0, 0.5, 0]

# One numeric value per component key (p, x, c, e, y).
# NOTE(review): the meaning of nu is not documented in this file - confirm
# against the code that consumes it.
nu:
  p: 2.5
  x: 1
  c: 1
  e: 1.5
  # Quoted on purpose: a bare y is a boolean literal under YAML 1.1 rules, so
  # strict loaders would turn this key into true instead of the string "y".
  'y': 1

n_layers_delt: 1
hidden_mlp_dims_delt:
  'X': 64
  'E': 32
  'y': 64
  'pos': 8
  's': 8
# The dimensions should satisfy dx % n_head == 0.
hidden_dims_delt:
  'dx': 64
  'de': 16
  'dy': 32
  'n_head': 8
  'dim_ffX': 64
  'dim_ffE': 32
  'dim_ffy': 64
# Larger alternative (currently disabled):
# hidden_mlp_dims_delt: {'X': 256, 'E': 128, 'y': 256, 'pos': 8, 's': 8}
# hidden_dims_delt: {'dx': 256, 'de': 64, 'dy': 64, 'n_head': 8, 'dim_ffX': 256, 'dim_ffE': 128, 'dim_ffy': 256}