# @package _global_
defaults:
  - /experiment/equities/base_equities.yaml


scheduler:
  num_training_steps: ${eval:"${trainer.max_epochs} * ${dataset.steps_per_epoch} / ( ${loader.batch_size} * ${trainer.devices} )"} #300000
  num_warmup_steps: ${eval:"${scheduler.num_training_steps} / 10"} 

trainer:
  devices: 1
  max_epochs: 30
  accelerator: gpu

train:
  seed: 1  #2222

encoder:
  _name_: set_encoder
  chunk_size: 3
  architecture: MLP
  nr_attention_heads: 1
  feature_embedding_dim: 5
  n_attn_summary_statistics: True
  dropout: 0.1 # 0
  debug: False
dataset:
  _name_: equities_dataset
  num_states: 77
  dataset_config:
      daily_price_data_path: "${oc.env:EQUITIES_DATA_PATH,}/daily_price_data_n_equities_4000.npz"
      train_beg_date: 20110101 
      train_end_date: 20181231
      val_beg_date: 20190101
      val_end_date: 20191231
      test_beg_date: 20200101
      test_end_date: 20201231
  train_frac: 0.8
  val_frac: 0.1
  test_frac: 0.1
  alpha_price: 100
  alpha_vol: 0.5
  sequence_length: 246 # nr_timesteps
  stocks_sample: 500 # cross section
  nr_loans_to_sample: 500
  load_data: True
  save_data: False
  data_path: "${oc.env:BASE_PATH,}/data/equities/equity_dataset_2019.npz"
  steps_per_epoch: 50
  feature_set: [
    "return", # daily return
    "suv",
    "beta",
    "spread",
    "residual_volatility",
    "return_1week", # weekly return
    "ST_Rev", # short term return (1 month)
    "r2_1", # 2->1 month momentum
    "r12_2", # 12->2 month momentum
    "r12_7", # 12->7 month momentum
    "r36_13", # 36->13 month momentum
    "Rel2High", # relative to high (1 year)
    "volume", 
    "risk_free_rate", 
    "yearly_accounting_vars", 
    "trailing_volatility",   
    ]

model:
  n_layers: 6  #1
  dropout: ${encoder.dropout}  #0
  d_model: 64
  layer:
    kernel_dropout: ${encoder.dropout}  #0
    weight_init: random
    use_set_mixing: True
    set_mixing_architecture: MLP
    nr_layers_with_set: 6  # 1
    set_mixing_dropout: ${encoder.dropout} # 0
    set_feature_embedding_dim: 5 # 5
    set_debug: ${encoder.debug}
    set_nr_attn_heads: 1
    l_max: ${dataset.sequence_length}
    kernel_len: 30 # 20
  __l_max: ${model.layer.l_max}

optimizer:
  lr: 0.003 #0.003
  weight_decay: 0.05 #0.05 0

loader:
  batch_size: 1

decoder:
  output_scale: 600
  l1_normalize: True
wandb:
  name: ${eval:"'equities_set_seq_seed' + str(${train.seed})"}
  project: 'equities-set-seq-model'