# @package _global_
defaults:
  - /experiment/equities/base_equities.yaml


scheduler:
  num_training_steps: ${eval:"${trainer.max_epochs} * ${dataset.steps_per_epoch} / ( ${loader.batch_size} * ${trainer.devices} )"} #300000
  num_warmup_steps: ${eval:"${scheduler.num_training_steps} / 10"} 

trainer:
  devices: 1
  max_epochs: 30
  accelerator: gpu ## Change to gpu if available later

decoder:
  output_scale: 350
  l1_normalize: True

encoder:
  _name_: set_encoder
  chunk_size: 3
  architecture: MLP
  nr_attention_heads: 1
  feature_embedding_dim: 5
  n_attn_summary_statistics: True
  dropout: 0.1 # 0
  debug: True
  include_y_in_output: True
  return_raw_input: False
  
dataset:
  _name_: equities_dataset
  num_states: 77 #15 # num_features -2
  dataset_config:
      daily_price_data_path: "${oc.env:EQUITIES_DATA_PATH,}/daily_price_data_n_equities_4000.npz"
      train_beg_date: 20130101 #19900101 # try later (8 years)
      train_end_date: 20201231
      val_beg_date: 20210101
      val_end_date: 20211231
      test_beg_date: 20220101
      test_end_date: 20221231
      #train_beg_date: 19900101
      #train_end_date: 20201231
      #val_beg_date: 20210101
      #val_end_date: 20211231
      #test_beg_date: 20220101
      #test_end_date: 20221231
  train_frac: 0.8
  val_frac: 0.1
  test_frac: 0.1
  alpha_price: 100
  alpha_vol: 0.5
  sequence_length: 246 # nr_timesteps
  stocks_sample: 500 # cross section
  nr_loans_to_sample: 500
  load_data: True
  save_data: False
  data_path: "${oc.env:BASE_PATH,}/data/equities/equity_dataset_2021.npz"
  steps_per_epoch: 25
  feature_set: [
    "return", # daily return
    "suv",
    "beta",
    "spread",
    "residual_volatility",
    "return_1week", # weekly return
    "ST_Rev", # short term return (1 month)
    "r2_1", # 2->1 month momentum
    "r12_2", # 12->2 month momentum
    "r12_7", # 12->7 month momentum
    "r36_13", # 36->13 month momentum
    "Rel2High", # relative to high (1 year)
    "volume", 
    "risk_free_rate", 
    "yearly_accounting_vars", 
    "trailing_volatility",     # 2 dim
    ]

model:
  n_layers: 1
  dropout: ${encoder.dropout}  #0
  d_model: 32 #300 # 32
  layer:
    _name_: attention_factors
    n_factors: 30  #30 # 10
    #no_factors: True
    kernel_dropout: ${encoder.dropout}  #0
    weight_init: double_exp
    use_set_mixing: False
    set_mixing_architecture: MLP
    nr_layers_with_set: 1
    set_mixing_dropout: ${encoder.dropout} # 0
    set_feature_embedding_dim: 5 # 5
    set_debug: ${encoder.debug}
    set_nr_attn_heads: 1
    l_max: ${dataset.sequence_length}
    use_attention_factors: True
    n_assets: ${dataset.stocks_sample}
    use_factor_portfolio: True
    kernel_len: 30 # 20
  __l_max: ${model.layer.l_max}

optimizer:
  lr: 0.003 #0.003
  weight_decay: 0.05 #0.05 0

loader:
  batch_size: 1
  #batch_size: 1

wandb:
  project: 'attention-factors-equities'
  name: "attention_factors_equities"

task:
  loss: next_step_sharpe_ratio_with_residual_loss   
  metrics: [res_loss, next_step_sharpe_ratio_with_residual_loss, next_step_sharpe_ratio_positive, sharpe_ratio_market, compute_portfolio_metrics]