# @package _global_
defaults:
  - /experiment/timeseries/base_corelogic.yaml
  - override /model: id


scheduler:
  num_training_steps: ${eval:"${trainer.max_epochs} * ${dataset.steps_per_epoch} / ( ${loader.batch_size} * ${trainer.devices} )"} #300000
  num_warmup_steps: ${eval:"${scheduler.num_training_steps} / 10"} 

trainer:
  devices: 1
  max_epochs: 34
  accelerator: gpu ## Change to gpu if available later

encoder:
  _name_: set_encoder
  chunk_size: 3
  architecture: MLP
  nr_attention_heads: 5
  feature_embedding_dim: 5
  debug: True
  #feature_embedding_dim: 100
  #common_pool_embedding_dim: 5
  #num_states:  # total number of states minus 2
  n_attn_summary_statistics: True
  dropout: 0.1 # 0
#total 142000 loans
dataset:
  load_data: True
  data_path: "${oc.env:BASE_PATH,}/data/corelogic/loan_data_top4_zip_52.npz" #"/data/mortgage_new2/"
  num_states: 50 #Total number of features minus 2 
  save_data: False
  max_to_sample: 4500
  nr_loans_to_sample: 2500 #1 #700   # 6000
  steps_per_epoch: 40 #40 #28000 #40 #40  #40 # sum to 60 000
  val_split: 0.3 # Let's not use these
  test_split: 0.1
  sample_random_loan_index: True
  sample_random_time_index: True
  val_split_date: "2002-06"
  test_split_date: "2003-06"
  eval_mode: False
  rolling_model: True
  rolling_start_epoch: 15
  rolling_epoch_interval: 1
  use_time_weighting: True
  time_weighting_half_life: 24
  dataset_config:
    database_size: 400000

model:
  # TODO examine this achitecture in detail.
  n_layers: 4 # 3 for nn
  d_model: 32
  dropout: 0.1
  transposed: false # Actually faster than "true"
  tie_dropout: true
  norm: null
  #prenorm
  layer:
    _name_: id_lookback
    activation: relu #gelu # gelu for nn
    dropout: 0.1
    T: 0 # Lookback 1.

optimizer:
  lr: 0.003
  weight_decay: 0.05 #0.05 0

loader:
  batch_size: 1
  #batch_size: 1

wandb:
  name: "nn_cl_4zip_forward_shift"
  project: "corelogic-mortgage"