# @package _global_
defaults:
  - /pipeline: timeseries_synthetics
  - /model: long-conv
  - override /scheduler: cosine_warmup

model:
  dropout: 0.1
  tie_dropout: true
  n_layers: 6
  d_model: 32 #4
  prenorm: false
  layer:
    l_max: 50
    learning_rate: 0.001
    lam: 0.001
    kernel_dropout: 0.2
    postact: glu
    bidirectional: false
 # transposed: true

loader:
  batch_size: 100 #50
  num_workers: 0 #4
  pin_memory: false
  #multiprocessing_context: spawn

optimizer:
  lr: 0.01
  weight_decay: 0.05

trainer:
  max_epochs: 100
  devices: 1


train:
  seed: 2222
  monitor: val/next_step_log_loss_valid_indices  #val/next_step_log_loss
  mode: min
  #ckpt: "${oc.env:BASE_PATH,}/outputs"

task:
  loss: next_step_log_loss_valid_indices
  metrics: [next_step_log_loss_valid_indices]  #performance_decay log_loss_not_using_path_variable 

#task:
#  loss: next_step_log_loss_ignore_terminal
#  metrics: [next_step_log_loss_ignore_terminal]


wandb:
  name: ts
  #save_dir: ${oc.env:BASE_PATH,}/

encoder:
  _name_: timeseries_synthetics
  #  _name_: absolute_time
  #  _name_: positional_linear
  #  _name_: timeseries_synthetics
  # _name_: calendar_positional_linear
  # _name_: set_encoder

dataset:
  _name_: corelogic_loan_dataset
  dataset_name: "corelogic_loan_dataset"
  num_states: 50 #Total number of features minus 2  # Total minus 2 # 10
  num_terminal_states: 2 # 2
  val_split: 0.15
  test_split: 0.15
  load_data: True
  data_path: "${oc.env:BASE_PATH,}/data/corelogic/loan_data.npz" #"/data/mortgage_new2/"
  save_data: True
  nr_sampling_timesteps: ${model.layer.l_max}
  max_to_sample: 100
  nr_loans_to_sample: 70
  sample_random_loan_index: True,
  sample_random_time_index: True,
  dataset_config:
    path_origination: "${oc.env:CORELOGIC_DATA_PATH,}/filtered_origination_data_top_4_zips.csv"
    path_performance: "${oc.env:CORELOGIC_DATA_PATH,}/filtered_performance_data_top_4_zips.csv"
    database_size: 1000
    start_year: 1988
    end_year: 2023
    columns_to_normalize_origination: [
                "fico_score_at_origination", 
                "original_balance", 
                "initial_interest_rate", 
                "original_ltv"
                ]
    columns_to_normalize_performance: [
                "current_balance", 
                "current_interest_rate", 
                "scheduled_monthly_pi",
                "scheduled_principal",
                "mba_days_delinquent"
                ]
    feature_set: [
                "current_state", #8
                'fico_score_at_origination', # 1
                "original_balance",  # 1
                "initial_interest_rate", # 1 
                "original_ltv", # 1
                "unemployment_rate",  # 1
                "national_mortgage_rate", # 1 
                "current_balance",  # 2
                "current_interest_rate", # 2 
                "scheduled_monthly_pi", # 2
                "scheduled_principal", # 2 
                "mba_days_delinquent", # 2
                "inferred_collateral_type", # 2
                "convertible_flag", # 2
                "pool_insurance_flag", # 2
                "io_flag", # 2
                "prepay_penalty_flag", # 2
                "negative_amortization_flag", # 2
                "buydown_flag", # 2,
                "lagged_foreclosure_rate", # 1
                "lagged_prepayment_rate", # 1
                ] 
    nr_classes: 8
  __l_max: ${model.layer.l_max}

decoder:
  _name_: tranistion_step_decoder 
  hidden_dim: ${model.d_model}
  num_states: 8
  lookback_horizon: 25
  forecast: false
  forecast_horizon: 5
  loan_pool_size: 1