# Dataset settings. The /path/to/... values are placeholders; point them at
# the local train and test text files before running.
data_params:
  # Presumably the RNG seed used on the data side - confirm against the loader.
  data_seed: 2024
  train_path: /path/to/data/wikipedia/wikitext_train.txt
  test_path: /path/to/data/wikipedia/wikitext_test.txt
# Model settings.
model_params:
  latent_dim: 8
  eps: 1.0e-6
  hidden_size: 128
  model_name: gpt2
  # Only used for an LLM backbone. When enabled, it overrides
  # optim_params.optimizer_name so that the Adam8bits optimizer provided by
  # bitsandbytes is used instead.
  load_in_8bit: false
# Loss selection. How `loss` and `name` are combined is decided by the
# consuming code - presumably `loss` picks the loss family and `name` the
# variant; TODO confirm.
loss_params:
  loss: cl_loss
  name: triplet
# Optimizer and learning-rate schedule settings.
optim_params:
  batch_size: 32
  # May be replaced at runtime: see the note on model_params.load_in_8bit.
  optimizer_name: SGD
  # NOTE(review): written in float notation, so it loads as a float (50000.0),
  # not an int - confirm the consumer casts it if it needs an integer step count.
  decay_steps: 5.0e+4
  decay_factor: 0.01
  learning_rate: 0.0001
  moving_average_decay: 0.9999
  momentum: 0.9
# Run-level settings: schedule, device, seeding and output location.
experiment_params:
  # NOTE(review): this value (10) is larger than num_epochs (4). If it is a
  # "save every N epochs" interval, no periodic checkpoint would be written
  # during a run - confirm this is intended.
  checkpoint_epochs: 10
  num_epochs: 4
  device: cuda
  # Same value as data_params.data_seed; keep the two in sync if they are
  # meant to match.
  seed: 2024
  data_loader_workers: 4
  # Placeholder - replace with the directory where outputs should be written.
  exp_dir: /path/to/output
  exp_name: CLencoder_gpt_nll
# Document-level settings built around a saved sigma_ti_inv file.
doc_params:
  # Change this to the path where you saved the sigma_ti_inv file.
  # NOTE(review): the file name says "wikisection" while data_params points at
  # "wikitext" files - confirm the sigma file matches the dataset in use.
  sigma_ti_path: "/path/to/output/sigma/wikisection_sigma_Ti_inv.pkl"
  eval_batch_size: 64
  sigma_eps: 1.0e-3
  var_eps: 1.0e-6
  sigma_multiplier: 1.0e+4
  # Accepted values: standard, eye or var.
  sigma_type: "standard"
