# Configuration file for Semi-supervised GNN IRT Edge Weight Theta 16

# Data paths
# All four entries are relative CSV paths that go up one directory ("../")
# and into a data/ folder.
# NOTE(review): whether they resolve against the process working directory
# or against this file's location is decided by the loading code - confirm.
data:
  train_data: "../data/train_data.csv"
  test_data: "../data/test_data.csv"
  model_responses: "../data/model_responses.csv"
  model_costs: "../data/model_costs_and_tokens.csv"

# BERT embeddings paths
# Relative paths to .npy files. Note that these point directly at the parent
# directory ("../"), not at "../data/" like the CSV paths in `data`.
# NOTE(review): presumably one embedding row per row of the matching
# train/test CSV - confirm against the code that writes these files.
embeddings:
  train_embeds: "../train_embeds.npy"
  test_embeds: "../test_embeds.npy"

# BERT model configuration
# NOTE(review): these look like tokenizer/model-loading arguments (model
# identifier, maximum sequence length, truncation flag, padding strategy);
# confirm how the embedding script actually consumes them.
bert:
  model_name: "bert-base-uncased"
  max_length: 512
  truncation: true
  # String value, not a boolean; presumably means "pad every input to
  # max_length" - confirm.
  padding: "max_length"

# Graph construction parameters
# The `inference` section further down repeats the same two keys with the
# same values (3, "cosine").
# NOTE(review): presumably a k-nearest-neighbour graph built with the given
# distance metric; if train-time and inference-time graphs must match, the
# two sections have to be edited together - confirm.
graph:
  k_neighbors: 3
  metric: "cosine"

# Model architecture parameters
model:
  hidden_dim: 64
  # Matches the "Theta 16" in this file's header comment.
  # NOTE(review): presumably also the value substituted for the {theta_dim}
  # placeholder in output.predictions - confirm.
  theta_dim: 16
  dropout: 0.3

# Training parameters
training:
  epochs: 200
  # Exponent floats are written with an explicit mantissa dot on purpose:
  # YAML 1.1 loaders (PyYAML among them) resolve dot-less forms such as
  # 1e-3 to the *string* "1e-3" instead of a float. 1.0e-3 is a float under
  # both YAML 1.1 and YAML 1.2.
  learning_rate: 1.0e-3
  weight_decay: 1.0e-5
  batch_size: null  # Not used in current implementation

# Semi-supervised learning parameters
semi_supervised:
  # NOTE(review): presumably the fraction of training entries that are
  # masked, and the value substituted for the {mask_ratio} placeholder in
  # the `output` file names - confirm.
  mask_ratio: 0.9
  # Same value as the top-level `random_seed` (42).
  # NOTE(review): confirm which of the two the code reads for which purpose
  # and whether they are meant to stay equal.
  seed: 42

# Inference parameters
# Same keys and values as the `graph` section above (3, "cosine").
# NOTE(review): presumably used to attach test items to the graph at
# prediction time; confirm whether these must stay equal to `graph`.
inference:
  k_neighbors: 3
  metric: "cosine"

# Output file paths
# Every value is a bare file name (no directory part) containing a
# {mask_ratio} placeholder; only `predictions` also contains {theta_dim}.
# NOTE(review): the placeholders are presumably filled in by the loading
# code (e.g. str.format) from semi_supervised.mask_ratio and
# model.theta_dim - confirm.
# NOTE(review): because the other names omit {theta_dim}, runs that differ
# only in theta_dim would map to identical file names - confirm whether
# overwriting is intended.
output:
  train_mask_info: "train_mask_info_mask_ratio_{mask_ratio}.csv"
  cost_saving: "cost_saving_mask_ratio_{mask_ratio}.txt"
  predictions: "predicted_llm_performance_theta_{theta_dim}_mask_ratio_{mask_ratio}.csv"
  a_train: "a_train_mask_ratio_{mask_ratio}.csv"
  b_train: "b_train_mask_ratio_{mask_ratio}.csv"
  theta: "theta_mask_ratio_{mask_ratio}.csv"
  a_test: "a_test_mask_ratio_{mask_ratio}.csv"
  b_test: "b_test_mask_ratio_{mask_ratio}.csv"

# Device configuration
# NOTE(review): presumably selects CUDA device index `device_id` when
# `use_cuda` is true; what happens when CUDA is unavailable is up to the
# consuming code - confirm.
device:
  use_cuda: true
  device_id: 0

# Random seed
# Same value as semi_supervised.seed (42).
# NOTE(review): confirm which of the two the code reads for which purpose
# and whether they are meant to stay equal.
random_seed: 42
