# Configuration file for GNN IRT LLM Edge Weight

# Data paths
# All four entries are relative paths under `../data/`.
# NOTE(review): presumably resolved against the working directory of the
# script that loads this file — confirm.
data:
  train_data: "../data/train_data.csv"
  test_data: "../data/test_data.csv"
  model_responses: "../data/model_responses.csv"
  model_costs: "../data/model_costs_and_tokens.csv"

# BERT embeddings paths
# Bare file names with no directory component, unlike the `../data/` entries
# under `data`.
# NOTE(review): presumably NumPy arrays holding embeddings for the train and
# test splits — confirm the format and the directory they are resolved from.
embeddings:
  train_embeds: "train_embeds.npy"
  test_embeds: "test_embeds.npy"

# BERT model configuration
# NOTE(review): the key names look like Hugging Face tokenizer arguments
# (`max_length`, `truncation`, `padding`) — confirm how the loader uses them.
bert:
  model_name: "bert-base-uncased"
  max_length: 512
  truncation: true
  padding: "max_length"  # literal string value, not a reference to the key

# Graph construction parameters
# NOTE(review): presumably a k-nearest-neighbour graph built with `metric` as
# the similarity/distance measure — confirm against the graph-building code.
graph:
  k_neighbors: 3
  metric: "cosine"

# Model architecture parameters
model:
  hidden_dim: 64
  # The name `theta_dim` also appears as the `{theta_dim}` placeholder in
  # `output.predictions`.
  # NOTE(review): presumably that placeholder is filled from this value —
  # confirm.
  theta_dim: 16
  dropout: 0.3

# Training parameters
training:
  # The name `epochs` also appears as the `{epochs}` placeholder in the
  # `output` file-name templates.
  epochs: 300
  # Exponent literals carry an explicit decimal point on purpose: YAML 1.1
  # loaders (e.g. PyYAML) resolve a dot-less form such as `1e-3` as the
  # *string* "1e-3" rather than a float. `1.0e-3` is a float under both
  # YAML 1.1 and YAML 1.2 and has the same numeric value.
  learning_rate: 1.0e-3
  weight_decay: 1.0e-5

# Inference parameters
# Both values are currently identical to those in the `graph` section.
# NOTE(review): presumably they are meant to stay in sync with `graph` so
# neighbours are selected the same way at inference time — confirm.
inference:
  k_neighbors: 3
  metric: "cosine"

# Output file paths
# `{theta_dim}` and `{epochs}` are stored here as literal placeholder text.
# NOTE(review): presumably filled in by the consuming code from
# `model.theta_dim` and `training.epochs` — confirm.
# Only `predictions` embeds `{theta_dim}`; the remaining templated names vary
# by `{epochs}` alone, and `graph_metrics` has no placeholder at all.
output:
  graph_metrics: "graph_metrics.txt"
  predictions: "predicted_llm_performance_theta_{theta_dim}_ep_{epochs}.csv"
  a_train: "a_train_ep_{epochs}.csv"
  b_train: "b_train_ep_{epochs}.csv"
  theta: "theta_ep_{epochs}.csv"
  a_test: "a_test_ep_{epochs}.csv"
  b_test: "b_test_ep_{epochs}.csv"

# Device configuration
# NOTE(review): presumably `device_id` is the CUDA device index used when
# `use_cuda` is true — confirm, including what happens when CUDA is
# unavailable.
device:
  use_cuda: true
  device_id: 0

# Random seed
# NOTE(review): which random number generators this value seeds is not
# visible in this file — confirm in the loader.
random_seed: 42
