
# Script that every run of this sweep executes.
program: ./foundation_main.py

# Grid search: exhaustively try every combination of the values listed
# under `parameters`.
method: grid

# Objective used to compare runs: the metric named best_val_AUC
# (validation AUC), where higher is better.
metric:
  name: best_val_AUC
  goal: maximize

# Search space. Each key lists its candidate values under `values`; a key with
# a single candidate is effectively a constant and does not widen the grid.
parameters:
  # Training settings (all single-valued here)
  num_epochs:
    values: [5]
  batch_size:
    values: [128]
  # NOTE(review): patience (30) is larger than num_epochs (5). If patience is
  # an early-stopping window counted in epochs, it can never trigger with
  # these values - confirm this is intended.
  patience:
    values: [30]
  seed:
    values: [0]

  # Model architecture
  # probe_model is a swept axis (two candidates); the other keys in this
  # section are single-valued.
  # NOTE(review): "Vit" is capitalised differently from the "ACT-ViT" directory
  # used in base_pre_processed_data_dir - confirm both names match what the
  # program accepts.
  probe_model:
    values: ["ACT-Vit-foundation", "ACT-MLP-foundation"]
  hidden_dim:
    values: [128]
  num_layers:
    values: [3]
  heads:
    values: [4]
  dropout:
    values: [0.3]
  pool:
    values: ["cls"]

  # Optimization settings
  # Both keys are swept axes (two candidates each).
  # The learning rates are written in plain decimal form on purpose: YAML 1.1
  # loaders such as PyYAML only resolve exponent notation as a float when the
  # mantissa contains a dot, so a bare 1e-3 would be loaded as the string
  # "1e-3" instead of a number.
  lr:
    values: [0.001, 0.0005]
  # NOTE(review): 10 is four orders of magnitude above the other candidate -
  # confirm it is intended and not a typo for a smaller value.
  weight_decay:
    values: [0.001, 10]

  # Dataset and input settings
  # Each dataset parameter has a single candidate: one string holding a
  # space-separated list of entries (they appear to be <model>:<dataset>
  # pairs). The folded block scalar (>-) joins the lines below with single
  # spaces and drops the trailing newline, so the loaded value is one
  # single-line string.
  train_dataset:
    values:
      - >-
        Qwen/Qwen2.5-7B-Instruct:imdb
        Qwen/Qwen2.5-7B-Instruct:hotpotqa
        Qwen/Qwen2.5-7B-Instruct:triviaqa
        Qwen/Qwen2.5-7B-Instruct:movies
        Qwen/Qwen2.5-7B-Instruct:hotpotqa_with_context
        mistralai/Mistral-7B-Instruct-v0.2:imdb
        mistralai/Mistral-7B-Instruct-v0.2:hotpotqa
        mistralai/Mistral-7B-Instruct-v0.2:triviaqa
        mistralai/Mistral-7B-Instruct-v0.2:movies
        mistralai/Mistral-7B-Instruct-v0.2:hotpotqa_with_context
        meta-llama/Meta-Llama-3-8B-Instruct:imdb
        meta-llama/Meta-Llama-3-8B-Instruct:hotpotqa
        meta-llama/Meta-Llama-3-8B-Instruct:triviaqa
        meta-llama/Meta-Llama-3-8B-Instruct:movies
        meta-llama/Meta-Llama-3-8B-Instruct:hotpotqa_with_context
  test_dataset:
    values:
      - >-
        Qwen/Qwen2.5-7B-Instruct:imdb_test
        Qwen/Qwen2.5-7B-Instruct:hotpotqa_test
        Qwen/Qwen2.5-7B-Instruct:triviaqa_test
        Qwen/Qwen2.5-7B-Instruct:movies_test
        Qwen/Qwen2.5-7B-Instruct:hotpotqa_with_context_test
        mistralai/Mistral-7B-Instruct-v0.2:imdb_test
        mistralai/Mistral-7B-Instruct-v0.2:hotpotqa_test
        mistralai/Mistral-7B-Instruct-v0.2:triviaqa_test
        mistralai/Mistral-7B-Instruct-v0.2:movies_test
        mistralai/Mistral-7B-Instruct-v0.2:hotpotqa_with_context_test
        meta-llama/Meta-Llama-3-8B-Instruct:imdb_test
        meta-llama/Meta-Llama-3-8B-Instruct:hotpotqa_test
        meta-llama/Meta-Llama-3-8B-Instruct:triviaqa_test
        meta-llama/Meta-Llama-3-8B-Instruct:movies_test
        meta-llama/Meta-Llama-3-8B-Instruct:hotpotqa_with_context_test
  # Input selection and data-loading options (all single-valued).
  input_type:
    values: ["activations"]
  input_output_type:
    values: ["output"]
  num_workers:
    values: [4]
  # Integer 1, not a YAML boolean - presumably read as an on/off flag; verify
  # against the program's argument parsing.
  pin_memory:
    values: [1]
  down_sample_strategy:
    values: ["pool"]
  # Swept axis (five candidates). Each entry is a string such as "(1, 2)",
  # not a YAML list; the quotes make it explicit that the parentheses and
  # comma are literal text.
  patch_size:
    values:
      - "(1, 1)"
      - "(1, 2)"
      - "(1, 4)"
      - "(2, 1)"
      - "(4, 1)"
  # Cross-validation
  # Only fold index 0 is listed, so presumably a single fold out of num_folds
  # is run per configuration - confirm against the program.
  num_folds:
    values: [5]
  fold_to_run:
    values: [0]

  # Paths
  # NOTE(review): machine-specific absolute path; presumably it must exist on
  # whichever machine executes the program.
  base_pre_processed_data_dir:
    values: ["/home/user/ACT-ViT/pre_processed_data"]

  # Hardware settings
  cuda_idx:
    values: [0]
