{
    "model_config": "anonymous/legato-small",
    "pretrained_model": null,

    "dataset_path": "datasets/PDMX-Synth",
    "mini_val_file": "datasets/mini_val.json",
    "mini_test_file": "datasets/mini_test.json",
    "dummy_data": false,

    "output_dir": "outputs/legato-small-lr-3e-4/",
    "remove_unused_columns": false,

    "run_name": "legato-small-lr-3e-4",
    "do_train": true,
    "do_eval": true,
    "do_predict": false,
    "dataloader_num_workers": 8,
    "dataloader_prefetch_factor": 2,
    "ddp_find_unused_parameters": false,
    "bf16": true,
    "num_train_epochs": 10,
    "learning_rate": 3e-4,
    "per_device_train_batch_size": 2,
    "gradient_accumulation_steps": 4,
    "warmup_ratio": 0.03,
    "logging_steps": 100,
    "save_strategy": "steps",
    "save_steps": 5000,
    "per_device_eval_batch_size": 1,
    "eval_strategy": "steps",
    "eval_steps": 5000,
    "metric_for_best_model": "eval_SER",
    "greater_is_better": false,
    "load_best_model_at_end": true,
    "bf16_full_eval": true,
    "predict_with_generate": true,
    "generation_max_length": 2048,
    "generation_num_beams": 3,
    "torch_compile": true,
    "report_to": "wandb",
    "restore_callback_states_from_checkpoint": true,
    "log_level": "info"
}