# Training split configuration for TextToMusicDataset.
train:
  # Dotted path of the dataset class; presumably consumed by Hydra-style
  # instantiation, with the remaining keys passed as arguments (confirm).
  _target_: 'data_module.dataset.TextToMusicDataset'

  # Input manifests (JSON Lines, judging by the extension) and the directory
  # containing the audio files. NOTE(review): absolute, machine-specific path.
  base_audio_path: '/cpfs02/shared/speechllm/data/MillionSongDataset/files/MSD/songs/'
  content: 'data/msd/all/caption.jsonl'
  audio: 'data/msd/all/audio.jsonl'

  # `${...}` values are interpolations; `sample_rate` and
  # `instruction_embedding` are not defined in this section.
  target_sr: '${sample_rate}'
  task_instruction: '${instruction_embedding}'

  use_h5_cache: false
  # Presumably a per-clip cap in seconds; verify against the dataset class.
  max_duration: 10.0
# Validation split configuration for TextToMusicDataset.
val:
  # Dotted path of the dataset class; presumably consumed by Hydra-style
  # instantiation, with the remaining keys passed as arguments (confirm).
  _target_: 'data_module.dataset.TextToMusicDataset'

  # Input manifests (JSON Lines, judging by the extension) and the directory
  # containing the audio files. NOTE(review): absolute, machine-specific path.
  base_audio_path: '/cpfs02/shared/speechllm/data/MillionSongDataset/files/MSD/songs/'
  content: 'data/msd/val/caption.jsonl'
  audio: 'data/msd/val/audio.jsonl'

  # `${...}` values are interpolations; `sample_rate`,
  # `instruction_embedding` and `max_val_samples` are not defined in this
  # section.
  target_sr: '${sample_rate}'
  task_instruction: '${instruction_embedding}'
  max_samples: '${max_val_samples}'

  use_h5_cache: false
  # Presumably a per-clip cap in seconds; verify against the dataset class.
  max_duration: 10.0
