# Defaults list: every entry has the form `datasets@<package>: <option>`.
# NOTE(review): this matches Hydra's `group@package: option` syntax, which
# would select `<option>` from the `datasets` config group and place it under
# the `<package>` key — confirm against the project's config loader.
# Entry order is kept as-is; presumably the loader composes entries in list
# order — verify before reordering.
defaults:
  - datasets@libritts: libritts
  - datasets@audiocaps: audiocaps
  - datasets@opencpop: opencpop
  - datasets@popcs: popcs
  - datasets@ttshq: ttshq
  - datasets@musdb: musdb
  - datasets@moises: moises
  - datasets@vggsound_clip: vggsound_clip
  - datasets@visual_sound_clip: visual_sound_clip
  # The next five option names contain `+`; the package key after `@` spells
  # the same name with `_` in its place (e.g. `vctk+wham` -> `vctk_wham`).
  - datasets@libritts_100_wham: libritts_100+wham
  - datasets@libritts_360_wham: libritts_360+wham
  - datasets@ljspeech_musan: ljspeech+musan
  - datasets@vctk_wham: vctk+wham
  - datasets@voicebank_demand: voicebank+demand
  - datasets@m4singer: m4singer
  - datasets@msd: msd
  - datasets@music_caps: music_caps
  - datasets@esc_audiosr: esc_audiosr
  - datasets@vctk_audiosr: vctk_audiosr