# Chinese ASR test sets (AISHELL and AISHELL-2 test manifests).
#
# Every entry in this list uses the same three keys:
#   name     - label for the test set
#   manifest - absolute path to the set's .jsonl.gz manifest file
#   lang     - short language code for the set (zh, en, ja, ...)
- name: aishell
  manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/aishell/aishell_test.jsonl.gz
  lang: zh
- name: aishell2
  manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/aishell2/aishell2_test.jsonl.gz
  lang: zh

# English ASR test sets: the LibriSpeech test-clean and test-other manifests.
- name: librispeech-test-clean
  manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/librispeech/librispeech_test-clean.jsonl.gz
  lang: en
- name: librispeech-test-other
  manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/librispeech/librispeech_test-other.jsonl.gz
  lang: en

# FLEURS test sets, one entry per language.
# The manifest directory and file name use the FLEURS locale (e.g. cmn_hans_cn,
# es_419, pt_br), while `lang` carries the short language code (zh, es, pt).
# NOTE(review): fleurs-zh-CN is the only entry here whose name includes a
# region suffix; the other names use the bare language code.
- name: fleurs-zh-CN
  manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/fleurs/cmn_hans_cn/fleurs-cmn_hans_cn_test.jsonl.gz
  lang: zh
- name: fleurs-en
  manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/fleurs/en_us/fleurs-en_us_test.jsonl.gz
  lang: en
- name: fleurs-ja
  manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/fleurs/ja_jp/fleurs-ja_jp_test.jsonl.gz
  lang: ja
- name: fleurs-ko
  manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/fleurs/ko_kr/fleurs-ko_kr_test.jsonl.gz
  lang: ko
- name: fleurs-ru
  manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/fleurs/ru_ru/fleurs-ru_ru_test.jsonl.gz
  lang: ru
- name: fleurs-vi
  manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/fleurs/vi_vn/fleurs-vi_vn_test.jsonl.gz
  lang: vi
- name: fleurs-id
  manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/fleurs/id_id/fleurs-id_id_test.jsonl.gz
  lang: id
- name: fleurs-fr
  manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/fleurs/fr_fr/fleurs-fr_fr_test.jsonl.gz
  lang: fr
- name: fleurs-es
  manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/fleurs/es_419/fleurs-es_419_test.jsonl.gz
  lang: es
- name: fleurs-pt
  manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/fleurs/pt_br/fleurs-pt_br_test.jsonl.gz
  lang: pt

# ------------------ S2TT translation data ------------------
# S2TT (speech-to-text translation) test sets from CoVoST v2; every pair
# listed here translates into English (X -> en).
# `lang` is set to the source-language code of each pair (e.g. zh for zh-CN_en).
# NOTE(review): these *_test_cuts manifests sit under st_train_data/ rather
# than a test-data directory - presumably still the test split; confirm.
- name: CoVoSTv2_zh-en
  manifest: /apdcephfs_cq12/share_302080740/data/st_train_data/raw/covost2/speech2text_format/zh-CN_en/zh-CN_en_test_cuts.jsonl.gz
  lang: zh
- name: CoVoSTv2_ja-en
  manifest: /apdcephfs_cq12/share_302080740/data/st_train_data/raw/covost2/speech2text_format/ja_en/ja_en_test_cuts.jsonl.gz
  lang: ja
- name: CoVoSTv2_ru-en
  manifest: /apdcephfs_cq12/share_302080740/data/st_train_data/raw/covost2/speech2text_format/ru_en/ru_en_test_cuts.jsonl.gz
  lang: ru
- name: CoVoSTv2_id-en
  manifest: /apdcephfs_cq12/share_302080740/data/st_train_data/raw/covost2/speech2text_format/id_en/id_en_test_cuts.jsonl.gz
  lang: id
- name: CoVoSTv2_fr-en
  manifest: /apdcephfs_cq12/share_302080740/data/st_train_data/raw/covost2/speech2text_format/fr_en/fr_en_test_cuts.jsonl.gz
  lang: fr
- name: CoVoSTv2_es-en
  manifest: /apdcephfs_cq12/share_302080740/data/st_train_data/raw/covost2/speech2text_format/es_en/es_en_test_cuts.jsonl.gz
  lang: es
- name: CoVoSTv2_pt-en
  manifest: /apdcephfs_cq12/share_302080740/data/st_train_data/raw/covost2/speech2text_format/pt_en/pt_en_test_cuts.jsonl.gz
  lang: pt