# ASR test manifests: one list entry per language, each giving a `manifest`
# path (a `.jsonl.gz` file) and a `lang` code.
# NOTE(review): the `_5k` suffix on some file names presumably marks a
# 5k-cut subset of the test split — confirm against the data preparation.
# NOTE(review): entries in this section have no `name` key, unlike the S2TT
# entries further down — confirm the consumer does not require one.
# ------------------ Chinese data (AISHELL) ------------------
- manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/aishell/aishell_test.jsonl.gz
  lang: zh
# ------------------ Japanese data (Common Voice 20.0) ------------------
- manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/ja/ja_test_cuts_5k.jsonl.gz
  lang: ja
# ------------------ Korean data (Common Voice 20.0) ------------------
- manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/ko/ko_test_cuts.jsonl.gz
  lang: ko
# ------------------ English data (Common Voice 20.0) ------------------
- manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/en/en_test_cuts_5k.jsonl.gz
  lang: en
# ------------------ French data (Common Voice 20.0) ------------------
- manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/fr/fr_test_cuts_5k.jsonl.gz
  lang: fr
# ------------------ Spanish data (Common Voice 20.0) ------------------
- manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/es/es_test_cuts_5k.jsonl.gz
  lang: es
# ------------------ Portuguese data (Common Voice 20.0) ------------------
- manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/pt/pt_test_cuts_5k.jsonl.gz
  lang: pt
# ------------------ Vietnamese data (Common Voice 20.0) ------------------
- manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/vi/vi_test_cuts.jsonl.gz
  lang: vi
# ------------------ Indonesian data (Common Voice 20.0) ------------------
- manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/id/id_test_cuts.jsonl.gz
  lang: id
# ------------------ Russian data (Common Voice 20.0) ------------------
- manifest: /apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/ru/ru_test_cuts_5k.jsonl.gz
  lang: ru
# ------------------ S2TT (speech-to-text translation) data ------------------
# CoVoST v2 test manifests, all translating into English. Each entry carries
# a `name` of the form CoVoSTv2_<src>-en, and its `lang` value matches the
# <src> code in that name.
# NOTE(review): these paths sit under `st_train_data/` although the files are
# `*_test_cuts` — presumably just the storage layout; confirm.
- name: CoVoSTv2_zh-en
  manifest: /apdcephfs_cq12/share_302080740/data/st_train_data/raw/covost2/speech2text_format/zh-CN_en/zh-CN_en_test_cuts.jsonl.gz
  lang: zh
- name: CoVoSTv2_ja-en
  manifest: /apdcephfs_cq12/share_302080740/data/st_train_data/raw/covost2/speech2text_format/ja_en/ja_en_test_cuts.jsonl.gz
  lang: ja
- name: CoVoSTv2_ru-en
  manifest: /apdcephfs_cq12/share_302080740/data/st_train_data/raw/covost2/speech2text_format/ru_en/ru_en_test_cuts.jsonl.gz
  lang: ru
- name: CoVoSTv2_id-en
  manifest: /apdcephfs_cq12/share_302080740/data/st_train_data/raw/covost2/speech2text_format/id_en/id_en_test_cuts.jsonl.gz
  lang: id
- name: CoVoSTv2_fr-en
  manifest: /apdcephfs_cq12/share_302080740/data/st_train_data/raw/covost2/speech2text_format/fr_en/fr_en_test_cuts.jsonl.gz
  lang: fr
- name: CoVoSTv2_es-en
  manifest: /apdcephfs_cq12/share_302080740/data/st_train_data/raw/covost2/speech2text_format/es_en/es_en_test_cuts.jsonl.gz
  lang: es
- name: CoVoSTv2_pt-en
  manifest: /apdcephfs_cq12/share_302080740/data/st_train_data/raw/covost2/speech2text_format/pt_en/pt_en_test_cuts.jsonl.gz
  lang: pt