# Test-set manifest list: a top-level sequence with one entry per language.
# Each entry has two keys:
#   manifest - absolute path to a `.jsonl.gz` manifest file
#   lang     - two-letter language code for that manifest
# The zh entry points into an `aishell` directory; every other entry points
# into `multilingual/commonvoice/cv-corpus-20.0/<lang>/`.
# NOTE(review): the `_5k` suffix on some file names presumably marks a
# size-limited subset -- confirm against whatever produced the manifests.
# Values are single-quoted so they always load as strings; an unquoted code
# such as `no` would be read as a boolean by YAML 1.1 parsers.

# ------------------ Chinese data ------------------
- manifest: '/apdcephfs_cq12/share_302080740/data/asr_test_data/aishell/aishell_test_fix.jsonl.gz'
  lang: 'zh'

# ------------------ Japanese data ------------------
- manifest: '/apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/ja/ja_test_cuts_5k.jsonl.gz'
  lang: 'ja'

# ------------------ Korean data ------------------
- manifest: '/apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/ko/ko_test_cuts.jsonl.gz'
  lang: 'ko'

# ------------------ English data ------------------
- manifest: '/apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/en/en_test_cuts_5k.jsonl.gz'
  lang: 'en'

# ------------------ French data ------------------
- manifest: '/apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/fr/fr_test_cuts_5k.jsonl.gz'
  lang: 'fr'

# ------------------ Spanish data ------------------
- manifest: '/apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/es/es_test_cuts_5k.jsonl.gz'
  lang: 'es'

# ------------------ Portuguese data ------------------
- manifest: '/apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/pt/pt_test_cuts_5k.jsonl.gz'
  lang: 'pt'

# ------------------ Vietnamese data ------------------
- manifest: '/apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/vi/vi_test_cuts.jsonl.gz'
  lang: 'vi'

# ------------------ Indonesian data ------------------
- manifest: '/apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/id/id_test_cuts.jsonl.gz'
  lang: 'id'

# ------------------ Russian data ------------------
- manifest: '/apdcephfs_cq12/share_302080740/data/asr_test_data/multilingual/commonvoice/cv-corpus-20.0/ru/ru_test_cuts_5k.jsonl.gz'
  lang: 'ru'