speech | en | -- | LibriSpeech | v12 | |
speech | en | -- | How2 | | |
speech | en | -- | Mozilla Common Voice | v11.0 | |
speech | en | -- | TED-LIUM | v2/v3 | |
speech | en | -- | VoxPopuli | | |
speech-to-text-parallel | en | all | MuST-C | v1.2/v2.0/v3.0 | (10) ar, zh, nl, fr, de, ja, fa, pt, ru, tr |
speech-to-text-parallel | en | all | CoVoST | v2 | (10) ar, zh, nl, fr, de, ja, fa, pt, ru, tr |
speech-to-text-parallel | en | all | Europarl-ST | v1.1 | (4) fr, de, pt, tr |
text-parallel | en | all | Europarl | v10 | (2) fr, de |
text-parallel | en | all | Europarl | v7 | (4) nl, fr, de, pt |
text-parallel | en | all | NewsCommentary | v16 | (8) ar, zh, nl, fr, de, ja, pt, ru |
text-parallel | en | all | OpenSubtitles | v2018 | (10) ar, zh, nl, fr, de, ja, fa, pt, ru, tr |
text-parallel | en | de | TED2020 | v1 | (1) de |
text-parallel | en | all | Tatoeba | v2022-03-03 | (10) ar, zh, nl, fr, de, ja, fa, pt, ru, tr |
text-parallel | en | de | ELRC-CORDIS_News | v1 | (1) de |