Datasets
wmt/wmt20_mlqe_task1
420 downloads
['task_categories:translation''annotations_creators:expert-generated''annotations_creators:machine-generated'
ShoukanLabs/AniSpeech
420 downloads
['task_categories:text-to-speech''language:en''license:mit'
pourmand1376/asr-farsi-youtube-chunked-30-seconds
420 downloads
['task_categories:automatic-speech-recognition''language:fa''license:apache-2.0'
bertram-gilfoyle/CC-MAIN-2020-29-raw
420 downloads
['size_categories:10M<n<100M''format:parquet''modality:text'
SKNahin/open-large-bengali-asr-data
420 downloads
['task_categories:automatic-speech-recognition''language:bn''size_categories:1M<n<10M'
Salama1429/tarteel-ai-everyayah-Quran
418 downloads
['task_categories:automatic-speech-recognition''annotations_creators:expert-generated''language_creators:crowdsourced'
louisbrulenaudet/code-impots-annexe-ii
420 downloads
['task_categories:text-generation''task_categories:table-question-answering''task_categories:summarization'
text-machine-lab/vocab_filtered_dataset_22B
420 downloads
['size_categories:100M<n<1B''format:parquet''modality:text'
k-mktr/improved-flux-prompts
420 downloads
['task_categories:text-classification''language:en''license:mit'
mesolitica/Malaysian-Speech-Instructions
420 downloads
['language:ms''size_categories:100K<n<1M''format:parquet'