Datasets
bertram-gilfoyle/CC-MAIN-2023-40-raw
1572 downloads
['size_categories:10M<n<100M''format:parquet''modality:text'
stemdataset/STEM
1572 downloads
['language:en''license:apache-2.0''size_categories:1M<n<10M'
recursal/Europarl-Translation-Instruct
1572 downloads
['task_categories:text-generation''task_categories:fill-mask''task_ids:language-modeling'
WhissleAI/indicvoices_pa_tagged_transcripts
1572 downloads
['task_categories:automatic-speech-recognition''annotations_creators:other''language_creators:other'
jon-tow/okapi_hellaswag
1571 downloads
['language:ar''language:bn''language:ca'
james-1111/x_dataset_030237
1570 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
Alphonsce/cif-dataset
1570 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
liuhuanjim013/kinetics400
1570 downloads
['size_categories:10K<n<100K''format:parquet''modality:tabular'
distil-whisper/librispeech_asr-noise
1568 downloads
['size_categories:100K<n<1M''format:parquet''modality:audio'
asahi417/seamless-align-deA-enA.speaker-embedding.xlsr-2b
1567 downloads
['size_categories:100K<n<1M''format:parquet''modality:tabular'