Datasets
nhagar/hplt2.0_cleaned_urls
310 downloads
['license:cc0-1.0''size_categories:10B<n<100B''format:parquet'
SwayStar123/cc12m_imagenet21k_invae-latents
310 downloads
['size_categories:10M<n<100M''format:parquet''modality:text'
m-a-p/CMMMU
309 downloads
['size_categories:10K<n<100K''format:parquet''modality:image'
wenknow/reddit_dataset_209
309 downloads
['task_categories:text-classification''task_categories:token-classification''task_categories:question-answering'
Mechanistic-Anomaly-Detection/llama3-short-generic-backdoor-dataset
309 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
TwinkStart/llama-questions
309 downloads
['size_categories:n<1K''format:parquet''modality:audio'
thainq107/iwslt2015-en-vi
309 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
EGLima/pen_task_v4
309 downloads
['task_categories:robotics''license:apache-2.0''size_categories:10K<n<100K'
apayan/so100_dice4
309 downloads
['task_categories:robotics''license:apache-2.0''size_categories:10K<n<100K'
andresnowak/MNLP_M2_mcqa_dataset
309 downloads
['task_categories:question-answering''task_categories:text-generation''size_categories:100K<n<1M'