Datasets
wikimedia/structured-wikipedia
1412 downloads
['task_ids:language-modeling''task_ids:masked-language-modeling''language:en'
Xkev/LLaVA-CoT-100k
1412 downloads
['task_categories:visual-question-answering''language:en''license:apache-2.0'
Liu-Hy/GenoTEX
1412 downloads
['task_categories:text-generation''task_categories:text2text-generation''task_categories:table-question-answering'
Skywork/Skywork-OR1-RL-Data
1411 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
EleutherAI/advanced_ai_risk
1410 downloads
['region:us']
facebook/natural_reasoning
1410 downloads
['task_categories:text-generation''language:en''license:cc-by-nc-4.0'
Biocollab/SCREEN
1409 downloads
['region:us']
ShoukanLabs/OpenNiji-Dataset-Aesthetic-Finetune-0-15K
1408 downloads
['size_categories:10K<n<100K''format:parquet''modality:image'
KwaiVGI/MultiCamVideo-Dataset
1407 downloads
['license:apache-2.0''arxiv:2503.11647''region:us']
fracapuano/brainformer-e-large
1406 downloads
['size_categories:1K<n<10K''format:arrow''modality:tabular'