Datasets
ranWang/UN_Sitemap_Multilingual_HTML_Corpus
323 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
MakiPan/hagrid-hand-enc-250k
323 downloads
['size_categories:100K<n<1M''format:parquet''modality:image'
sproos/SlimPajama-6B-embedded
323 downloads
['size_categories:1M<n<10M''format:parquet''modality:text'
hf-vision/chest-xray-pneumonia
323 downloads
['license:cc-by-4.0''size_categories:1K<n<10K''format:parquet'
nomic-ai/nomic-bert-2048-pretraining-data
323 downloads
['size_categories:1M<n<10M''format:parquet''library:datasets'
HiTZ/Multilingual-Medical-Corpus
323 downloads
['language:en''language:es''language:fr'
astro21/coco-caption-train-split-10k
323 downloads
['size_categories:1K<n<10K''format:parquet''modality:image'
jingjietan/essays-big5
323 downloads
['task_categories:text-classification''language:en''license:apache-2.0'
neuralmagic/mmlu_fr
323 downloads
['size_categories:10K<n<100K''format:parquet''modality:text'
ai4bharat/NPTEL
323 downloads
['multilinguality:multilingual''language:as''language:bn'