Datasets
CoIR-Retrieval/CodeSearchNet-ccr-python-queries-corpus
605 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
0x-YuAN/bbc-news-fkl
605 downloads
['size_categories:1K<n<10K''format:parquet''modality:tabular'
Zellic/all-ethereum-contracts
605 downloads
['language:en''size_categories:n<1K''format:imagefolder'
ShirohAO/tuxun
605 downloads
['language:en''size_categories:n<1K''format:csv'
drkvcsstvn/smearshare_allocation_activity_fast
605 downloads
['size_categories:1K<n<10K''format:parquet''modality:text'
BangumiBase/masamunekunnorevenge
604 downloads
['license:mit''size_categories:1K<n<10K''modality:image'
princeton-nlp/HELMET
604 downloads
['size_categories:n<1K''format:webdataset''modality:text'
OpenCoder-LLM/RefineCode-code-corpus-meta
604 downloads
['license:mit''size_categories:100M<n<1B''format:parquet'
Curiousfox/NRP_NIE04B_Hokkien_dataset
604 downloads
['task_categories:automatic-speech-recognition''size_categories:10K<n<100K''region:us']
ling99/OCRBench_v2
604 downloads
['license:mit''size_categories:10K<n<100K''format:parquet'