Datasets
BangumiBase/theidolmastercinderellagirlsu149
418 downloads
['license:mit''size_categories:1K<n<10K''modality:image'
catherinearnett/monolingual-tokenizer-data
421 downloads
['source_datasets:oscar-corpus/OSCAR-2301''license:cc0-1.0''size_categories:100M<n<1B'
NoahEJ/fineweb-sample-100BT_over-2048-tokens-subset-split
421 downloads
['size_categories:1M<n<10M''format:parquet''modality:tabular'
Asap7772/d1shs0ap-easy-hintgen-qwen3-4b-lr1e6
421 downloads
['size_categories:10K<n<100K''format:parquet''modality:tabular'
pzxszbry/HO-Cap-Dataset
421 downloads
['language:en''license:cc-by-4.0''size_categories:n<1K'
helven/flock-1
421 downloads
['size_categories:n<1K''format:json''modality:text'
wmt/wmt20_mlqe_task1
420 downloads
['task_categories:translation''annotations_creators:expert-generated''annotations_creators:machine-generated'
sayakpaul/ucf101-subset
420 downloads
['license:apache-2.0''size_categories:n<1K''format:webdataset'
keremberke/hard-hat-detection
420 downloads
['task_categories:object-detection''size_categories:10K<n<100K''modality:image'
ShoukanLabs/AniSpeech
420 downloads
['task_categories:text-to-speech''language:en''license:mit'