Datasets
Multimodal-Fatima/StanfordCars_test
254 downloads
['size_categories:1K<n<10K''format:parquet''modality:image'
BAAI/CMMU
254 downloads
['task_categories:visual-question-answering''language:zh''license:apache-2.0'
FBK-TeV/WildBe
254 downloads
['task_categories:object-detection''license:cc-by-nc-4.0''size_categories:1K<n<10K'
hf-internal-testing/document-visual-retrieval-test
254 downloads
['language:en''license:mit''size_categories:n<1K'
CreatlV/cova-coco-v2
253 downloads
['size_categories:1K<n<10K''format:parquet''modality:image'
dinhanhx/crossmodal-3600
253 downloads
['task_categories:image-to-text''task_ids:image-captioning''source_datasets:wikipedia'
BangumiBase/spiceandwolf
253 downloads
['license:mit''size_categories:1K<n<10K''modality:image'
ccmusic-database/Guzheng_Tech99
253 downloads
['task_categories:audio-classification''language:zh''language:en'
noahshinn/cifar100_2_to_100_constant_size_dataset
253 downloads
['size_categories:10K<n<100K''format:parquet''modality:image'
pumb-ai/synthetic-cyrillic-large
253 downloads
['task_categories:image-to-text''language:uk''language:ru'