Datasets
bot-yaya/undl_es2en_translation
363 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
recursal/reprocessed_singapore_national_speech_corpus
363 downloads
['task_categories:text-generation''task_categories:text-classification''task_categories:automatic-speech-recognition'
bigdata-pw/playground-prompts
363 downloads
['task_categories:text-to-image''language:en''license:odc-by'
Spawning/PD3M
363 downloads
['language:en''license:cdla-permissive-2.0''size_categories:1M<n<10M'
JetBrains-Research/PandasPlotBench
363 downloads
['license:apache-2.0''size_categories:n<1K''format:parquet'
SherryXTChen/InstructCLIP-InstructPix2Pix-Data
363 downloads
['task_categories:image-to-image''task_categories:text-to-image''language:en'
nomic-ai/VisRAG-Ret-Train-Synthetic-data
363 downloads
['size_categories:100K<n<1M''format:parquet''modality:image'
mlfoundations-dev/openthoughts3_math_300k
363 downloads
['size_categories:100K<n<1M''format:parquet''modality:tabular'
ivanjaenm/hierarchical_QA_wordnet
363 downloads
['size_categories:100K<n<1M''format:parquet''modality:tabular'
castorini/afriberta-corpus
362 downloads
['task_categories:text-generation''task_ids:language-modeling''language:om'