Datasets
emozilla/pg_books-tokenized-bos-eos-chunked-65536
300 downloads
['size_categories:10K<n<100K''format:parquet''library:datasets'
theblackcat102/llava-instruct-mix
300 downloads
['task_categories:visual-question-answering''language:en''license:cc-by-nc-4.0'
hezarai/parsynth-ocr-200k
300 downloads
['task_categories:image-to-image''language:fa''size_categories:100K<n<1M'
openbmb/UltraInteract_sft
300 downloads
['language:en''license:mit''size_categories:100K<n<1M'
Vi-VLM/Vista
300 downloads
['task_categories:visual-question-answering''language:vi''license:mit'
bitmind/flickr30k-stable-diffusion
300 downloads
['size_categories:10K<n<100K''format:parquet''modality:image'
gallen881/arxiv-physics
300 downloads
['license:mit''size_categories:10K<n<100K''format:parquet'
Reset23/the-stack-v2-blamed
300 downloads
['size_categories:1M<n<10M''format:parquet''modality:tabular'
yzhuang/Agentic-Long-Context-Understanding-QA
300 downloads
['task_categories:question-answering''task_categories:reinforcement-learning''language:en'
lerobot/libero_object_image
300 downloads
['task_categories:robotics''license:apache-2.0''size_categories:10K<n<100K'