Datasets
dalle-mini/wit
662 downloads
['size_categories:1M<n<10M''format:parquet''modality:image'
wenge-research/yayi2_pretrain_data
662 downloads
['language:zh''language:en''license:apache-2.0'
iDRAMALab/iDRAMA-scored-2024
662 downloads
['source_datasets:original''license:cc-by-nc-sa-4.0''size_categories:10M<n<100M'
EleutherAI/SmolLM2-135M-20B
662 downloads
['size_categories:10M<n<100M''format:parquet''modality:text'
MedRAG/wikipedia
661 downloads
['task_categories:question-answering''language:en''size_categories:1M<n<10M'
rootsautomation/websrc
661 downloads
['task_categories:question-answering''language:en''license:mit'
internlm/Lean-Workbook
661 downloads
['language:en''license:apache-2.0''size_categories:10K<n<100K'
CoIR-Retrieval/codefeedback-st-queries-corpus
661 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
BangumiBase/kuroshitsujikishukugakkouhen
661 downloads
['license:mit''size_categories:1K<n<10K''modality:image'
BAAI/IndustryCorpus2_current_affairs_government_administration
661 downloads
['size_categories:10M<n<100M''format:parquet''modality:tabular'