Datasets
gfissore/arxiv-abstracts-2021
581 downloads
['task_categories:summarization''task_categories:text-retrieval''task_categories:text2text-generation'
datablations/c4-filter
581 downloads
['size_categories:100M<n<1B''format:parquet''modality:tabular'
TimKoornstra/financial-tweets-sentiment
581 downloads
['task_categories:text-classification''language:en''license:mit'
maywell/korean_textbooks
581 downloads
['language:ko''license:apache-2.0''size_categories:1M<n<10M'
allganize/RAG-Evaluation-Dataset-KO
581 downloads
['language:ko''license:mit''size_categories:n<1K'
FreedomIntelligence/medical-o1-verifiable-problem
581 downloads
['task_categories:question-answering''task_categories:text-generation''language:en'
Winboy/c8-h8
581 downloads
['size_categories:n<1K''format:json''modality:text'
codeparrot/codeparrot-train-more-filtering
580 downloads
['size_categories:1M<n<10M''format:parquet''modality:tabular'
CoIR-Retrieval/CodeSearchNet-ccr-go-queries-corpus
580 downloads
['size_categories:100K<n<1M''format:parquet''modality:text'
BangumiBase/ningenfushinnoboukenshatachigasekaiwosukuuyoudesu
580 downloads
['license:mit''size_categories:1K<n<10K''modality:image'