Datasets

InfoTokenizers/finewebedu-20B

966 downloads

['language:en''size_categories:10M<n<100M''format:parquet'

Mxode/Chinese-Reasoning-Distil-Data

966 downloads

['task_categories:text-generation''language:zh''license:cc-by-sa-4.0'

fineinstructions-pretraining/nemotron_actual_1T

966 downloads

['size_categories:100M<n<1B''format:parquet''modality:text'

taln-ls2n/kpbiomed

965 downloads

['task_categories:text-generation''annotations_creators:unknown''language_creators:unknown'

orgcatorg/multilingual

965 downloads

['size_categories:10M<n<100M''format:parquet''modality:text'

sailplane/SWE-bench_Lite_filtered

965 downloads

['region:us']

tokyotech-llm/lmsys-chat-1m-synth

965 downloads

['task_categories:text-generation''source_datasets:lmsys-chat-1m''language:ja'

bramtoula/vtab_eurosat

964 downloads

['size_categories:10K<n<100K''format:parquet''modality:image'

John6666/model-mirror-5

964 downloads

['language:en''license:other''region:us'

barc0/200k_HEAVY_gpt4o-description-gpt4omini-code_generated_problems

964 downloads

['task_categories:text-generation''language:en''license:mit'
Previous

Page 414 of 1635

Next