Update README.md
Browse files
README.md
CHANGED
|
@@ -39,8 +39,6 @@ datasets:
|
|
| 39 |
- Rapidata/text-2-video-human-preferences-pika2.2
|
| 40 |
- derek-thomas/ScienceQA
|
| 41 |
- mteb/scifact
|
| 42 |
-
- Kaeyze/computer-science-synthetic-dataset
|
| 43 |
-
- ChristophSchuhmann/basic-math-problems-with-step-by-step-solutions
|
| 44 |
- bh2821/LightNovel5000
|
| 45 |
- ibm-nasa-geospatial/Landslide4sense
|
| 46 |
- hiyouga/geometry3k
|
|
@@ -100,6 +98,74 @@ datasets:
|
|
| 100 |
- divaroffical/real_estate_ads
|
| 101 |
- LLM360/MegaMath
|
| 102 |
- manycore-research/SpatialLM-Testset
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 103 |
language:
|
| 104 |
- fr
|
| 105 |
- en
|
|
@@ -107,6 +173,7 @@ language:
|
|
| 107 |
- es
|
| 108 |
- ja
|
| 109 |
- zh
|
|
|
|
| 110 |
- ga
|
| 111 |
metrics:
|
| 112 |
- accuracy
|
|
|
|
| 39 |
- Rapidata/text-2-video-human-preferences-pika2.2
|
| 40 |
- derek-thomas/ScienceQA
|
| 41 |
- mteb/scifact
|
|
|
|
|
|
|
| 42 |
- bh2821/LightNovel5000
|
| 43 |
- ibm-nasa-geospatial/Landslide4sense
|
| 44 |
- hiyouga/geometry3k
|
|
|
|
| 98 |
- divaroffical/real_estate_ads
|
| 99 |
- LLM360/MegaMath
|
| 100 |
- manycore-research/SpatialLM-Testset
|
| 101 |
+
- vincentmin/eli5_rlhf_explainlikeim5
|
| 102 |
+
- nvidia/OpenMathReasoning
|
| 103 |
+
- PrimeIntellect/INTELLECT-2-RL-Dataset
|
| 104 |
+
- openbmb/Ultra-FineWeb
|
| 105 |
+
- nvidia/Nemotron-CrossThink
|
| 106 |
+
- Intelligent-Internet/ii-agent_gaia-benchmark_validation
|
| 107 |
+
- Intelligent-Internet/II-Thought-RL-v0
|
| 108 |
+
- Intelligent-Internet/OpenAI-HealthBench-II-Medical-8B-GPT-4.1
|
| 109 |
+
- sailor2/sea-internet
|
| 110 |
+
- Intelligent-Internet/pd12m
|
| 111 |
+
- Intelligent-Internet/wikipedia_en
|
| 112 |
+
- SciKnowOrg/ontolearner-web_and_internet
|
| 113 |
+
- Guillem21/yahoo_computers_internet_dataset
|
| 114 |
+
- Intelligent-Internet/II-Thought-RL-v0-Math-50K
|
| 115 |
+
- Anthropic/llm_global_opinions
|
| 116 |
+
- timchen0618/OpinionQA
|
| 117 |
+
- forcemultiplier/supreme_court_opinions_corpus_pdfwebAug24
|
| 118 |
+
- HiTZ/Multilingual-Opinion-Target-Extraction
|
| 119 |
+
- Insects/ContextSpeech
|
| 120 |
+
- bdotloh/empathetic-dialogues-contexts
|
| 121 |
+
- Salesforce/ContextualBench
|
| 122 |
+
- kothasuhas/nys-ethics-opinions
|
| 123 |
+
- socialtrait/opinion_qa_panel_W49_train-sample_100-responses
|
| 124 |
+
- JesusAura999/BELIEFS_OPINIONS_DATASET_QWEN_FORMAT
|
| 125 |
+
- ScratchThePlan/novel_cn_roleplay_dataset_liars_lips_fall_apart_in_love
|
| 126 |
+
- arthurcolle/open-computer-using-agent
|
| 127 |
+
- agentlans/literary-reasoning
|
| 128 |
+
- tiny-agents/tiny-agents
|
| 129 |
+
- agents-course/course-certificates-of-excellence
|
| 130 |
+
- MiniMaxAI/TTS-Multilingual-Test-Set
|
| 131 |
+
- osunlp/Multimodal-Mind2Web
|
| 132 |
+
- Mxode/Chinese-Multimodal-Instruct
|
| 133 |
+
- omegalabsinc/omega-multimodal
|
| 134 |
+
- princeton-nlp/SWE-bench_Multimodal
|
| 135 |
+
- DMindAI/DMind_Benchmark
|
| 136 |
+
- xDAN-Vision/xDAN-Agentic-DeepSearch-example
|
| 137 |
+
- enosislabs/deepsearch-mini-shareGPT
|
| 138 |
+
- enosislabs/deepsearch-llama-finetune
|
| 139 |
+
- Jady-Zhao/DeepSea-Biological-Data
|
| 140 |
+
- HP6669/BGI_Deepsea_CLIP
|
| 141 |
+
- amazon-agi/SIFT-50M
|
| 142 |
+
- agibot-world/GenieSimAssets
|
| 143 |
+
- agibot-world/AgiBotWorld-Beta
|
| 144 |
+
- arcprize/arc_agi_2_human_testing
|
| 145 |
+
- hails/agieval-gaokao-chemistry
|
| 146 |
+
- agibot-world/AgiBotDigitalWorld
|
| 147 |
+
- InnerI/Universal-Christ-Consciousness-Dataset
|
| 148 |
+
- groWsoul/ERROR_Insights_on_Consciousness_and_Psychology
|
| 149 |
+
- Guilherme34/a-theory-of-consciouness-experiment
|
| 150 |
+
- ConsciousEnergies/JRsLENRBibliography
|
| 151 |
+
- AI-Ethics/Consciousness_Knowledge_Graph_Exploration
|
| 152 |
+
- dreamerdeo/finqa
|
| 153 |
+
- dataset-org/dream
|
| 154 |
+
- AgenTao/cerebro
|
| 155 |
+
- cerebras/Synth-Long-SFT32K
|
| 156 |
+
- bwittmann/syn-cerebral-octa-seg
|
| 157 |
+
- open-llm-leaderboard-old/details_cerebras__Cerebras-GPT-111M
|
| 158 |
+
- Rapidata/text-2-video-human-preferences-veo2
|
| 159 |
+
- SAAgent/MCPWorld
|
| 160 |
+
- mcp-course/images
|
| 161 |
+
- DeepNLP/mcp-servers
|
| 162 |
+
- ai2-adapt-dev/synth-mcp-test
|
| 163 |
+
- ai2-adapt-dev/multi_step_reasoning_tool_use_mcp_4omini
|
| 164 |
+
- ai2-adapt-dev/mcp-server-dump-smithery
|
| 165 |
+
- maiia-bocharova/mcphrasy_test_skill_tok
|
| 166 |
+
- tobySolutions/mcp-agent
|
| 167 |
+
- jerin1982/mcp_info_data
|
| 168 |
+
- vitaliy-sharandin/pollution-absolute-variation-co2
|
| 169 |
language:
|
| 170 |
- fr
|
| 171 |
- en
|
|
|
|
| 173 |
- es
|
| 174 |
- ja
|
| 175 |
- zh
|
| 176 |
+
- ak
|
| 177 |
- ga
|
| 178 |
metrics:
|
| 179 |
- accuracy
|