Spaces: Running on CPU Upgrade
title: Open CoT Leaderboard | |
emoji: 🥇 | |
colorFrom: red | |
colorTo: yellow | |
sdk: gradio | |
sdk_version: 4.36.0 | |
app_file: app.py | |
pinned: true | |
license: apache-2.0 | |
duplicated_from: logikon/open_cot_leaderboard | |
fullWidth: true | |
tags: | |
- leaderboard | |
- CoT | |
- chain-of-thought | |
short_description: Track, rank and evaluate open LLMs' CoT quality | |
models: | |
- 0-hero/Matter-0.2-7B-DPO | |
- 01-ai/Yi-1.5-34B-Chat | |
- 01-ai/Yi-1.5-9B | |
- 01-ai/Yi-1.5-9B-32K | |
- 01-ai/Yi-1.5-9B-Chat | |
- 01-ai/Yi-1.5-9B-Chat-16K | |
- 01-ai/Yi-34B | |
- 01-ai/Yi-34B-Chat | |
- 01-ai/Yi-6B | |
- BSC-LT/salamandra-7b-instruct | |
- ChavyvAkvar/habib-DPO-v3 | |
- CohereForAI/aya-23-35B | |
- CohereForAI/aya-23-8B | |
- CohereForAI/aya-expanse-32b | |
- CohereForAI/aya-expanse-8b | |
- CohereForAI/c4ai-command-r-plus-08-2024 | |
- DebateLabKIT/Llama-3.1-Argunaut-1-8B-SFT | |
- DebateLabKIT/Llama-3.1-Argunaut-1-8B-SPIN | |
- DebateLabKIT/Llama-3.3-Argunaut-1-70B-SFT | |
- DebateLabKIT/Llama-3.3-Argunaut-1-70B-SPIN | |
- Deci/DeciLM-7B | |
- Deci/DeciLM-7B-instruct | |
- HuggingFaceH4/zephyr-7b-beta | |
- HuggingFaceTB/SmolLM-1.7B-Instruct | |
- HuggingFaceTB/SmolLM-135M-Instruct | |
- HuggingFaceTB/SmolLM2-1.7B-Instruct | |
- Intel/neural-chat-7b-v3-1 | |
- Kukedlc/NeuralLLaMa-3-8b-DT-v0.1 | |
- Kukedlc/NeuralLLaMa-3-8b-ORPO-v0.3 | |
- Kukedlc/NeuralSynthesis-7b-v0.4-slerp | |
- LeroyDyer/Mixtral_AI_Chat_1.0 | |
- LeroyDyer/Mixtral_AI_CyberTron_DeepMind_III_UFT | |
- LeroyDyer/Mixtral_AI_Cyber_Boss | |
- Locutusque/Hercules-4.0-Mistral-v0.2-7B | |
- Locutusque/OpenCerebrum-1.0-7b-DPO | |
- NousResearch/Hermes-2-Pro-Mistral-7B | |
- NousResearch/Hermes-3-Llama-3.1-70B | |
- NousResearch/Nous-Hermes-llama-2-7b | |
- OpenBuddy/openbuddy-llama3-8b-v21.1-8k | |
- OpenBuddy/openbuddy-mistral2-7b-v20.2-32k | |
- OpenBuddy/openbuddy-yi1.5-9b-v21.1-32k | |
- OpenBuddy/openbuddy-zen-3b-v21.1-32k | |
- OpenBuddy/openbuddy-zen-3b-v21.2-32k | |
- Qwen/Qwen2-72B-Instruct | |
- Qwen/Qwen2-7B-Instruct | |
- Qwen/Qwen2.5-14B-Instruct | |
- Qwen/Qwen2.5-32B-Instruct | |
- Qwen/Qwen2.5-3B-Instruct | |
- Qwen/Qwen2.5-72B-Instruct | |
- Qwen/Qwen2.5-7B-Instruct | |
- Salesforce/LLaMA-3-8B-SFR-Iterative-DPO-R | |
- ai21labs/AI21-Jamba-1.5-Mini | |
- allenai/OLMo-7B-0724-Instruct-hf | |
- allenai/tulu-2-13b | |
- allenai/tulu-2-70b | |
- allenai/tulu-2-7b | |
- allenai/tulu-2-dpo-13b | |
- allenai/tulu-2-dpo-70b | |
- allenai/tulu-2-dpo-7b | |
- arcee-ai/Llama-3.1-SuperNova-Lite | |
- arcee-ai/SuperNova-Medius | |
- bunnycore/Mnemosyne-7B | |
- cognitivecomputations/Llama-3-8B-Instruct-abliterated-v2 | |
- cookinai/LlamaReflect-8B-CoT-safetensors | |
- databricks/dbrx-instruct | |
- databricks/dolly-v2-3b | |
- deepseek-ai/DeepSeek-R1-Distill-Llama-70B | |
- deepseek-ai/DeepSeek-R1-Distill-Llama-8B | |
- deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B | |
- deepseek-ai/DeepSeek-R1-Distill-Qwen-14B | |
- deepseek-ai/DeepSeek-R1-Distill-Qwen-32B | |
- deepseek-ai/DeepSeek-R1-Distill-Qwen-7B | |
- google/gemma-2-27b-it | |
- google/gemma-2-2b-it | |
- google/gemma-2-9b-it | |
- google/gemma-2b | |
- google/gemma-2b-it | |
- google/gemma-7b | |
- google/gemma-7b-it | |
- ibm/merlinite-7b | |
- ichigoberry/pandafish-2-7b-32k | |
- internlm/internlm2-7b | |
- internlm/internlm2-chat-20b | |
- internlm/internlm2-chat-7b | |
- internlm/internlm2-math-20b | |
- internlm/internlm2-math-7b | |
- meta-llama/Llama-2-13b-chat-hf | |
- meta-llama/Llama-2-13b-hf | |
- meta-llama/Llama-2-70b-chat-hf | |
- meta-llama/Llama-2-70b-hf | |
- meta-llama/Llama-2-7b-hf | |
- meta-llama/Llama-3.2-1B-Instruct | |
- meta-llama/Llama-3.2-3B-Instruct | |
- meta-llama/Meta-Llama-3-70B | |
- meta-llama/Meta-Llama-3-70B-Instruct | |
- meta-llama/Meta-Llama-3-8B | |
- meta-llama/Meta-Llama-3-8B-Instruct | |
- meta-llama/Meta-Llama-3.1-70B-Instruct | |
- meta-llama/Meta-Llama-3.1-8B-Instruct | |
- microsoft/Orca-2-13b | |
- microsoft/Orca-2-7b | |
- microsoft/Phi-3-medium-4k-instruct | |
- microsoft/Phi-3-mini-4k-instruct | |
- microsoft/Phi-3-small-8k-instruct | |
- microsoft/Phi-3.5-MoE-instruct | |
- microsoft/Phi-3.5-mini-instruct | |
- microsoft/phi-2 | |
- mistralai/Ministral-8B-Instruct-2410 | |
- mistralai/Mistral-7B-Instruct-v0.2 | |
- mistralai/Mistral-7B-Instruct-v0.3 | |
- mistralai/Mistral-7B-v0.1 | |
- mistralai/Mistral-Nemo-Instruct-2407 | |
- mistralai/Mistral-Small-Instruct-2409 | |
- mistralai/Mixtral-8x22B-Instruct-v0.1 | |
- mistralai/Mixtral-8x7B-Instruct-v0.1 | |
- mistralai/Mixtral-8x7B-v0.1 | |
- mlabonne/AlphaMonarch-7B | |
- mlabonne/Daredevil-8B-abliterated | |
- nvidia/Llama-3.1-Nemotron-70B-Instruct-HF | |
- openbmb/Eurus-70b-sft | |
- openbmb/Eurus-7b-kto | |
- openchat/openchat-3.5-0106 | |
- princeton-nlp/gemma-2-9b-it-SimPO | |
- teknium/OpenHermes-2.5-Mistral-7B | |
- terrycraddock/Reflection-Llama-3.1-8B | |
- unsloth/Phi-3.5-mini-instruct | |
- upstage/SOLAR-10.7B-Instruct-v1.0 | |
- upstage/SOLAR-10.7B-v1.0 | |
- vicgalle/Configurable-Hermes-2-Pro-Llama-3-8B | |
- vicgalle/Configurable-Janus-7B | |
- vicgalle/Configurable-Yi-1.5-9B-Chat | |
- wandb/gemma-2b-zephyr-dpo | |
- wenbopan/Faro-Yi-9B-DPO | |