Yeyito committed on
Commit
91ac6f1
·
1 Parent(s): e87b0e5

current eval

Browse files
Files changed (1) hide show
  1. data/code_eval_board.csv +2 -0
data/code_eval_board.csv CHANGED
@@ -11,4 +11,6 @@ T,Models,ARC,HellaSwag,MMLU,TruthfulQA,Winogrande,GSM8K,Reference Model
11
  🔶,openchat/openchat_3.5,0.13,0.13,0.23,0.45,0.0,0.97,mistralai/Mistral-7B-v0.1
12
  🔶,meta-math/MetaMath-Mistral-7B,0.08,0.1,0.17,0.42,0.0,0.97,mistralai/Mistral-7B-v0.1
13
  🔶,teknium/OpenHermes-2.5-Mistral-7B,0.07,0.13,0.23,0.39,0.0,0.96,mistralai/Mistral-7B-v0.1
 
 
14
 
 
11
  🔶,openchat/openchat_3.5,0.13,0.13,0.23,0.45,0.0,0.97,mistralai/Mistral-7B-v0.1
12
  🔶,meta-math/MetaMath-Mistral-7B,0.08,0.1,0.17,0.42,0.0,0.97,mistralai/Mistral-7B-v0.1
13
  🔶,teknium/OpenHermes-2.5-Mistral-7B,0.07,0.13,0.23,0.39,0.0,0.96,mistralai/Mistral-7B-v0.1
14
+ 🔶,microsoft/Orca-2-7b,0.88,0.8,0.77,0.91,0.0,1.0,mistralai/Mistral-7B-v0.1
15
+ 🔶,WizardLM/WizardMath-7B-V1.1,0.1,0.11,0.21,0.4,0.0,0.99,mistralai/Mistral-7B-v0.1
16