Delete model_performance.csv
Browse files- model_performance.csv +0 -19
model_performance.csv
DELETED
@@ -1,19 +0,0 @@
|
|
1 |
-
Model,Type,finqa,dm-simplong,xbrl-math
|
2 |
-
4o,instruction-tuned,72.49,60.0,72.22
|
3 |
-
o1,instruction-tuned,49.07,56.0,74.44
|
4 |
-
o3-mini,instruction-tuned,60.87,59.0,76.67
|
5 |
-
v3,instruction-tuned,73.2,53.0,76.67
|
6 |
-
r1,instruction-tuned,65.13,53.0,86.67
|
7 |
-
deepseek-70b,instruction-tuned,66.73,53.0,86.67
|
8 |
-
llama3-70B-instruct,instruction-tuned,58.92,41.0,56.67
|
9 |
-
llama31-70B-instruct,instruction-tuned,63.18,48.0,63.33
|
10 |
-
llama33-70B-instruct,instruction-tuned,68.15,54.0,70.0
|
11 |
-
deepseek-32b,instruction-tuned,65.48,55.0,84.44
|
12 |
-
deepseek-14b,instruction-tuned,63.27,44.0,84.44
|
13 |
-
deepseek-8b,instruction-tuned,45.96,33.0,81.11
|
14 |
-
llama3 8b-instruct,instruction-tuned,41.97,29.0,48.89
|
15 |
-
llama31 8b-instruct,instruction-tuned,54.13,34.0,62.22
|
16 |
-
Qwen2.5-32B-Instruct,instruction-tuned,,,
|
17 |
-
Qwen2.5-72B-Instruct,instruction-tuned,73.38,59.0,67.78
|
18 |
-
Qwen2.5-72B-Instruct-math,instruction-tuned,69.74,42.0,83.33
|
19 |
-
Fino1-8B,instruction-tuned,60.87,40.0,82.22
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|