BlinkCode_leaderboard / leader_board.json
yajuniverse's picture
Create leader_board.json
7cbf279 verified
{
"Rank": {
"0": 1,
"1": 2,
"2": 3,
"3": 4,
"4": 5,
"5": 6,
"6": 7,
"7": 8,
"8": 9,
"9": 10,
"10": 11,
"11": 12,
"12": 13,
"13": 14,
"14": 15
},
"Model Type": {
"0": "api",
"1": "api",
"2": "api",
"3": "api",
"4": "api",
"5": "api",
"6": "api",
"7": "api",
"8": "OpenSource",
"9": "api",
"10": "OpenSource",
"11": "OpenSource",
"12": "OpenSource",
"13": "OpenSource",
"14": "OpenSource"
},
"Model Size": {
"0": "Unknown",
"1": "Unknown",
"2": "Unknown",
"3": "Unknown",
"4": "Unknown",
"5": "Unknown",
"6": "Unknown",
"7": "Unknown",
"8": "4B-10B",
"9": "Unknown",
"10": "4B-10B",
"11": "10B-20B",
"12": "4B-10B",
"13": "4B-10B",
"14": "<4B"
},
"Model": {
"0": "Claude3.5-Sonnet",
"1": "GPT-4o(0513)",
"2": "GPT-4-turbo(0409)",
"3": "Claude-3-Sonnet",
"4": "Claude-3-Opus",
"5": "GPT-4v(1106)",
"6": "Claude-3-Haiku",
"7": "Gemini-Pro-Vision",
"8": "InternLM-XComposer2-VL-7B",
"9": "Qwen-VL-Max",
"10": "LLaVA-v1.6-Mistral-7B-HF",
"11": "LLaVA-v1.6-Vicuna-13B-HF",
"12": "IDEFICS2-8B",
"13": "Fuyu-8B",
"14": "Paligemma-3B-Mix-224"
},
"Params (B)": {
"0": "",
"1": "",
"2": "",
"3": "",
"4": "",
"5": "",
"6": "",
"7": "",
"8": "7B",
"9": "",
"10": "7.57B",
"11": "13.4B",
"12": "8.4B",
"13": "9.41B",
"14": "2.92B"
},
"Supports multiple images": {
"0": true,
"1": true,
"2": true,
"3": true,
"4": true,
"5": true,
"6": true,
"7": true,
"8": false,
"9": true,
"10": false,
"11": true,
"12": true,
"13": false,
"14": false
},
"Avg Score\u2b06\ufe0f": {
"0": 70.7,
"1": 67.06,
"2": 54.58,
"3": 43.6,
"4": 41.99,
"5": 37.74,
"6": 36.42,
"7": 35.96,
"8": 18.71,
"9": 12.89,
"10": 11.13,
"11": 6.7,
"12": 2.08,
"13": 0.0,
"14": 0.0
},
"Avg Score\u2b50": {
"0": 71.37,
"1": 68.53,
"2": 57.97,
"3": 45.15,
"4": 42.88,
"5": 46.44,
"6": 33.94,
"7": 36.56,
"8": 19.7,
"9": 12.53,
"10": 11.72,
"11": 5.35,
"12": 2.0,
"13": 0.0,
"14": 0.0
},
"HumanEval-V": {
"0": 78.33,
"1": 75.83,
"2": 76.67,
"3": 41.67,
"4": 52.5,
"5": 78.33,
"6": 43.33,
"7": 46.96,
"8": 15.0,
"9": 20.83,
"10": 6.67,
"11": 8.33,
"12": 5.0,
"13": 0.0,
"14": 0.0
},
"HumanEval-V\u2b50": {
"0": 84.17,
"1": 85.83,
"2": 85.83,
"3": 55.83,
"4": 61.67,
"5": 78.33,
"6": 45.0,
"7": 49.57,
"8": 20.83,
"9": 22.5,
"10": 9.17,
"11": 8.33,
"12": 4.17,
"13": 0.0,
"14": 0.0
},
"MBPP-V": {
"0": 60.83,
"1": 60.0,
"2": 60.83,
"3": 48.33,
"4": 57.5,
"5": 55.83,
"6": 49.17,
"7": 42.74,
"8": 29.17,
"9": 18.33,
"10": 20.83,
"11": 13.33,
"12": 5.0,
"13": 0.0,
"14": 0.0
},
"MBPP-V\u2b50": {
"0": 60.0,
"1": 60.83,
"2": 60.83,
"3": 47.5,
"4": 54.17,
"5": 59.17,
"6": 45.0,
"7": 47.86,
"8": 31.67,
"9": 20.0,
"10": 20.83,
"11": 15.0,
"12": 4.17,
"13": 0.0,
"14": 0.0
},
"GSM8K-V": {
"0": 92.98,
"1": 93.86,
"2": 92.98,
"3": 82.46,
"4": 55.26,
"5": 94.74,
"6": 47.37,
"7": 67.54,
"8": 51.75,
"9": 34.21,
"10": 4.39,
"11": 3.51,
"12": 1.75,
"13": 0.0,
"14": 0.0
},
"GSM8K-V\u2b50": {
"0": 92.11,
"1": 92.98,
"2": 92.98,
"3": 79.82,
"4": 49.12,
"5": 94.74,
"6": 55.26,
"7": 63.16,
"8": 51.75,
"9": 39.47,
"10": 4.39,
"11": 3.51,
"12": 1.75,
"13": 0.0,
"14": 0.0
},
"MATH-V": {
"0": 53.85,
"1": 53.85,
"2": 50.55,
"3": 29.67,
"4": 18.68,
"5": 39.56,
"6": 10.99,
"7": 14.29,
"8": 8.79,
"9": 4.4,
"10": 4.4,
"11": 6.59,
"12": 1.1,
"13": 0.0,
"14": 0.0
},
"MATH-V\u2b50": {
"0": 56.04,
"1": 56.04,
"2": 52.75,
"3": 26.37,
"4": 18.68,
"5": 40.66,
"6": 15.38,
"7": 13.19,
"8": 9.89,
"9": 2.2,
"10": 4.44,
"11": 6.59,
"12": 2.2,
"13": 0.0,
"14": 0.0
},
"VP": {
"0": 61.54,
"1": 74.36,
"2": 2.56,
"3": 35.9,
"4": 46.15,
"5": 18.8,
"6": 47.86,
"7": 29.06,
"8": 0.85,
"9": 1.74,
"10": 17.95,
"11": 0.0,
"12": 0.0,
"13": 0.0,
"14": 0.0
},
"VP\u2b50": {
"0": 50.43,
"1": 67.52,
"2": 18.8,
"3": 37.61,
"4": 50.43,
"5": 49.57,
"6": 15.38,
"7": 29.06,
"8": 0.0,
"9": 2.65,
"10": 20.51,
"11": 0.0,
"12": 0.0,
"13": 0.0,
"14": 0.0
},
"Matplotlib": {
"0": 53.41,
"1": 46.14,
"2": 41.28,
"3": 23.18,
"4": 19.55,
"5": 4.77,
"6": 18.86,
"7": 29.55,
"8": 6.59,
"9": 2.05,
"10": 3.18,
"11": 3.41,
"12": 1.36,
"13": 0.0,
"14": 0.0
},
"Matplotlib\u2b50": {
"0": 56.36,
"1": 54.09,
"2": 48.85,
"3": 26.36,
"4": 21.36,
"5": 10.0,
"6": 23.18,
"7": 29.17,
"8": 6.82,
"9": 0.0,
"10": 2.5,
"11": 0.0,
"12": 0.68,
"13": 0.0,
"14": 0.0
},
"SVG": {
"0": 89.81,
"1": 56.84,
"2": 44.05,
"3": 33.49,
"4": 25.71,
"5": 3.3,
"6": 32.31,
"7": 25.71,
"8": 19.34,
"9": 9.43,
"10": 9.43,
"11": 4.01,
"12": 3.3,
"13": 0.0,
"14": 0.0
},
"SVG\u2b50": {
"0": 87.26,
"1": 59.43,
"2": 43.1,
"3": 32.78,
"4": 21.93,
"5": 12.74,
"6": 31.37,
"7": 24.76,
"8": 21.23,
"9": 7.55,
"10": 8.25,
"11": 4.72,
"12": 3.54,
"13": 0.0,
"14": 0.0
},
"TikZ": {
"0": 54.47,
"1": 54.5,
"2": 40.75,
"3": 16.75,
"4": 19.75,
"5": 10.5,
"6": 9.0,
"7": 9.5,
"8": 1.0,
"9": 0.0,
"10": 0.75,
"11": 1.0,
"12": 0.0,
"13": 0.0,
"14": 0.0
},
"TikZ\u2b50": {
"0": 65.26,
"1": 52.5,
"2": 39.25,
"3": 20.75,
"4": 23.97,
"5": 32.0,
"6": 12.0,
"7": 7.0,
"8": 1.5,
"9": 0.0,
"10": 1.75,
"11": 2.0,
"12": 0.25,
"13": 0.0,
"14": 0.0
},
"Webpage": {
"0": 91.12,
"1": 88.12,
"2": 81.56,
"3": 80.99,
"4": 82.79,
"5": 33.81,
"6": 68.85,
"7": 58.26,
"8": 35.86,
"9": 25.0,
"10": 32.58,
"11": 20.08,
"12": 1.23,
"13": 0.0,
"14": 0.0
},
"Webpage\u2b50": {
"0": 90.7,
"1": 87.5,
"2": 79.3,
"3": 79.34,
"4": 84.63,
"5": 40.78,
"6": 62.91,
"7": 65.32,
"8": 33.61,
"9": 18.39,
"10": 33.61,
"11": 7.99,
"12": 1.23,
"13": 0.0,
"14": 0.0
}
}