Spaces:

Duplicated from TheFinAI/Open-Greek-Financial-LLM-Leaderboard

TheFinAI
/

Open-FinLLM-Leaderboard

Running

App Files Files Community

Open-FinLLM-Leaderboard / frontend /src /pages /LeaderboardPage /components /Leaderboard /hooks /useDataUtils.js

mirageco's picture

fix logo display

fc869a4 16 days ago

history blame contribute delete

12.4 kB

	import { useMemo } from "react";
	import {
	looksLikeRegex,
	parseSearchQuery,
	getValueByPath,
	} from "../utils/searchUtils";
	import { ALLOWED_MODELS, isModelAllowed } from "../constants/allowedModels";

	// 硬编码数据集
	const HARDCODED_SCORES = {
	vision: {
	"GPT-4o": 55.54, "o3-Mini": 0.00, "Deepseek-V3": 0.00, "meta-llama/Llama-4-Scout-17B-16E-Instruct": 16.27,
	"meta-llama/Llama-3.1-70B-Instruct": 0.00, "google/gemma-3-4b-it": 14.97, "google/gemma-3-27b-it": 25.57,
	"Qwen/Qwen2.5-32B-Instruct": 0.00, "Qwen/Qwen2.5-Omni-7B": 24.97, "TheFinAI/finma-7b-full": 0.00,
	"Duxiaoman-DI/Llama3.1-XuanYuan-FinX1-Preview": 0.00, "cyberagent/DeepSeek-R1-Distill-Qwen-32B-Japanese": 0.00,
	"TheFinAI/FinMA-ES-Bilingual": 0.00, "TheFinAI/plutus-8B-instruct": 0.00, "Qwen-VL-MAX": 18.47,
	"LLaVA-1.6 Vicuna-13B": 19.77, "Deepseek-VL-7B-Chat": 19.10, "Whisper-V3": 0.00, "Qwen2-Audio-7B": 0.00,
	"Qwen2-Audio-7B-Instruct": 0.00, "SALMONN-7B": 0.00, "SALMONN-13B": 0.00
	},
	audio: {
	"GPT-4o": 55.56, "o3-Mini": 0.00, "Deepseek-V3": 0.00, "meta-llama/Llama-4-Scout-17B-16E-Instruct": 0.00,
	"meta-llama/Llama-3.1-70B-Instruct": 0.00, "google/gemma-3-4b-it": 0.00, "google/gemma-3-27b-it": 0.00,
	"Qwen/Qwen2.5-32B-Instruct": 0.00, "Qwen/Qwen2.5-Omni-7B": 48.22, "TheFinAI/finma-7b-full": 0.00,
	"Duxiaoman-DI/Llama3.1-XuanYuan-FinX1-Preview": 0.00, "cyberagent/DeepSeek-R1-Distill-Qwen-32B-Japanese": 0.00,
	"TheFinAI/FinMA-ES-Bilingual": 0.00, "TheFinAI/plutus-8B-instruct": 0.00, "Qwen-VL-MAX": 0.00,
	"LLaVA-1.6 Vicuna-13B": 0.00, "Deepseek-VL-7B-Chat": 0.00, "Whisper-V3": 51.58, "Qwen2-Audio-7B": 48.02,
	"Qwen2-Audio-7B-Instruct": 50.06, "SALMONN-7B": 24.24, "SALMONN-13B": 24.59
	},
	english: {
	"GPT-4o": 42.18, "o3-Mini": 20.20, "Deepseek-V3": 18.04, "meta-llama/Llama-4-Scout-17B-16E-Instruct": 24.16,
	"meta-llama/Llama-3.1-70B-Instruct": 38.71, "google/gemma-3-4b-it": 16.13, "google/gemma-3-27b-it": 17.19,
	"Qwen/Qwen2.5-32B-Instruct": 32.01, "Qwen/Qwen2.5-Omni-7B": 24.99, "TheFinAI/finma-7b-full": 28.89,
	"Duxiaoman-DI/Llama3.1-XuanYuan-FinX1-Preview": 29.39, "cyberagent/DeepSeek-R1-Distill-Qwen-32B-Japanese": 26.38,
	"TheFinAI/FinMA-ES-Bilingual": 31.72, "TheFinAI/plutus-8B-instruct": 27.82, "Qwen-VL-MAX": 0.00,
	"LLaVA-1.6 Vicuna-13B": 0.00, "Deepseek-VL-7B-Chat": 0.00, "Whisper-V3": 0.00, "Qwen2-Audio-7B": 0.00,
	"Qwen2-Audio-7B-Instruct": 0.00, "SALMONN-7B": 0.00, "SALMONN-13B": 0.00
	},
	chinese: {
	"GPT-4o": 60.34, "o3-Mini": 0.00, "Deepseek-V3": 60.94, "meta-llama/Llama-4-Scout-17B-16E-Instruct": 64.51,
	"meta-llama/Llama-3.1-70B-Instruct": 56.74, "google/gemma-3-4b-it": 26.23, "google/gemma-3-27b-it": 26.24,
	"Qwen/Qwen2.5-32B-Instruct": 56.62, "Qwen/Qwen2.5-Omni-7B": 53.09, "TheFinAI/finma-7b-full": 24.42,
	"Duxiaoman-DI/Llama3.1-XuanYuan-FinX1-Preview": 23.04, "cyberagent/DeepSeek-R1-Distill-Qwen-32B-Japanese": 13.18,
	"TheFinAI/FinMA-ES-Bilingual": 21.50, "TheFinAI/plutus-8B-instruct": 31.04, "Qwen-VL-MAX": 0.00,
	"LLaVA-1.6 Vicuna-13B": 0.00, "Deepseek-VL-7B-Chat": 0.00, "Whisper-V3": 0.00, "Qwen2-Audio-7B": 0.00,
	"Qwen2-Audio-7B-Instruct": 0.00, "SALMONN-7B": 0.00, "SALMONN-13B": 0.00
	},
	japanese: {
	"GPT-4o": 0.00, "o3-Mini": 0.00, "Deepseek-V3": 0.00, "meta-llama/Llama-4-Scout-17B-16E-Instruct": 48.43,
	"meta-llama/Llama-3.1-70B-Instruct": 32.17, "google/gemma-3-4b-it": 8.98, "google/gemma-3-27b-it": 23.96,
	"Qwen/Qwen2.5-32B-Instruct": 4.54, "Qwen/Qwen2.5-Omni-7B": 44.35, "TheFinAI/finma-7b-full": 46.94,
	"Duxiaoman-DI/Llama3.1-XuanYuan-FinX1-Preview": 47.59, "cyberagent/DeepSeek-R1-Distill-Qwen-32B-Japanese": 23.96,
	"TheFinAI/FinMA-ES-Bilingual": 57.36, "TheFinAI/plutus-8B-instruct": 34.62, "Qwen-VL-MAX": 0.00,
	"LLaVA-1.6 Vicuna-13B": 0.00, "Deepseek-VL-7B-Chat": 0.00, "Whisper-V3": 0.00, "Qwen2-Audio-7B": 0.00,
	"Qwen2-Audio-7B-Instruct": 0.00, "SALMONN-7B": 0.00, "SALMONN-13B": 0.00
	},
	spanish: {
	"GPT-4o": 29.80, "o3-Mini": 4.53, "Deepseek-V3": 25.49, "meta-llama/Llama-4-Scout-17B-16E-Instruct": 47.90,
	"meta-llama/Llama-3.1-70B-Instruct": 37.84, "google/gemma-3-4b-it": 27.66, "google/gemma-3-27b-it": 27.77,
	"Qwen/Qwen2.5-32B-Instruct": 37.47, "Qwen/Qwen2.5-Omni-7B": 39.16, "TheFinAI/finma-7b-full": 27.04,
	"Duxiaoman-DI/Llama3.1-XuanYuan-FinX1-Preview": 42.86, "cyberagent/DeepSeek-R1-Distill-Qwen-32B-Japanese": 28.01,
	"TheFinAI/FinMA-ES-Bilingual": 38.69, "TheFinAI/plutus-8B-instruct": 40.16, "Qwen-VL-MAX": 0.00,
	"LLaVA-1.6 Vicuna-13B": 0.00, "Deepseek-VL-7B-Chat": 0.00, "Whisper-V3": 0.00, "Qwen2-Audio-7B": 0.00,
	"Qwen2-Audio-7B-Instruct": 0.00, "SALMONN-7B": 0.00, "SALMONN-13B": 0.00
	},
	greek: {
	"GPT-4o": 43.04, "o3-Mini": 9.48, "Deepseek-V3": 39.07, "meta-llama/Llama-4-Scout-17B-16E-Instruct": 48.95,
	"meta-llama/Llama-3.1-70B-Instruct": 43.60, "google/gemma-3-4b-it": 15.45, "google/gemma-3-27b-it": 15.44,
	"Qwen/Qwen2.5-32B-Instruct": 44.32, "Qwen/Qwen2.5-Omni-7B": 23.45, "TheFinAI/finma-7b-full": 17.93,
	"Duxiaoman-DI/Llama3.1-XuanYuan-FinX1-Preview": 29.49, "cyberagent/DeepSeek-R1-Distill-Qwen-32B-Japanese": 20.91,
	"TheFinAI/FinMA-ES-Bilingual": 15.47, "TheFinAI/plutus-8B-instruct": 60.19, "Qwen-VL-MAX": 0.00,
	"LLaVA-1.6 Vicuna-13B": 0.00, "Deepseek-VL-7B-Chat": 0.00, "Whisper-V3": 0.00, "Qwen2-Audio-7B": 0.00,
	"Qwen2-Audio-7B-Instruct": 0.00, "SALMONN-7B": 0.00, "SALMONN-13B": 0.00
	},
	bilingual: {
	"GPT-4o": 92.29, "o3-Mini": 90.13, "Deepseek-V3": 86.26, "meta-llama/Llama-4-Scout-17B-16E-Instruct": 89.17,
	"meta-llama/Llama-3.1-70B-Instruct": 92.13, "google/gemma-3-4b-it": 35.92, "google/gemma-3-27b-it": 35.92,
	"Qwen/Qwen2.5-32B-Instruct": 92.29, "Qwen/Qwen2.5-Omni-7B": 91.80, "TheFinAI/finma-7b-full": 69.24,
	"Duxiaoman-DI/Llama3.1-XuanYuan-FinX1-Preview": 91.60, "cyberagent/DeepSeek-R1-Distill-Qwen-32B-Japanese": 71.81,
	"TheFinAI/FinMA-ES-Bilingual": 66.57, "TheFinAI/plutus-8B-instruct": 91.59, "Qwen-VL-MAX": 0.00,
	"LLaVA-1.6 Vicuna-13B": 0.00, "Deepseek-VL-7B-Chat": 0.00, "Whisper-V3": 0.00, "Qwen2-Audio-7B": 0.00,
	"Qwen2-Audio-7B-Instruct": 0.00, "SALMONN-7B": 0.00, "SALMONN-13B": 0.00
	},
	multilingual: {
	"GPT-4o": 6.53, "o3-Mini": 7.80, "Deepseek-V3": 36.99, "meta-llama/Llama-4-Scout-17B-16E-Instruct": 13.52,
	"meta-llama/Llama-3.1-70B-Instruct": 21.97, "google/gemma-3-4b-it": 0.00, "google/gemma-3-27b-it": 0.00,
	"Qwen/Qwen2.5-32B-Instruct": 18.48, "Qwen/Qwen2.5-Omni-7B": 16.29, "TheFinAI/finma-7b-full": 3.10,
	"Duxiaoman-DI/Llama3.1-XuanYuan-FinX1-Preview": 1.76, "cyberagent/DeepSeek-R1-Distill-Qwen-32B-Japanese": 10.25,
	"TheFinAI/FinMA-ES-Bilingual": 0.35, "TheFinAI/plutus-8B-instruct": 7.24, "Qwen-VL-MAX": 0.00,
	"LLaVA-1.6 Vicuna-13B": 0.00, "Deepseek-VL-7B-Chat": 0.00, "Whisper-V3": 0.00, "Qwen2-Audio-7B": 0.00,
	"Qwen2-Audio-7B-Instruct": 0.00, "SALMONN-7B": 0.00, "SALMONN-13B": 0.00
	}
	};

	// Calculate min/max averages
	export const useAverageRange = (data) => {
	return useMemo(() => {
	const averages = data.map((item) => item.model.average_score);
	return {
	minAverage: Math.min(...averages),
	maxAverage: Math.max(...averages),
	};
	}, [data]);
	};

	// Generate colors for scores
	export const useColorGenerator = (minAverage, maxAverage) => {
	return useMemo(() => {
	const colorCache = new Map();
	return (value) => {
	const cached = colorCache.get(value);
	if (cached) return cached;

	const normalizedValue = (value - minAverage) / (maxAverage - minAverage);
	const red = Math.round(255 * (1 - normalizedValue) * 1);
	const green = Math.round(255 * normalizedValue) * 1;
	// const color = `rgba(${red}, ${green}, 0, 1)`;
	const color = `rgba(${red}, 0, ${green}, 1)`;
	colorCache.set(value, color);
	return color;
	};
	}, [minAverage, maxAverage]);
	};

	// Process data with boolean standardization
	export const useProcessedData = (data, averageMode, visibleColumns) => {
	return useMemo(() => {
	// 直接使用硬编码数据创建模型列表
	const modelList = [];

	// 从HARDCODED_SCORES中获取所有模型名称
	const modelNames = new Set();
	Object.values(HARDCODED_SCORES).forEach(categoryData => {
	Object.entries(categoryData).forEach(([modelName, score]) => {
	// 添加所有模型，不管分数是否为0
	modelNames.add(modelName);
	});
	});

	// 为每个模型创建条目
	Array.from(modelNames).forEach((modelName, index) => {
	// 创建硬编码评估数据
	const hardcodedEvaluations = {
	vision_average: getHardcodedScore(modelName, 'vision'),
	audio_average: getHardcodedScore(modelName, 'audio'),
	english_average: getHardcodedScore(modelName, 'english'),
	chinese_average: getHardcodedScore(modelName, 'chinese'),
	japanese_average: getHardcodedScore(modelName, 'japanese'),
	spanish_average: getHardcodedScore(modelName, 'spanish'),
	greek_average: getHardcodedScore(modelName, 'greek'),
	bilingual_average: getHardcodedScore(modelName, 'bilingual'),
	multilingual_average: getHardcodedScore(modelName, 'multilingual')
	};

	// 计算总平均分（包含分数为0的类别）
	const scores = Object.values(hardcodedEvaluations).filter(score => score !== null);
	const averageScore = scores.length > 0 ? scores.reduce((a, b) => a + b, 0) / scores.length : null;

	// 创建模型数据
	modelList.push({
	id: `model-${index}`,
	model: {
	name: modelName,
	average_score: averageScore,
	type: "chat", // 统一设为chat类型
	},
	evaluations: hardcodedEvaluations,
	features: {
	is_moe: false,
	is_flagged: false,
	is_highlighted_by_maintainer: false,
	is_merged: false,
	is_not_available_on_hub: false,
	},
	metadata: {
	submission_date: new Date().toISOString(),
	},
	isMissing: false,
	});
	});

	// 根据平均分排序
	modelList.sort((a, b) => {
	if (a.model.average_score === null && b.model.average_score === null)
	return 0;
	if (a.model.average_score === null) return 1;
	if (b.model.average_score === null) return -1;
	return b.model.average_score - a.model.average_score;
	});

	// 添加排名
	return modelList.map((item, index) => ({
	...item,
	static_rank: index + 1,
	}));
	}, [data, averageMode, visibleColumns]);
	};

	// 辅助函数：从硬编码数据中获取分数
	function getHardcodedScore(modelName, category) {
	if (!HARDCODED_SCORES[category]) return null;

	// 尝试精确匹配
	if (HARDCODED_SCORES[category][modelName] !== undefined) {
	return HARDCODED_SCORES[category][modelName];
	}

	// 尝试部分匹配
	for (const key in HARDCODED_SCORES[category]) {
	if (modelName.includes(key) \|\| key.includes(modelName)) {
	return HARDCODED_SCORES[category][key];
	}
	}

	return null;
	}

	// Common filtering logic
	export const useFilteredData = (
	processedData,
	selectedPrecisions,
	selectedTypes,
	paramsRange,
	searchValue,
	selectedBooleanFilters,
	rankingMode,
	pinnedModels = [],
	isOfficialProviderActive = false
	) => {
	return useMemo(() => {
	// 由于使用的是硬编码数据，这里直接返回所有数据而不进行过滤
	return processedData.map((item, index) => ({
	...item,
	dynamic_rank: index + 1,
	rank: rankingMode === "static" ? item.static_rank : index + 1,
	isPinned: pinnedModels.includes(item.id),
	}));
	}, [
	processedData,
	rankingMode,
	pinnedModels,
	]);
	};

	// Column visibility management
	export const useColumnVisibility = (visibleColumns = []) => {
	// Create secure visibility object
	const columnVisibility = useMemo(() => {
	// Check visible columns
	const safeVisibleColumns = Array.isArray(visibleColumns)
	? visibleColumns
	: [];

	const visibility = {};
	try {
	safeVisibleColumns.forEach((columnKey) => {
	if (typeof columnKey === "string") {
	visibility[columnKey] = true;
	}
	});
	} catch (error) {
	console.warn("Error in useColumnVisibility:", error);
	}
	return visibility;
	}, [visibleColumns]);

	return columnVisibility;
	};