import pandas as pd
import gradio as gr

# Columns each input CSV must contain. pandas only appends the "_1"/"_2"
# suffixes to columns present in BOTH frames, so a column missing from one
# file would otherwise surface later as an opaque KeyError.
_REQUIRED_COLUMNS = (
    "SourceText",
    "UUID",
    "WhisperText",
    "WordErrorRate",
    "CharacterErrorRate",
)


def compare_csv_files(
    file1: str = "fish-speech-1.5.csv",
    file2: str = "fish-speech-1.4.csv",
) -> str:
    """Compare the error rates recorded in two result CSV files.

    Both files are joined on their ``SourceText`` column, and the word and
    character error rates of ``file2`` are subtracted from those of
    ``file1``.

    Args:
        file1: Path of the first CSV; its columns get the ``_1`` suffix.
        file2: Path of the second CSV; its columns get the ``_2`` suffix.

    Returns:
        An HTML table (without the index column) holding the per-text
        comparison, or a plain message string when a file is missing or
        empty, a required column is absent, or the two files share no
        ``SourceText`` value.
    """
    frames = []
    for path in (file1, file2):
        # Report unreadable inputs as a message instead of letting the
        # exception escape from the Gradio callback.
        try:
            frame = pd.read_csv(path)
        except FileNotFoundError:
            return f"找不到文件:{path}"
        except pd.errors.EmptyDataError:
            return f"文件为空:{path}"

        missing = [col for col in _REQUIRED_COLUMNS if col not in frame.columns]
        if missing:
            return f"文件 {path} 缺少必要的列:{', '.join(missing)}"
        frames.append(frame)

    df1, df2 = frames

    # Join on SourceText; overlapping columns are disambiguated by suffix.
    merged_df = pd.merge(df1, df2, on="SourceText", suffixes=("_1", "_2"))

    if merged_df.empty:
        return "两个文件中没有相同的 SourceText,请检查数据。"

    # Differences are computed as file1 minus file2.
    merged_df["WordErrorRate_Diff"] = (
        merged_df["WordErrorRate_1"] - merged_df["WordErrorRate_2"]
    )
    merged_df["CharacterErrorRate_Diff"] = (
        merged_df["CharacterErrorRate_1"] - merged_df["CharacterErrorRate_2"]
    )

    # Keep only the columns relevant to the side-by-side comparison.
    comparison = merged_df[
        [
            "SourceText",
            "UUID_1",
            "WhisperText_1",
            "WordErrorRate_1",
            "CharacterErrorRate_1",
            "UUID_2",
            "WhisperText_2",
            "WordErrorRate_2",
            "CharacterErrorRate_2",
            "WordErrorRate_Diff",
            "CharacterErrorRate_Diff",
        ]
    ]
    return comparison.to_html(index=False)


# Gradio UI: no input components, so the callback runs with its default
# file names and renders the returned string as HTML.
demo = gr.Interface(
    fn=compare_csv_files,
    inputs=None,
    outputs="html",
    title="CSV 文件对比工具",
    description="自动加载目录下的 fish-speech-1.5.csv 和 fish-speech-1.4.csv,对比它们的 WordErrorRate 和 CharacterErrorRate 差异。",
)
demo.launch()