Spaces:
Running
Running
File size: 1,341 Bytes
bdee176 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 |
import pandas as pd
import gradio as gr
def compare_csv_files(file1="fish-speech-1.5.csv", file2="fish-speech-1.4.csv"):
    """Compare the error rates recorded in two evaluation CSV files.

    Both files are read with pandas and inner-joined on ``SourceText``.
    For every text present in both files, the word and character error
    rates of ``file2`` are subtracted from those of ``file1``.

    Args:
        file1: Path of the first CSV file; its columns get the ``_1`` suffix.
        file2: Path of the second CSV file; its columns get the ``_2`` suffix.

    Returns:
        An HTML table (str) with the side-by-side values and the two
        ``*_Diff`` columns, or a plain message (str) when a file cannot be
        found, a required column is missing, or the files share no
        ``SourceText`` value.
    """
    required_columns = (
        "SourceText",
        "UUID",
        "WhisperText",
        "WordErrorRate",
        "CharacterErrorRate",
    )

    frames = []
    for path in (file1, file2):
        try:
            frame = pd.read_csv(path)
        except FileNotFoundError:
            return f"找不到文件:{path}"
        # pd.merge only applies the suffixes to columns that exist in BOTH
        # frames, so a column missing from one file would later surface as
        # an opaque KeyError on the "_1"/"_2" names. Check up front instead.
        missing = [col for col in required_columns if col not in frame.columns]
        if missing:
            return f"文件 {path} 缺少必需的列:{', '.join(missing)}"
        frames.append(frame)
    df1, df2 = frames

    # Inner join: only texts present in both files are compared.
    merged_df = pd.merge(df1, df2, on="SourceText", suffixes=("_1", "_2"))
    if merged_df.empty:
        return "两个文件中没有相同的 SourceText,请检查数据。"

    # Difference is file1 minus file2 for both metrics.
    merged_df["WordErrorRate_Diff"] = (
        merged_df["WordErrorRate_1"] - merged_df["WordErrorRate_2"]
    )
    merged_df["CharacterErrorRate_Diff"] = (
        merged_df["CharacterErrorRate_1"] - merged_df["CharacterErrorRate_2"]
    )

    comparison = merged_df[[
        "SourceText",
        "UUID_1", "WhisperText_1", "WordErrorRate_1", "CharacterErrorRate_1",
        "UUID_2", "WhisperText_2", "WordErrorRate_2", "CharacterErrorRate_2",
        "WordErrorRate_Diff", "CharacterErrorRate_Diff",
    ]]
    return comparison.to_html(index=False)
# Gradio interface: no inputs; pressing the button runs the comparison
# and renders the returned string as HTML.
demo = gr.Interface(
    fn=compare_csv_files,
    inputs=None,
    outputs="html",
    title="CSV 文件对比工具",
    description="自动加载目录下的 fish-speech-1.5.csv 和 fish-speech-1.4.csv,对比它们的 WordErrorRate 和 CharacterErrorRate 差异。",
)
demo.launch()
|