Spaces:

Rozeeeee
/

evo

Sleeping

App Files Files Community

Rozeeeee committed on Jan 29

Commit

0e115ff

verified ·

1 Parent(s): 9a16016

Update app.py

Browse files

Files changed (1) hide show

app.py +28 -58

app.py CHANGED Viewed

@@ -1,81 +1,51 @@
 import streamlit as st
 import pandas as pd
 import requests
 import plotly.express as px
 import io
 # 設置全局主題
-THEME = px.colors.qualitative.Bold
-# 下載並載入 CSV 數據
-@st.cache_data
-def download_and_clean_csv(url):
     response = requests.get(url)
     response.encoding = 'utf-8'
     df = pd.read_csv(io.StringIO(response.text), encoding='utf-8')
-    # 資料清理
-    df = df.dropna().drop_duplicates()  # 移除缺失值與重複數據
-    df.columns = df.columns.str.strip()  # 去除欄位名稱前後空格
-    df = df.applymap(lambda x: x.strip() if isinstance(x, str) else x)  # 去除字串內的空格
-    # 嘗試轉換數值欄位
-    num_cols = ["範疇一排放量(噸CO2e)", "範疇二排放量(噸CO2e)", "範疇三排放量(噸CO2e)"]
-    for col in num_cols:
-        if col in df.columns:
-            df[col] = pd.to_numeric(df[col], errors='coerce').fillna(0)
     return df
-# 美化圖表
-def beautify_chart(fig):
-    fig.update_layout(
-        font_family="Arial",
-        font_color="#444",
-        title_font_family="Arial",
-        title_font_color="#000",
-        legend_title_font_color="#000",
-        plot_bgcolor='rgba(0,0,0,0)',
-        paper_bgcolor='rgba(0,0,0,0)',
-    )
-    fig.update_xaxes(showline=True, linewidth=2, linecolor='lightgray', gridcolor='lightgray')
-    fig.update_yaxes(showline=True, linewidth=2, linecolor='lightgray', gridcolor='lightgray')
-    return fig
-# 下載、清理並合併數據
 urls = [
     "https://mopsfin.twse.com.tw/opendata/t187ap46_L_1.csv",
     "https://mopsfin.twse.com.tw/opendata/t187ap46_O_2.csv",
     "https://mopsfin.twse.com.tw/opendata/t187ap46_L_6.csv"
 ]
-dfs = [download_and_clean_csv(url) for url in urls]
-combined_df = pd.concat(dfs, ignore_index=True)
-# 進一步清理 combined_df
-combined_df = combined_df.dropna().drop_duplicates()
-combined_df.columns = combined_df.columns.str.strip()
-combined_df = combined_df.applymap(lambda x: x.strip() if isinstance(x, str) else x)
-for col in ["範疇一排放量(噸CO2e)", "範疇二排放量(噸CO2e)", "範疇三排放量(噸CO2e)"]:
-    if col in combined_df.columns:
-        combined_df[col] = pd.to_numeric(combined_df[col], errors='coerce').fillna(0)
-# 合併數據
-df_final = combined_df.groupby("公司名稱", as_index=False).sum()
-# 設定 Streamlit 介面
-st.title("台灣企業ESG數據分析與揭露")
 # 顯示清理後的數據
-st.subheader("清理後的數據預覽")
-st.dataframe(df_final)
-# 可視化數據
-emission_columns = ["範疇一排放量(噸CO2e)", "範疇二排放量(噸CO2e)", "範疇三排放量(噸CO2e)"]
-selected_columns = [col for col in emission_columns if col in df_final.columns]
-if selected_columns:
-    st.subheader("排放量折線圖")
-    fig_line = px.line(df_final, x="公司名稱", y=selected_columns, title="企業排放量趨勢", color_discrete_sequence=THEME)
-    st.plotly_chart(beautify_chart(fig_line))
-else:
-    st.write("未找到有效的排放數據")

 import streamlit as st
 import pandas as pd
+import numpy as np
 import requests
 import plotly.express as px
 import io
+# Global color theme: Plotly's qualitative "Bold" palette
+# NOTE(review): not referenced anywhere in the visible post-commit file -- confirm before removing
+theme = px.colors.qualitative.Bold
+# 下載 CSV 數據
+# Cache results so Streamlit reruns do not re-download the same file;
+# the one-hour TTL lets refreshed source data show up eventually.
+@st.cache_data(ttl=3600)
+def download_and_load_csv(url, timeout=30):
+    """Download the CSV at *url* and parse it into a DataFrame.
+
+    Args:
+        url: Address of the CSV file to fetch.
+        timeout: Seconds to wait for the server before giving up.
+
+    Returns:
+        pandas.DataFrame parsed from the response body.
+
+    Raises:
+        requests.RequestException: On connection failure, timeout, or a
+            4xx/5xx HTTP status.
+    """
+    response = requests.get(url, timeout=timeout)
+    # Fail loudly on an HTTP error instead of parsing an error page as CSV
+    response.raise_for_status()
+    # Force UTF-8 decoding of the body regardless of the response headers
     response.encoding = 'utf-8'
     df = pd.read_csv(io.StringIO(response.text), encoding='utf-8')
     return df
+# 清理數據並合併
+def clean_and_merge_data(urls):
+    """Download every CSV in *urls*, clean the emission columns, and sum per company.
+
+    Args:
+        urls: Iterable of CSV addresses, each passed to download_and_load_csv.
+
+    Returns:
+        pandas.DataFrame with one row per distinct "公司名稱" value, holding
+        the column-wise sum of that company's remaining rows.
+
+    Raises:
+        ValueError: If *urls* is empty (pd.concat has nothing to concatenate).
+        KeyError: If the combined data has no "公司名稱" column.
+    """
+    dfs = [download_and_load_csv(url) for url in urls]
+    # Stack all sources into a single frame
+    combined_df = pd.concat(dfs, ignore_index=True)
+    # Emission columns to clean
+    emission_columns = ["範疇一排放量(噸CO2e)", "範疇二排放量(噸CO2e)", "範疇三排放量(噸CO2e)"]
+    # Only touch the emission columns that actually exist, so a source with
+    # a different schema does not raise KeyError
+    present_columns = [col for col in emission_columns if col in combined_df.columns]
+    if present_columns:
+        # Coerce to numbers first so text values cannot slip past the 0 check,
+        # then treat 0 as missing; other columns are left untouched
+        combined_df[present_columns] = (
+            combined_df[present_columns]
+            .apply(pd.to_numeric, errors="coerce")
+            .replace(0, np.nan)
+        )
+        # Drop rows on the frame itself. Assigning a dropna() result back into
+        # the columns re-aligns on the index and removes nothing.
+        combined_df = combined_df.dropna(subset=present_columns)
+    # Merge rows that share a company name by summing them
+    # NOTE(review): sum() is applied to every remaining column, not just the
+    # emission columns -- confirm that is intended for the other fields
+    merged_df = combined_df.groupby("公司名稱", as_index=False).sum()
+    return merged_df
+# CSV sources
 urls = [
     "https://mopsfin.twse.com.tw/opendata/t187ap46_L_1.csv",
     "https://mopsfin.twse.com.tw/opendata/t187ap46_O_2.csv",
     "https://mopsfin.twse.com.tw/opendata/t187ap46_L_6.csv"
 ]
+# Download, clean, and merge the data from all sources
+cleaned_df = clean_and_merge_data(urls)
+# Set the Streamlit page title
+st.title("台灣企業 ESG 數據分析與揭露")
+# Show the cleaned and merged data as an interactive table
+st.subheader("清理 & 合併後的數據預覽")
+st.dataframe(cleaned_df)