Spaces:

mgbam
/

BizIntel_AI

Sleeping

File size: 9,974 Bytes

221fe0a
e490e03
309eec4
 
f0be302
773f0cf
2c362d2
309eec4
10c7dea
3acbc9c
309eec4
221fe0a
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
10c7dea
e490e03
9414ba2
e490e03
10c7dea
2c362d2
b3a1f0c
221fe0a
 
 
 
 
2c362d2
67e3963
e490e03
221fe0a
e490e03
221fe0a
 
67e3963
72a73ff
 
e490e03
221fe0a
e490e03
221fe0a
f0be302
 
221fe0a
 
c7c64f3
f0be302
 
c7c64f3
773f0cf
221fe0a
 
 
 
f0be302
9414ba2
f0be302
9414ba2
f0be302
 
 
221fe0a
d037161
f0be302
221fe0a
773f0cf
9414ba2
c7c64f3
773f0cf
221fe0a
 
c7c64f3
221fe0a
 
773f0cf
 
 
 
 
309eec4
 
773f0cf
221fe0a
10c7dea
773f0cf
221fe0a
773f0cf
9414ba2
 
 
221fe0a
9414ba2
221fe0a
10c7dea
e490e03
221fe0a
e490e03
f0be302
2c362d2
10c7dea
221fe0a
9414ba2
 
 
773f0cf
9414ba2
10c7dea
221fe0a
9414ba2
e490e03
221fe0a
 
 
 
 
 
 
 
 
773f0cf
e490e03
221fe0a
e490e03
523228c
 
9414ba2
 
221fe0a
 
 
e490e03
 
523228c
 
221fe0a
773f0cf
3acbc9c
d826a13
221fe0a
c7c64f3
 
221fe0a
c7c64f3
9414ba2
c7c64f3
d037161
c7c64f3
 
f0be302
 
d037161
221fe0a
 
 
523228c
221fe0a
c7c64f3
 
 
 
 
773f0cf
e490e03
c7c64f3
e490e03
523228c
3acbc9c
 
773f0cf
221fe0a
 
d826a13
221fe0a
9414ba2
d037161
 
3acbc9c
221fe0a
773f0cf

# app.py  —  BizIntel AI Ultra  (Any metric, CSV/Excel/DB, Plotly, Gemini 1.5 Pro)

import os
import tempfile
from typing import Literal

import pandas as pd
import streamlit as st
import google.generativeai as genai
import plotly.graph_objects as go

# ──────────────────────────────────────────────────────────────
# SAFELY REDIRECT ALL write_image CALLS TO /tmp
# ──────────────────────────────────────────────────────────────
_tmp = tempfile.gettempdir()
_orig_write = go.Figure.write_image

def _safe_write(self, path, *args, **kwargs):
    # keep only filename, write into tempdir
    fname = os.path.basename(path)
    safe_path = os.path.join(_tmp, fname)
    return _orig_write(self, safe_path, *args, **kwargs)

go.Figure.write_image = _safe_write

# ──────────────────────────────────────────────────────────────
# TOOL IMPORTS
# ──────────────────────────────────────────────────────────────
from tools.csv_parser     import parse_csv_tool
from tools.plot_generator import plot_metric_tool       # generic: date + metric
from tools.forecaster     import forecast_metric_tool   # generic: date + metric
from tools.visuals        import (
    histogram_tool,
    scatter_matrix_tool,
    corr_heatmap_tool,
)
from db_connector         import fetch_data_from_db, list_tables, SUPPORTED_ENGINES

# ──────────────────────────────────────────────────────────────
# 1.  GEMINI CONFIG
# ──────────────────────────────────────────────────────────────
genai.configure(api_key=os.getenv("GEMINI_APIKEY"))
gemini = genai.GenerativeModel(
    "gemini-1.5-pro-latest",
    generation_config={
        "temperature": 0.7,
        "top_p": 0.9,
        "response_mime_type": "text/plain",
    },
)

# ──────────────────────────────────────────────────────────────
# 2.  PAGE SETUP
# ──────────────────────────────────────────────────────────────
st.set_page_config(page_title="BizIntel AI Ultra", layout="wide")
st.title("📊 BizIntel AI Ultra – Advanced Analytics + Gemini 1.5 Pro")

TEMP_DIR = tempfile.gettempdir()

# ──────────────────────────────────────────────────────────────
# 3.  DATA SOURCE (CSV, Excel, or DB)
# ──────────────────────────────────────────────────────────────
source = st.radio("Select data source", ["Upload CSV / Excel", "Connect to SQL Database"])
csv_path: str | None = None

if source == "Upload CSV / Excel":
    up = st.file_uploader("Upload CSV or Excel (≤ 500 MB)", type=["csv", "xlsx", "xls"])
    if up:
        temp_path = os.path.join(TEMP_DIR, up.name)
        with open(temp_path, "wb") as f:
            f.write(up.read())

        if up.name.lower().endswith(".csv"):
            csv_path = temp_path
        else:
            # Excel → load sheet0 → write out to CSV
            try:
                df_xl = pd.read_excel(temp_path, sheet_name=0)
                csv_path = os.path.splitext(temp_path)[0] + ".csv"
                df_xl.to_csv(csv_path, index=False)
            except Exception as e:
                st.error(f"Excel parsing failed: {e}")
                st.stop()

        st.success(f"{up.name} saved ✅")

else:
    engine = st.selectbox("DB engine", SUPPORTED_ENGINES)
    conn   = st.text_input("SQLAlchemy connection string")
    if conn:
        try:
            tables = list_tables(conn)
            table  = st.selectbox("Table", tables)
            if st.button("Fetch table"):
                csv_path = fetch_data_from_db(conn, table)
                st.success(f"Fetched **{table}** as CSV ✅")
        except Exception as e:
            st.error(f"Connection failed: {e}")
            st.stop()

if csv_path is None:
    st.stop()

with open(csv_path, "rb") as f:
    st.download_button("⬇️ Download working CSV", f, file_name=os.path.basename(csv_path))

# ──────────────────────────────────────────────────────────────
# 4.  COLUMN SELECTION
# ──────────────────────────────────────────────────────────────
df_head = pd.read_csv(csv_path, nrows=5)
st.dataframe(df_head)

date_col    = st.selectbox("Select date/time column", df_head.columns)
numeric_cols = df_head.select_dtypes("number").columns
metric_col  = st.selectbox("Select numeric metric column", numeric_cols)

# ──────────────────────────────────────────────────────────────
# 5.  LOCAL ANALYTICS: SUMMARY, TREND, FORECAST
# ──────────────────────────────────────────────────────────────
with st.spinner("Parsing dataset…"):
    summary_text = parse_csv_tool(csv_path)

with st.spinner("Building trend chart…"):
    trend_fig = plot_metric_tool(csv_path, date_col, metric_col)
if isinstance(trend_fig, go.Figure):
    st.plotly_chart(trend_fig, use_container_width=True)
else:
    st.warning(trend_fig)

with st.spinner("Forecasting…"):
    forecast_text = forecast_metric_tool(csv_path, date_col, metric_col)

# Show forecast interactive (PNG saved safely in /tmp)
st.subheader(f"🔮 {metric_col} Forecast")
with st.spinner("Rendering forecast…"):
    # read PNG from tempdir if exists
    png_path = os.path.join(TEMP_DIR, "forecast_plot.png")
    if os.path.exists(png_path):
        st.image(png_path, use_column_width=True)
    else:
        st.warning("Forecast image not found.")

# ──────────────────────────────────────────────────────────────
# 6.  GEMINI STRATEGY
# ──────────────────────────────────────────────────────────────
prompt = (
    f"You are **BizIntel Strategist AI**.\n\n"
    f"### Dataset Summary\n```\n{summary_text}\n```\n\n"
    f"### {metric_col} Forecast\n```\n{forecast_text}\n```\n\n"
    "Return **Markdown** with:\n"
    "1. Five key insights\n"
    "2. Three actionable strategies\n"
    "3. Risk factors or anomalies\n"
    "4. Suggested additional visuals\n"
)

st.subheader("🚀 Strategy Recommendations (Gemini 1.5 Pro)")
with st.spinner("Generating insights…"):
    strategy_md = gemini.generate_content(prompt).text
st.markdown(strategy_md)
st.download_button("⬇️ Download Strategy (.md)", strategy_md, file_name="strategy.md")

# ──────────────────────────────────────────────────────────────
# 7.  KPI CARDS + DETAILED STATS
# ──────────────────────────────────────────────────────────────
full_df    = pd.read_csv(csv_path, low_memory=False)
total_rows = len(full_df)
num_cols   = len(full_df.columns)
missing_pct = full_df.isna().mean().mean() * 100

st.markdown("---")
st.subheader("📑 Dataset Overview")
c1, c2, c3 = st.columns(3)
c1.metric("Rows",     f"{total_rows:,}")
c2.metric("Columns",  str(num_cols))
c3.metric("Missing %", f"{missing_pct:.1f}%")

with st.expander("🔎 Detailed descriptive statistics"):
    stats_df = full_df.describe().T.reset_index().rename(columns={"index": "Feature"})
    st.dataframe(
        stats_df.style.format(precision=2).background_gradient(cmap="Blues"),
        use_container_width=True,
    )

# ──────────────────────────────────────────────────────────────
# 8.  OPTIONAL EXPLORATORY VISUALS
# ──────────────────────────────────────────────────────────────
st.markdown("---")
st.subheader("🔍 Optional Exploratory Visuals")

if st.checkbox("Histogram"):
    hcol = st.selectbox("Variable", numeric_cols, key="hist")
    st.plotly_chart(histogram_tool(csv_path, hcol), use_container_width=True)

if st.checkbox("Scatter-matrix"):
    sel = st.multiselect("Choose columns", numeric_cols, default=numeric_cols[:3])
    if sel:
        st.plotly_chart(scatter_matrix_tool(csv_path, sel), use_container_width=True)

if st.checkbox("Correlation heat-map"):
    st.plotly_chart(corr_heatmap_tool(csv_path), use_container_width=True)