euler314's picture
Update app.py
0357330 verified
import streamlit as st
import sympy as sp
import numpy as np
import plotly.graph_objects as go
from scipy.optimize import fsolve
from scipy.stats import gaussian_kde
# Configure Streamlit for Hugging Face Spaces
st.set_page_config(
page_title="Cubic Root Analysis",
layout="wide",
initial_sidebar_state="collapsed"
)
def add_sqrt_support(expr_str):
"""Replace 'sqrt(' with 'sp.sqrt(' for sympy compatibility"""
return expr_str.replace('sqrt(', 'sp.sqrt(')
#############################
# 1) Define the discriminant
#############################
# Symbolic variables for the cubic discriminant
z_sym, beta_sym, z_a_sym, y_sym = sp.symbols("z beta z_a y", real=True, positive=True)
# Define coefficients a, b, c, d in terms of z_sym, beta_sym, z_a_sym, y_sym
a_sym = z_sym * z_a_sym
b_sym = z_sym * z_a_sym + z_sym + z_a_sym - z_a_sym*y_sym
c_sym = z_sym + z_a_sym + 1 - y_sym*(beta_sym*z_a_sym + 1 - beta_sym)
d_sym = 1
# Symbolic expression for the cubic discriminant
Delta_expr = (
((b_sym*c_sym)/(6*a_sym**2) - (b_sym**3)/(27*a_sym**3) - d_sym/(2*a_sym))**2
+ (c_sym/(3*a_sym) - (b_sym**2)/(9*a_sym**2))**3
)
# Fast numeric function for the discriminant
discriminant_func = sp.lambdify((z_sym, beta_sym, z_a_sym, y_sym), Delta_expr, "numpy")
@st.cache_data
def find_z_at_discriminant_zero(z_a, y, beta, z_min, z_max, steps):
"""
Scan z in [z_min, z_max] for sign changes in the discriminant,
and return approximated roots (where the discriminant is zero).
"""
z_grid = np.linspace(z_min, z_max, steps)
disc_vals = discriminant_func(z_grid, beta, z_a, y)
roots_found = []
for i in range(len(z_grid) - 1):
f1, f2 = disc_vals[i], disc_vals[i+1]
if np.isnan(f1) or np.isnan(f2):
continue
if f1 == 0.0:
roots_found.append(z_grid[i])
elif f2 == 0.0:
roots_found.append(z_grid[i+1])
elif f1 * f2 < 0:
zl, zr = z_grid[i], z_grid[i+1]
for _ in range(50):
mid = 0.5 * (zl + zr)
fm = discriminant_func(mid, beta, z_a, y)
if fm == 0:
zl = zr = mid
break
if np.sign(fm) == np.sign(f1):
zl, f1 = mid, fm
else:
zr, f2 = mid, fm
roots_found.append(0.5 * (zl + zr))
return np.array(roots_found)
@st.cache_data
def sweep_beta_and_find_z_bounds(z_a, y, z_min, z_max, beta_steps, z_steps):
"""
For each beta in [0,1] (with beta_steps points), find the minimum and maximum z
for which the discriminant is zero.
Returns: betas, lower z*(β) values, and upper z*(β) values.
"""
betas = np.linspace(0, 1, beta_steps)
z_min_values = []
z_max_values = []
for b in betas:
roots = find_z_at_discriminant_zero(z_a, y, b, z_min, z_max, z_steps)
if len(roots) == 0:
z_min_values.append(np.nan)
z_max_values.append(np.nan)
else:
z_min_values.append(np.min(roots))
z_max_values.append(np.max(roots))
return betas, np.array(z_min_values), np.array(z_max_values)
# Removed the compute_low_y_curve function
@st.cache_data
def compute_high_y_curve(betas, z_a, y):
"""
Compute the "High y Expression" curve.
"""
a = z_a
betas = np.array(betas)
denominator = 1 - 2*a
if denominator == 0:
return np.full_like(betas, np.nan)
numerator = -4*a*(a-1)*y*betas - 2*a*y - 2*a*(2*a-1)
return numerator/denominator
def compute_alternate_low_expr(betas, z_a, y):
"""
Compute the alternate low expression:
(z_a*y*beta*(z_a-1) - 2*z_a*(1-y) - 2*z_a**2) / (2+2*z_a)
"""
betas = np.array(betas)
return (z_a * y * betas * (z_a - 1) - 2*z_a*(1 - y) - 2*z_a**2) / (2 + 2*z_a)
@st.cache_data
def compute_derivatives(curve, betas):
"""Compute first and second derivatives of a curve"""
d1 = np.gradient(curve, betas)
d2 = np.gradient(d1, betas)
return d1, d2
def compute_all_derivatives(betas, z_mins, z_maxs, low_y_curve, high_y_curve, alt_low_expr, custom_curve1=None, custom_curve2=None):
"""Compute derivatives for all curves"""
derivatives = {}
# Upper z*(β)
derivatives['upper'] = compute_derivatives(z_maxs, betas)
# Lower z*(β)
derivatives['lower'] = compute_derivatives(z_mins, betas)
# Low y Expression (only if provided)
if low_y_curve is not None:
derivatives['low_y'] = compute_derivatives(low_y_curve, betas)
# High y Expression
derivatives['high_y'] = compute_derivatives(high_y_curve, betas)
# Alternate Low Expression
derivatives['alt_low'] = compute_derivatives(alt_low_expr, betas)
# Custom Expression 1 (if provided)
if custom_curve1 is not None:
derivatives['custom1'] = compute_derivatives(custom_curve1, betas)
# Custom Expression 2 (if provided)
if custom_curve2 is not None:
derivatives['custom2'] = compute_derivatives(custom_curve2, betas)
return derivatives
def compute_custom_expression(betas, z_a, y, s_num_expr, s_denom_expr, is_s_based=True):
"""
Compute custom curve. If is_s_based=True, compute using s substitution.
Otherwise, compute direct z(β) expression.
"""
beta_sym, z_a_sym, y_sym = sp.symbols("beta z_a y", positive=True)
local_dict = {"beta": beta_sym, "z_a": z_a_sym, "y": y_sym, "sp": sp}
try:
# Add sqrt support
s_num_expr = add_sqrt_support(s_num_expr)
s_denom_expr = add_sqrt_support(s_denom_expr)
num_expr = sp.sympify(s_num_expr, locals=local_dict)
denom_expr = sp.sympify(s_denom_expr, locals=local_dict)
if is_s_based:
# Compute s and substitute into main expression
s_expr = num_expr / denom_expr
a = z_a_sym
numerator = y_sym*beta_sym*(z_a_sym-1)*s_expr + (a*s_expr+1)*((y_sym-1)*s_expr-1)
denominator = (a*s_expr+1)*(s_expr**2 + s_expr)
final_expr = numerator/denominator
else:
# Direct z(β) expression
final_expr = num_expr / denom_expr
except sp.SympifyError as e:
st.error(f"Error parsing expressions: {e}")
return np.full_like(betas, np.nan)
final_func = sp.lambdify((beta_sym, z_a_sym, y_sym), final_expr, modules=["numpy"])
with np.errstate(divide='ignore', invalid='ignore'):
result = final_func(betas, z_a, y)
if np.isscalar(result):
result = np.full_like(betas, result)
return result
def generate_z_vs_beta_plot(z_a, y, z_min, z_max, beta_steps, z_steps,
s_num_expr=None, s_denom_expr=None,
z_num_expr=None, z_denom_expr=None,
show_derivatives=False):
if z_a <= 0 or y <= 0 or z_min >= z_max:
st.error("Invalid input parameters.")
return None
betas = np.linspace(0, 1, beta_steps)
betas, z_mins, z_maxs = sweep_beta_and_find_z_bounds(z_a, y, z_min, z_max, beta_steps, z_steps)
# Removed low_y_curve computation
high_y_curve = compute_high_y_curve(betas, z_a, y)
alt_low_expr = compute_alternate_low_expr(betas, z_a, y)
# Compute both custom curves
custom_curve1 = None
custom_curve2 = None
if s_num_expr and s_denom_expr:
custom_curve1 = compute_custom_expression(betas, z_a, y, s_num_expr, s_denom_expr, True)
if z_num_expr and z_denom_expr:
custom_curve2 = compute_custom_expression(betas, z_a, y, z_num_expr, z_denom_expr, False)
# Compute derivatives if needed
if show_derivatives:
derivatives = compute_all_derivatives(betas, z_mins, z_maxs, None, high_y_curve,
alt_low_expr, custom_curve1, custom_curve2)
fig = go.Figure()
# Original curves
fig.add_trace(go.Scatter(x=betas, y=z_maxs, mode="markers+lines",
name="Upper z*(β)", line=dict(color='blue')))
fig.add_trace(go.Scatter(x=betas, y=z_mins, mode="markers+lines",
name="Lower z*(β)", line=dict(color='lightblue')))
# Removed the Low y Expression trace
fig.add_trace(go.Scatter(x=betas, y=high_y_curve, mode="markers+lines",
name="High y Expression", line=dict(color='green')))
fig.add_trace(go.Scatter(x=betas, y=alt_low_expr, mode="markers+lines",
name="Alternate Low Expression", line=dict(color='orange')))
if custom_curve1 is not None:
fig.add_trace(go.Scatter(x=betas, y=custom_curve1, mode="markers+lines",
name="Custom 1 (s-based)", line=dict(color='purple')))
if custom_curve2 is not None:
fig.add_trace(go.Scatter(x=betas, y=custom_curve2, mode="markers+lines",
name="Custom 2 (direct)", line=dict(color='magenta')))
if show_derivatives:
# First derivatives
curve_info = [
('upper', 'Upper z*(β)', 'blue'),
('lower', 'Lower z*(β)', 'lightblue'),
# Removed low_y curve
('high_y', 'High y', 'green'),
('alt_low', 'Alt Low', 'orange')
]
if custom_curve1 is not None:
curve_info.append(('custom1', 'Custom 1', 'purple'))
if custom_curve2 is not None:
curve_info.append(('custom2', 'Custom 2', 'magenta'))
for key, name, color in curve_info:
fig.add_trace(go.Scatter(x=betas, y=derivatives[key][0], mode="lines",
name=f"{name} d/dβ", line=dict(color=color, dash='dash')))
fig.add_trace(go.Scatter(x=betas, y=derivatives[key][1], mode="lines",
name=f"{name} d²/dβ²", line=dict(color=color, dash='dot')))
fig.update_layout(
title="Curves vs β: z*(β) Boundaries and Asymptotic Expressions",
xaxis_title="β",
yaxis_title="Value",
hovermode="x unified",
showlegend=True,
legend=dict(
yanchor="top",
y=0.99,
xanchor="left",
x=0.01
)
)
return fig
def compute_cubic_roots(z, beta, z_a, y):
"""
Compute the roots of the cubic equation for given parameters.
"""
a = z * z_a
b = z * z_a + z + z_a - z_a*y
c = z + z_a + 1 - y*(beta*z_a + 1 - beta)
d = 1
coeffs = [a, b, c, d]
roots = np.roots(coeffs)
return roots
def generate_root_plots(beta, y, z_a, z_min, z_max, n_points):
"""
Generate Im(s) and Re(s) vs. z plots.
"""
if z_a <= 0 or y <= 0 or z_min >= z_max:
st.error("Invalid input parameters.")
return None, None
z_points = np.linspace(z_min, z_max, n_points)
ims, res = [], []
for z in z_points:
roots = compute_cubic_roots(z, beta, z_a, y)
roots = sorted(roots, key=lambda x: abs(x.imag))
ims.append([root.imag for root in roots])
res.append([root.real for root in roots])
ims = np.array(ims)
res = np.array(res)
fig_im = go.Figure()
for i in range(3):
fig_im.add_trace(go.Scatter(x=z_points, y=ims[:, i], mode="lines", name=f"Im{{s{i+1}}}",
line=dict(width=2)))
fig_im.update_layout(title=f"Im{{s}} vs. z (β={beta:.3f}, y={y:.3f}, z_a={z_a:.3f})",
xaxis_title="z", yaxis_title="Im{s}", hovermode="x unified")
fig_re = go.Figure()
for i in range(3):
fig_re.add_trace(go.Scatter(x=z_points, y=res[:, i], mode="lines", name=f"Re{{s{i+1}}}",
line=dict(width=2)))
fig_re.update_layout(title=f"Re{{s}} vs. z (β={beta:.3f}, y={y:.3f}, z_a={z_a:.3f})",
xaxis_title="z", yaxis_title="Re{s}", hovermode="x unified")
return fig_im, fig_re
@st.cache_data
def generate_eigenvalue_distribution(beta, y, z_a, n=1000, seed=42):
"""
Generate the eigenvalue distribution of B_n = S_n T_n as n→∞
Parameters:
-----------
beta : float
Fraction of components equal to z_a
y : float
Aspect ratio p/n
z_a : float
Value for the delta mass at z_a
n : int
Number of samples
seed : int
Random seed for reproducibility
"""
# Set random seed
np.random.seed(seed)
# Compute dimension p based on aspect ratio y
p = int(y * n)
# Constructing T_n (Population / Shape Matrix)
T_diag = np.where(np.random.rand(p) < beta, z_a, 1.0)
T_n = np.diag(T_diag)
# Generate the data matrix X with i.i.d. standard normal entries
X = np.random.randn(p, n)
# Compute the sample covariance matrix S_n = (1/n) * XX^T
S_n = (1 / n) * (X @ X.T)
# Compute B_n = S_n T_n
B_n = S_n @ T_n
# Compute eigenvalues of B_n
eigenvalues = np.linalg.eigvalsh(B_n)
# Use KDE to compute a smooth density estimate
kde = gaussian_kde(eigenvalues)
x_vals = np.linspace(min(eigenvalues), max(eigenvalues), 500)
kde_vals = kde(x_vals)
# Create figure
fig = go.Figure()
# Add histogram trace
fig.add_trace(go.Histogram(x=eigenvalues, histnorm='probability density',
name="Histogram", marker=dict(color='blue', opacity=0.6)))
# Add KDE trace
fig.add_trace(go.Scatter(x=x_vals, y=kde_vals, mode="lines",
name="KDE", line=dict(color='red', width=2)))
fig.update_layout(
title=f"Eigenvalue Distribution for B_n = S_n T_n (y={y:.1f}, β={beta:.2f}, a={z_a:.1f})",
xaxis_title="Eigenvalue",
yaxis_title="Density",
hovermode="closest",
showlegend=True
)
return fig
# ----------------- Streamlit UI -----------------
st.title("Cubic Root Analysis")
# Define three tabs (removed "Curve Intersections")
tab1, tab2, tab3 = st.tabs(["z*(β) Curves", "Im{s} vs. z", "Differential Analysis"])
# ----- Tab 1: z*(β) Curves -----
with tab1:
st.header("Find z Values where Cubic Roots Transition Between Real and Complex")
col1, col2 = st.columns([1, 2])
with col1:
z_a_1 = st.number_input("z_a", value=1.0, key="z_a_1")
y_1 = st.number_input("y", value=1.0, key="y_1")
z_min_1 = st.number_input("z_min", value=-10.0, key="z_min_1")
z_max_1 = st.number_input("z_max", value=10.0, key="z_max_1")
with st.expander("Resolution Settings"):
beta_steps = st.slider("β steps", min_value=51, max_value=501, value=201, step=50, key="beta_steps")
z_steps = st.slider("z grid steps", min_value=1000, max_value=100000, value=50000, step=1000, key="z_steps")
st.subheader("Custom Expression 1 (s-based)")
st.markdown("""Enter expressions for s = numerator/denominator
(using variables `y`, `beta`, `z_a`, and `sqrt()`)""")
st.latex(r"\text{This s will be inserted into:}")
st.latex(r"\frac{y\beta(z_a-1)\underline{s}+(a\underline{s}+1)((y-1)\underline{s}-1)}{(a\underline{s}+1)(\underline{s}^2 + \underline{s})}")
s_num = st.text_input("s numerator", value="y*beta*(z_a-1)", key="s_num")
s_denom = st.text_input("s denominator", value="z_a", key="s_denom")
st.subheader("Custom Expression 2 (direct z(β))")
st.markdown("""Enter direct expression for z(β) = numerator/denominator
(using variables `y`, `beta`, `z_a`, and `sqrt()`)""")
z_num = st.text_input("z(β) numerator", value="y*beta*(z_a-1)", key="z_num")
z_denom = st.text_input("z(β) denominator", value="1", key="z_denom")
show_derivatives = st.checkbox("Show derivatives", value=False)
if st.button("Compute z vs. β Curves", key="tab1_button"):
with col2:
fig = generate_z_vs_beta_plot(z_a_1, y_1, z_min_1, z_max_1, beta_steps, z_steps,
s_num, s_denom, z_num, z_denom, show_derivatives)
if fig is not None:
st.plotly_chart(fig, use_container_width=True)
st.markdown("### Curve Explanations")
st.markdown("""
- **Upper z*(β)** (Blue): Maximum z value where discriminant is zero
- **Lower z*(β)** (Light Blue): Minimum z value where discriminant is zero
- **High y Expression** (Green): Asymptotic approximation for high y values
- **Alternate Low Expression** (Orange): Alternative asymptotic expression
- **Custom Expression 1** (Purple): Result from user-defined s substituted into the main formula
- **Custom Expression 2** (Magenta): Direct z(β) expression
""")
if show_derivatives:
st.markdown("""
Derivatives are shown as:
- Dashed lines: First derivatives (d/dβ)
- Dotted lines: Second derivatives (d²/dβ²)
""")
# ----- Tab 2: Im{s} vs. z -----
with tab2:
st.header("Plot Complex Roots vs. z")
col1, col2 = st.columns([1, 2])
with col1:
beta = st.number_input("β", value=0.5, min_value=0.0, max_value=1.0, key="beta_tab2")
y_2 = st.number_input("y", value=1.0, key="y_tab2")
z_a_2 = st.number_input("z_a", value=1.0, key="z_a_tab2")
z_min_2 = st.number_input("z_min", value=-10.0, key="z_min_tab2")
z_max_2 = st.number_input("z_max", value=10.0, key="z_max_tab2")
with st.expander("Resolution Settings"):
z_points = st.slider("z grid points", min_value=1000, max_value=10000, value=5000, step=500, key="z_points")
if st.button("Compute Complex Roots vs. z", key="tab2_button"):
with col2:
fig_im, fig_re = generate_root_plots(beta, y_2, z_a_2, z_min_2, z_max_2, z_points)
if fig_im is not None and fig_re is not None:
st.plotly_chart(fig_im, use_container_width=True)
st.plotly_chart(fig_re, use_container_width=True)
# Add a separator
st.markdown("---")
# Add eigenvalue distribution section
st.header("Eigenvalue Distribution for B_n = S_n T_n")
st.markdown("""
This simulation generates the eigenvalue distribution of B_n as n→∞, where:
- B_n = (1/n)XX* with X being a p×n matrix
- p/n → y as n→∞
- All elements of X are i.i.d with distribution β·δ(z_a) + (1-β)·δ(1)
""")
col_eigen1, col_eigen2 = st.columns([1, 2])
with col_eigen1:
n_samples = st.slider("Number of samples (n)", min_value=100, max_value=2000, value=1000, step=100)
sim_seed = st.number_input("Random seed", min_value=1, max_value=1000, value=42, step=1)
if st.button("Generate Eigenvalue Distribution", key="tab2_eigen_button"):
with col_eigen2:
fig_eigen = generate_eigenvalue_distribution(beta, y_2, z_a_2, n=n_samples, seed=sim_seed)
if fig_eigen is not None:
st.plotly_chart(fig_eigen, use_container_width=True)
# ----- Tab 3: Differential Analysis -----
with tab3:
st.header("Differential Analysis vs. β")
st.markdown("This page shows the difference between the Upper (blue) and Lower (lightblue) z*(β) curves, along with their first and second derivatives with respect to β.")
col1, col2 = st.columns([1, 2])
with col1:
z_a_diff = st.number_input("z_a", value=1.0, key="z_a_diff")
y_diff = st.number_input("y", value=1.0, key="y_diff")
z_min_diff = st.number_input("z_min", value=-10.0, key="z_min_diff")
z_max_diff = st.number_input("z_max", value=10.0, key="z_max_diff")
with st.expander("Resolution Settings"):
beta_steps_diff = st.slider("β steps", min_value=51, max_value=501, value=201, step=50, key="beta_steps_diff")
z_steps_diff = st.slider("z grid steps", min_value=1000, max_value=100000, value=50000, step=1000, key="z_steps_diff")
# Add options for curve selection
st.subheader("Curves to Analyze")
analyze_upper_lower = st.checkbox("Upper-Lower Difference", value=True)
analyze_high_y = st.checkbox("High y Expression", value=False)
analyze_alt_low = st.checkbox("Alternate Low Expression", value=False)
if st.button("Compute Differentials", key="tab3_button"):
with col2:
betas_diff, lower_vals, upper_vals = sweep_beta_and_find_z_bounds(z_a_diff, y_diff, z_min_diff, z_max_diff, beta_steps_diff, z_steps_diff)
# Create figure
fig_diff = go.Figure()
if analyze_upper_lower:
diff_curve = upper_vals - lower_vals
d1 = np.gradient(diff_curve, betas_diff)
d2 = np.gradient(d1, betas_diff)
fig_diff.add_trace(go.Scatter(x=betas_diff, y=diff_curve, mode="lines",
name="Upper-Lower Difference", line=dict(color="magenta", width=2)))
fig_diff.add_trace(go.Scatter(x=betas_diff, y=d1, mode="lines",
name="Upper-Lower d/dβ", line=dict(color="magenta", dash='dash')))
fig_diff.add_trace(go.Scatter(x=betas_diff, y=d2, mode="lines",
name="Upper-Lower d²/dβ²", line=dict(color="magenta", dash='dot')))
if analyze_high_y:
high_y_curve = compute_high_y_curve(betas_diff, z_a_diff, y_diff)
d1 = np.gradient(high_y_curve, betas_diff)
d2 = np.gradient(d1, betas_diff)
fig_diff.add_trace(go.Scatter(x=betas_diff, y=high_y_curve, mode="lines",
name="High y", line=dict(color="green", width=2)))
fig_diff.add_trace(go.Scatter(x=betas_diff, y=d1, mode="lines",
name="High y d/dβ", line=dict(color="green", dash='dash')))
fig_diff.add_trace(go.Scatter(x=betas_diff, y=d2, mode="lines",
name="High y d²/dβ²", line=dict(color="green", dash='dot')))
if analyze_alt_low:
alt_low_curve = compute_alternate_low_expr(betas_diff, z_a_diff, y_diff)
d1 = np.gradient(alt_low_curve, betas_diff)
d2 = np.gradient(d1, betas_diff)
fig_diff.add_trace(go.Scatter(x=betas_diff, y=alt_low_curve, mode="lines",
name="Alt Low", line=dict(color="orange", width=2)))
fig_diff.add_trace(go.Scatter(x=betas_diff, y=d1, mode="lines",
name="Alt Low d/dβ", line=dict(color="orange", dash='dash')))
fig_diff.add_trace(go.Scatter(x=betas_diff, y=d2, mode="lines",
name="Alt Low d²/dβ²", line=dict(color="orange", dash='dot')))
fig_diff.update_layout(
title="Differential Analysis vs. β",
xaxis_title="β",
yaxis_title="Value",
hovermode="x unified",
showlegend=True,
legend=dict(
yanchor="top",
y=0.99,
xanchor="left",
x=0.01
)
)
st.plotly_chart(fig_diff, use_container_width=True)
st.markdown("""
### Curve Types
- Solid lines: Original curves
- Dashed lines: First derivatives (d/dβ)
- Dotted lines: Second derivatives (d²/dβ²)
""")