Sasidhar committed on
Commit
e8c4461
·
1 Parent(s): e842846

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +15 -8
app.py CHANGED
@@ -133,7 +133,7 @@ def create_component_for_analysis_for_single_df(selected_files, dfs, i):
133
 
134
  analysis_actions = st.multiselect("What analysis do you wish to do?",
135
  ['Summary of Data', 'Sample Data','Get Profile' ,'Univariate Analysis',
136
- 'Bivariate Analysis','Add a Target Column'], key='analysis_action_' + str(i))
137
  if analysis_actions:
138
 
139
  df_for_analysis = st.session_state['filtered_data'][selected_files[i]] if filter_data else df
@@ -195,13 +195,20 @@ def create_component_for_analysis_for_single_df(selected_files, dfs, i):
195
 
196
  st.plotly_chart(fig, use_container_width=True)
197
 
198
- elif action == "Add a Target Column":
199
- # create_component_to_add_target_func(selected_files, dfs, i)
200
- code= "def f1(x): return str(x * 3)"
201
- exec(code)
202
- st.write(f1(3))
203
-
204
-
 
 
 
 
 
 
 
205
  def create_component_for_data_analysis():
206
  if 'data_files' in st.session_state:
207
 
 
133
 
134
  analysis_actions = st.multiselect("What analysis do you wish to do?",
135
  ['Summary of Data', 'Sample Data','Get Profile' ,'Univariate Analysis',
136
+ 'Bivariate Analysis'], key='analysis_action_' + str(i))
137
  if analysis_actions:
138
 
139
  df_for_analysis = st.session_state['filtered_data'][selected_files[i]] if filter_data else df
 
195
 
196
  st.plotly_chart(fig, use_container_width=True)
197
 
198
+ elif action == "Bivariate Analysis":
199
+ create_for_bivariate_analysis(selected_files, df, i)
200
+
201
def create_for_bivariate_analysis(selected_files, df, i):
    """Render the bivariate-analysis widgets for one data frame.

    Shows a select box for the target column and a multiselect for the
    columns to compare against it, then writes one frequency
    cross-tabulation (including row/column totals) per chosen column.

    Args:
        selected_files: Not used in this function; kept so the signature
            matches the existing call site.
        df: pandas DataFrame whose columns are offered in the widgets and
            cross-tabulated.
        i: Index appended to the widget keys so each data frame gets its
            own widget state.
    """
    target_column = st.selectbox(
        "Select the target column ",
        df.columns.values,
        key="bivariate_target_column_" + str(i),
    )
    bivariate_columns = st.multiselect(
        "Select the columns to analyse ",
        df.columns.values,
        key="bivariate_analysis_columns_" + str(i),
    )
    for col in bivariate_columns:
        # pd.crosstab computes a frequency table by default. Passing
        # `aggfunc` without `values` raises ValueError, so it is omitted.
        # To aggregate something other than counts (e.g. based on the
        # column type), pass both `values=` and `aggfunc=` together.
        st.write(pd.crosstab(df[col], df[target_column], margins=True))
209
+
210
+
211
+
212
  def create_component_for_data_analysis():
213
  if 'data_files' in st.session_state:
214