Spaces:
Paused
Paused
Merge pull request #11 from opentensor/alpha-validators
Browse files
- dashboard.py +9 -8
- opendashboards/assets/inspect.py +7 -0
- opendashboards/assets/io.py +4 -2
- opendashboards/assets/metric.py +1 -2
- opendashboards/utils/plotting.py +1 -1
dashboard.py
CHANGED
@@ -8,7 +8,7 @@ from opendashboards.assets import io, inspect, metric, plot
|
|
8 |
# cache individual file loads
|
9 |
# Hotkey churn
|
10 |
|
11 |
-
DEFAULT_PROJECT = "
|
12 |
DEFAULT_FILTERS = {"tags": {"$in": [f'1.1.{i}' for i in range(10)]}}
|
13 |
DEFAULT_SELECTED_HOTKEYS = None
|
14 |
DEFAULT_SRC = 'followup'
|
@@ -23,7 +23,7 @@ st.set_page_config(
|
|
23 |
'About': """
|
24 |
This dashboard is part of the OpenTensor project. \n
|
25 |
To see runs in wandb, go to: \n
|
26 |
-
https://wandb.ai/opentensor-dev/
|
27 |
"""
|
28 |
},
|
29 |
layout = "centered"
|
@@ -82,7 +82,8 @@ with tab1:
|
|
82 |
st.dataframe(df_long.head(num_rows) if use_long_checkbox else df.head(num_rows),
|
83 |
use_container_width=True)
|
84 |
|
85 |
-
step_types = ['all']+['augment','followup','answer']#list(df.name.unique())
|
|
|
86 |
|
87 |
### UID Health ###
|
88 |
# TODO: Live time - time elapsed since moving_averaged_score for selected UID was 0 (lower bound so use >Time)
|
@@ -93,8 +94,8 @@ with tab2:
|
|
93 |
st.subheader("UID :violet[Health]")
|
94 |
st.info(f"Showing UID health metrics for **{n_runs} selected runs**")
|
95 |
|
96 |
-
uid_src = st.radio('Select
|
97 |
-
df_uid = df_long[df_long.
|
98 |
|
99 |
metric.uids(df_uid, uid_src)
|
100 |
uids = st.multiselect('UID:', sorted(df_uid['uids'].unique()), key='uid')
|
@@ -154,8 +155,8 @@ with tab3:
|
|
154 |
|
155 |
msg_col1, msg_col2 = st.columns(2)
|
156 |
# completion_src = msg_col1.radio('Select one:', ['followup', 'answer'], horizontal=True, key='completion_src')
|
157 |
-
completion_src = st.radio('Select
|
158 |
-
df_comp = df_long[df_long.
|
159 |
|
160 |
completion_info.info(f"Showing **{completion_src}** completions for **{n_runs} selected runs**")
|
161 |
|
@@ -204,7 +205,7 @@ with tab3:
|
|
204 |
df_comp,
|
205 |
completion_col='completions',
|
206 |
uid_col='uids',
|
207 |
-
time_col='
|
208 |
length_opt=completion_length_radio,
|
209 |
)
|
210 |
|
|
|
8 |
# cache individual file loads
|
9 |
# Hotkey churn
|
10 |
|
11 |
+
DEFAULT_PROJECT = "alpha-validators"
|
12 |
DEFAULT_FILTERS = {"tags": {"$in": [f'1.1.{i}' for i in range(10)]}}
|
13 |
DEFAULT_SELECTED_HOTKEYS = None
|
14 |
DEFAULT_SRC = 'followup'
|
|
|
23 |
'About': """
|
24 |
This dashboard is part of the OpenTensor project. \n
|
25 |
To see runs in wandb, go to: \n
|
26 |
+
https://wandb.ai/opentensor-dev/alpha-validators/table?workspace=default
|
27 |
"""
|
28 |
},
|
29 |
layout = "centered"
|
|
|
82 |
st.dataframe(df_long.head(num_rows) if use_long_checkbox else df.head(num_rows),
|
83 |
use_container_width=True)
|
84 |
|
85 |
+
# step_types = ['all']+['augment','followup','answer']#list(df.name.unique())
|
86 |
+
step_types = ['all']+list(df.task.unique())
|
87 |
|
88 |
### UID Health ###
|
89 |
# TODO: Live time - time elapsed since moving_averaged_score for selected UID was 0 (lower bound so use >Time)
|
|
|
94 |
st.subheader("UID :violet[Health]")
|
95 |
st.info(f"Showing UID health metrics for **{n_runs} selected runs**")
|
96 |
|
97 |
+
uid_src = st.radio('Select task type:', step_types, horizontal=True, key='uid_src')
|
98 |
+
df_uid = df_long[df_long.task.str.contains(uid_src)] if uid_src != 'all' else df_long
|
99 |
|
100 |
metric.uids(df_uid, uid_src)
|
101 |
uids = st.multiselect('UID:', sorted(df_uid['uids'].unique()), key='uid')
|
|
|
155 |
|
156 |
msg_col1, msg_col2 = st.columns(2)
|
157 |
# completion_src = msg_col1.radio('Select one:', ['followup', 'answer'], horizontal=True, key='completion_src')
|
158 |
+
completion_src = st.radio('Select task type:', step_types, horizontal=True, key='completion_src')
|
159 |
+
df_comp = df_long[df_long.task.str.contains(completion_src)] if completion_src != 'all' else df_long
|
160 |
|
161 |
completion_info.info(f"Showing **{completion_src}** completions for **{n_runs} selected runs**")
|
162 |
|
|
|
205 |
df_comp,
|
206 |
completion_col='completions',
|
207 |
uid_col='uids',
|
208 |
+
time_col='timings',
|
209 |
length_opt=completion_length_radio,
|
210 |
)
|
211 |
|
opendashboards/assets/inspect.py
CHANGED
@@ -4,6 +4,13 @@ import pandas as pd
|
|
4 |
import opendashboards.utils.utils as utils
|
5 |
|
6 |
def clean_data(df):
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
7 |
return df.dropna(subset=df.filter(regex='completions|rewards').columns, how='any')
|
8 |
|
9 |
@st.cache_data
|
|
|
4 |
import opendashboards.utils.utils as utils
|
5 |
|
6 |
def clean_data(df):
|
7 |
+
task_map = {
|
8 |
+
'question-answering': 'QA',
|
9 |
+
'summarization': 'Summarization',
|
10 |
+
'date-based question answering': 'Date QA',
|
11 |
+
'math': 'Math'
|
12 |
+
}
|
13 |
+
df['task'] = df.task.map(task_map)
|
14 |
return df.dropna(subset=df.filter(regex='completions|rewards').columns, how='any')
|
15 |
|
16 |
@st.cache_data
|
opendashboards/assets/io.py
CHANGED
@@ -39,7 +39,7 @@ def load_runs(project, filters, min_steps=10):
|
|
39 |
rules = {'hotkey': re.compile('^[0-9a-z]{48}$',re.IGNORECASE), 'version': re.compile('^\\d\.\\d+\.\\d+$'), 'spec_version': re.compile('\\d{4}$')}
|
40 |
tags = {k: tag for k, rule in rules.items() for tag in run.tags if rule.match(tag)}
|
41 |
# include bool flag for remaining tags
|
42 |
-
tags.update({k: k in run.tags for k in ('mock','
|
43 |
|
44 |
runs.append({
|
45 |
'state': run.state,
|
@@ -61,7 +61,9 @@ def load_runs(project, filters, min_steps=10):
|
|
61 |
|
62 |
progress.empty()
|
63 |
msg.empty()
|
64 |
-
|
|
|
|
|
65 |
|
66 |
|
67 |
@st.cache_data
|
|
|
39 |
rules = {'hotkey': re.compile('^[0-9a-z]{48}$',re.IGNORECASE), 'version': re.compile('^\\d\.\\d+\.\\d+$'), 'spec_version': re.compile('\\d{4}$')}
|
40 |
tags = {k: tag for k, rule in rules.items() for tag in run.tags if rule.match(tag)}
|
41 |
# include bool flag for remaining tags
|
42 |
+
tags.update({k: k in run.tags for k in ('mock','disable_set_weights')})
|
43 |
|
44 |
runs.append({
|
45 |
'state': run.state,
|
|
|
61 |
|
62 |
progress.empty()
|
63 |
msg.empty()
|
64 |
+
frame = pd.DataFrame(runs)
|
65 |
+
mappings = {'state': 'category', 'hotkey': 'category', 'version': 'category', 'spec_version': 'category'}
|
66 |
+
return frame.astype({k:v for k,v in mappings.items() if k in frame.columns})
|
67 |
|
68 |
|
69 |
@st.cache_data
|
opendashboards/assets/metric.py
CHANGED
@@ -44,8 +44,7 @@ def runs(df_long):
|
|
44 |
col3.metric('Events', fmt(df_long.groupby(['run_id','_step']).ngroups))
|
45 |
col4.metric('Completions', fmt(df_long.shape[0]))
|
46 |
|
47 |
-
|
48 |
-
aggs = df_long.groupby(name_type).agg({'uids': 'nunique', 'completions': 'nunique'})
|
49 |
print(aggs)
|
50 |
for i,c in enumerate(st.columns(len(aggs))):
|
51 |
name = aggs.index[i].title()
|
|
|
44 |
col3.metric('Events', fmt(df_long.groupby(['run_id','_step']).ngroups))
|
45 |
col4.metric('Completions', fmt(df_long.shape[0]))
|
46 |
|
47 |
+
aggs = df_long.groupby('task').agg({'uids': 'nunique', 'completions': 'nunique'})
|
|
|
48 |
print(aggs)
|
49 |
for i,c in enumerate(st.columns(len(aggs))):
|
50 |
name = aggs.index[i].title()
|
opendashboards/utils/plotting.py
CHANGED
@@ -310,7 +310,7 @@ def plot_completion_length_time(
|
|
310 |
df: pd.DataFrame,
|
311 |
uid_col: str = "uids",
|
312 |
completion_col: str = "completions",
|
313 |
-
time_col: str = "
|
314 |
uids: List[int] = None,
|
315 |
length_opt: str = 'characters',
|
316 |
) -> go.Figure:
|
|
|
310 |
df: pd.DataFrame,
|
311 |
uid_col: str = "uids",
|
312 |
completion_col: str = "completions",
|
313 |
+
time_col: str = "timings",
|
314 |
uids: List[int] = None,
|
315 |
length_opt: str = 'characters',
|
316 |
) -> go.Figure:
|