Spaces:

Tonic
/

SmolFactory

Running

App Files Community

Tonic committed 20 days ago

Commit

a509b8b

1 Parent(s): c560f4f

adds steps logging + parsing - woops

Browse files

Files changed (2) hide show

src/monitoring.py +14 -0
templates/spaces/trackio/app.py +20 -2

src/monitoring.py CHANGED Viewed

@@ -449,6 +449,20 @@ class SmolLM3Monitor:
         try:
             # Add timestamp
             metrics['timestamp'] = datetime.now().isoformat()
             if step is not None:
                 metrics['step'] = step

         try:
             # Add timestamp
             metrics['timestamp'] = datetime.now().isoformat()
+            # If caller didn't provide step, try to infer it from common keys emitted by HF/TRL
+            if step is None:
+                try:
+                    for step_key in (
+                        'global_step',
+                        'train/global_step',
+                        'step',
+                        'train/step',
+                    ):
+                        if step_key in metrics and metrics[step_key] is not None:
+                            step = int(metrics[step_key])
+                            break
+                except Exception:
+                    step = step  # keep None if parsing fails
             if step is not None:
                 metrics['step'] = step

templates/spaces/trackio/app.py CHANGED Viewed

@@ -1146,7 +1146,17 @@ def create_metrics_plot(experiment_id: str, metric_name: str = "loss") -> go.Fig
         # Ensure steps are numeric and monotonically increasing to avoid zig-zag lines
         try:
             df = df.copy()
-            df['step'] = pd.to_numeric(df['step'], errors='coerce').fillna(-1)
             df.sort_values('step', inplace=True)
         except Exception:
             pass
@@ -1546,7 +1556,15 @@ def create_combined_metrics_plot(experiment_id: str) -> go.Figure:
                 # Clean steps for each subplot too
                 try:
                     df_sub = df.copy()
-                    df_sub['step'] = pd.to_numeric(df_sub['step'], errors='coerce').fillna(-1)
                     df_sub.sort_values('step', inplace=True)
                 except Exception:
                     df_sub = df

         # Ensure steps are numeric and monotonically increasing to avoid zig-zag lines
         try:
             df = df.copy()
+            # If step looks constant or missing, try to derive it from a common field
+            if 'step' not in df or df['step'].nunique() <= 1:
+                for alt in ['train/global_step', 'global_step', 'train/step']:
+                    if alt in df.columns and df[alt].notna().any():
+                        df['step'] = pd.to_numeric(df[alt], errors='coerce')
+                        break
+            # If still missing or constant, fallback to an inferred counter by order of arrival
+            if 'step' not in df.columns or df['step'].isna().all() or df['step'].nunique() <= 1:
+                df['step'] = range(1, len(df) + 1)
+            else:
+                df['step'] = pd.to_numeric(df.get('step', -1), errors='coerce').fillna(-1)
             df.sort_values('step', inplace=True)
         except Exception:
             pass
                 # Clean steps for each subplot too
                 try:
                     df_sub = df.copy()
+                    if 'step' not in df_sub or df_sub['step'].nunique() <= 1:
+                        for alt in ['train/global_step', 'global_step', 'train/step']:
+                            if alt in df_sub.columns and df_sub[alt].notna().any():
+                                df_sub['step'] = pd.to_numeric(df_sub[alt], errors='coerce')
+                                break
+                    if 'step' not in df_sub.columns or df_sub['step'].isna().all() or df_sub['step'].nunique() <= 1:
+                        df_sub['step'] = range(1, len(df_sub) + 1)
+                    else:
+                        df_sub['step'] = pd.to_numeric(df_sub.get('step', -1), errors='coerce').fillna(-1)
                     df_sub.sort_values('step', inplace=True)
                 except Exception:
                     df_sub = df