bkb2135 committed on
Commit
19192aa
·
1 Parent(s): 2cec71e

Track large file with Git LFS

Browse files
Files changed (3) hide show
  1. .gitattributes +1 -0
  2. data/wandb/tzebw6rb.parquet +3 -0
  3. utils.py +5 -4
.gitattributes ADDED
@@ -0,0 +1 @@
 
 
1
+ data/wandb/tzebw6rb.parquet filter=lfs diff=lfs merge=lfs -text
data/wandb/tzebw6rb.parquet ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:97537f22180da6992b01c2ba7566fabc7c265d27c2c317eda2a191d52e08b843
3
+ size 13624028
utils.py CHANGED
@@ -136,11 +136,12 @@ def load_downloaded_runs(time, cols=KEYS):
136
  'date-based question answering': 'date_qa',
137
  'question-answering': 'qa',
138
  }
139
- if 'task' in df_all.columns:
140
- df_all.task = df_all.task.apply(lambda x: task_mapping.get(x, x))
 
141
 
142
  # Runs which do not have a turn field are imputed to be turn zero (single turn)
143
- df_all.turn.fillna(0, inplace=True)
144
 
145
  df_all.sort_values(by=['_timestamp'], inplace=True)
146
 
@@ -230,7 +231,7 @@ def download_runs(time, df_vali):
230
  continue
231
 
232
  try:
233
- pbar.set_description(f'* Downloading run {row.run_id!r}', flush=True)
234
  run = api.run(row.run_path)
235
 
236
  # By default we just download a subset of events (500 most recent)
 
136
  'date-based question answering': 'date_qa',
137
  'question-answering': 'qa',
138
  }
139
+
140
+ df_all['task'] = df_all.task.apply(lambda x: task_mapping.get(x, x))
141
+
142
 
143
  # Runs which do not have a turn field are imputed to be turn zero (single turn)
144
+ df_all['turn'] = df_all.turn.fillna(0)
145
 
146
  df_all.sort_values(by=['_timestamp'], inplace=True)
147
 
 
231
  continue
232
 
233
  try:
234
+ pbar.set_description(f'* Downloading run {row.run_id!r}')
235
  run = api.run(row.run_path)
236
 
237
  # By default we just download a subset of events (500 most recent)