Spaces:
Sleeping
Sleeping
bkb2135
committed on
Commit
·
19192aa
1
Parent(s):
2cec71e
Track large file with Git LFS
Browse files
- .gitattributes +1 -0
- data/wandb/tzebw6rb.parquet +3 -0
- utils.py +5 -4
.gitattributes
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
data/wandb/tzebw6rb.parquet filter=lfs diff=lfs merge=lfs -text
|
data/wandb/tzebw6rb.parquet
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:97537f22180da6992b01c2ba7566fabc7c265d27c2c317eda2a191d52e08b843
|
3 |
+
size 13624028
|
utils.py
CHANGED
@@ -136,11 +136,12 @@ def load_downloaded_runs(time, cols=KEYS):
|
|
136 |
'date-based question answering': 'date_qa',
|
137 |
'question-answering': 'qa',
|
138 |
}
|
139 |
-
|
140 |
-
|
|
|
141 |
|
142 |
# Runs which do not have a turn field are imputed to be turn zero (single turn)
|
143 |
-
df_all.turn.fillna(0
|
144 |
|
145 |
df_all.sort_values(by=['_timestamp'], inplace=True)
|
146 |
|
@@ -230,7 +231,7 @@ def download_runs(time, df_vali):
|
|
230 |
continue
|
231 |
|
232 |
try:
|
233 |
-
pbar.set_description(f'* Downloading run {row.run_id!r}'
|
234 |
run = api.run(row.run_path)
|
235 |
|
236 |
# By default we just download a subset of events (500 most recent)
|
|
|
136 |
'date-based question answering': 'date_qa',
|
137 |
'question-answering': 'qa',
|
138 |
}
|
139 |
+
|
140 |
+
df_all['task'] = df_all.task.apply(lambda x: task_mapping.get(x, x))
|
141 |
+
|
142 |
|
143 |
# Runs which do not have a turn field are imputed to be turn zero (single turn)
|
144 |
+
df_all['turn'] = df_all.turn.fillna(0)
|
145 |
|
146 |
df_all.sort_values(by=['_timestamp'], inplace=True)
|
147 |
|
|
|
231 |
continue
|
232 |
|
233 |
try:
|
234 |
+
pbar.set_description(f'* Downloading run {row.run_id!r}')
|
235 |
run = api.run(row.run_path)
|
236 |
|
237 |
# By default we just download a subset of events (500 most recent)
|