Spaces:
Sleeping
Sleeping
bkb2135
committed on
Commit
·
19192aa
1
Parent(s):
2cec71e
Track large file with Git LFS
Browse files
- .gitattributes +1 -0
- data/wandb/tzebw6rb.parquet +3 -0
- utils.py +5 -4
.gitattributes
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
data/wandb/tzebw6rb.parquet filter=lfs diff=lfs merge=lfs -text
|
data/wandb/tzebw6rb.parquet
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:97537f22180da6992b01c2ba7566fabc7c265d27c2c317eda2a191d52e08b843
|
| 3 |
+
size 13624028
|
utils.py
CHANGED
|
@@ -136,11 +136,12 @@ def load_downloaded_runs(time, cols=KEYS):
|
|
| 136 |
'date-based question answering': 'date_qa',
|
| 137 |
'question-answering': 'qa',
|
| 138 |
}
|
| 139 |
-
|
| 140 |
-
|
|
|
|
| 141 |
|
| 142 |
# Runs which do not have a turn field are imputed to be turn zero (single turn)
|
| 143 |
-
df_all.turn.fillna(0
|
| 144 |
|
| 145 |
df_all.sort_values(by=['_timestamp'], inplace=True)
|
| 146 |
|
|
@@ -230,7 +231,7 @@ def download_runs(time, df_vali):
|
|
| 230 |
continue
|
| 231 |
|
| 232 |
try:
|
| 233 |
-
pbar.set_description(f'* Downloading run {row.run_id!r}'
|
| 234 |
run = api.run(row.run_path)
|
| 235 |
|
| 236 |
# By default we just download a subset of events (500 most recent)
|
|
|
|
| 136 |
'date-based question answering': 'date_qa',
|
| 137 |
'question-answering': 'qa',
|
| 138 |
}
|
| 139 |
+
|
| 140 |
+
df_all['task'] = df_all.task.apply(lambda x: task_mapping.get(x, x))
|
| 141 |
+
|
| 142 |
|
| 143 |
# Runs which do not have a turn field are imputed to be turn zero (single turn)
|
| 144 |
+
df_all['turn'] = df_all.turn.fillna(0)
|
| 145 |
|
| 146 |
df_all.sort_values(by=['_timestamp'], inplace=True)
|
| 147 |
|
|
|
|
| 231 |
continue
|
| 232 |
|
| 233 |
try:
|
| 234 |
+
pbar.set_description(f'* Downloading run {row.run_id!r}')
|
| 235 |
run = api.run(row.run_path)
|
| 236 |
|
| 237 |
# By default we just download a subset of events (500 most recent)
|