Spaces:
Sleeping
Sleeping
bkb2135
committed on
Commit
·
be32e3b
1
Parent(s):
05503d0
Squash Bugs
Browse files
app.py
CHANGED
|
@@ -141,5 +141,7 @@ st.subheader('Logged runs')
|
|
| 141 |
# use_container_width=True
|
| 142 |
# )
|
| 143 |
|
|
|
|
|
|
|
| 144 |
with st.expander('Show raw run data'):
|
| 145 |
st.dataframe(df_runs)
|
|
|
|
| 141 |
# use_container_width=True
|
| 142 |
# )
|
| 143 |
|
| 144 |
+
|
| 145 |
+
df_runs['spec_version'] = df_runs['spec_version'].astype('int64')
|
| 146 |
with st.expander('Show raw run data'):
|
| 147 |
st.dataframe(df_runs)
|
utils.py
CHANGED
|
@@ -22,10 +22,7 @@ KEYS = ['_step','_timestamp','task','query','reference','challenge','topic','sub
|
|
| 22 |
ABBREV_CHARS = 8
|
| 23 |
ENTITY_CHOICES = ('identity', 'hotkey', 'coldkey')
|
| 24 |
LOCAL_WANDB_PATH = './data/wandb'
|
| 25 |
-
USERNAME = '
|
| 26 |
-
|
| 27 |
-
# Set the WANDB_API_KEY environment variable to 'anonymous'
|
| 28 |
-
os.environ["WANDB_API_KEY"] = "anonymous"
|
| 29 |
|
| 30 |
# Initialize wandb with anonymous login
|
| 31 |
wandb.login(anonymous='must')
|
|
@@ -142,8 +139,8 @@ def load_downloaded_runs(time, cols=KEYS):
|
|
| 142 |
'question-answering': 'qa',
|
| 143 |
}
|
| 144 |
|
| 145 |
-
# Runs which do not have a turn field are imputed to be turn zero (single turn)
|
| 146 |
-
df_all.turn.fillna(0, inplace=True)
|
| 147 |
|
| 148 |
df_all.sort_values(by=['_timestamp'], inplace=True)
|
| 149 |
# Check if df_all has the task columns
|
|
@@ -230,12 +227,15 @@ def download_runs(time, df_vali):
|
|
| 230 |
progress.progress(i/len(df_vali), text=f'{prog_msg}... **downloading** `{os.path.join(*row.run_id)}`')
|
| 231 |
|
| 232 |
save_path = f'data/wandb/{row.run_id}.parquet'
|
|
|
|
|
|
|
|
|
|
| 233 |
if os.path.exists(save_path):
|
| 234 |
pbar.set_description(f'>> Skipping {row.run_id!r} because file {save_path!r} already exists')
|
| 235 |
continue
|
| 236 |
|
| 237 |
try:
|
| 238 |
-
pbar.set_description(f'* Downloading run {row.run_id!r}'
|
| 239 |
run = api.run(row.run_path)
|
| 240 |
|
| 241 |
# By default we just download a subset of events (500 most recent)
|
|
|
|
| 22 |
ABBREV_CHARS = 8
|
| 23 |
ENTITY_CHOICES = ('identity', 'hotkey', 'coldkey')
|
| 24 |
LOCAL_WANDB_PATH = './data/wandb'
|
| 25 |
+
USERNAME = 'login19861986'
|
|
|
|
|
|
|
|
|
|
| 26 |
|
| 27 |
# Initialize wandb with anonymous login
|
| 28 |
wandb.login(anonymous='must')
|
|
|
|
| 139 |
'question-answering': 'qa',
|
| 140 |
}
|
| 141 |
|
| 142 |
+
# # Runs which do not have a turn field are imputed to be turn zero (single turn)
|
| 143 |
+
# df_all.turn.fillna(0, inplace=True)
|
| 144 |
|
| 145 |
df_all.sort_values(by=['_timestamp'], inplace=True)
|
| 146 |
# Check if df_all has the task columns
|
|
|
|
| 227 |
progress.progress(i/len(df_vali), text=f'{prog_msg}... **downloading** `{os.path.join(*row.run_id)}`')
|
| 228 |
|
| 229 |
save_path = f'data/wandb/{row.run_id}.parquet'
|
| 230 |
+
# Create the directory if it does not exist
|
| 231 |
+
os.makedirs(os.path.dirname(save_path), exist_ok=True)
|
| 232 |
+
|
| 233 |
if os.path.exists(save_path):
|
| 234 |
pbar.set_description(f'>> Skipping {row.run_id!r} because file {save_path!r} already exists')
|
| 235 |
continue
|
| 236 |
|
| 237 |
try:
|
| 238 |
+
pbar.set_description(f'* Downloading run {row.run_id!r}')
|
| 239 |
run = api.run(row.run_path)
|
| 240 |
|
| 241 |
# By default we just download a subset of events (500 most recent)
|