Spaces:
Running
Running
import argparse | |
from pathlib import Path | |
import yaml | |
from wandb_utils import WandbLogger | |
from utils.datasets import LoadImagesAndLabels | |
WANDB_ARTIFACT_PREFIX = 'wandb-artifact://' | |
def create_dataset_artifact(opt): | |
with open(opt.data) as f: | |
data = yaml.load(f, Loader=yaml.SafeLoader) # data dict | |
logger = WandbLogger(opt, '', None, data, job_type='create_dataset') | |
nc, names = (1, ['item']) if opt.single_cls else (int(data['nc']), data['names']) | |
names = {k: v for k, v in enumerate(names)} # to index dictionary | |
logger.log_dataset_artifact(LoadImagesAndLabels(data['train']), names, name='train') # trainset | |
logger.log_dataset_artifact(LoadImagesAndLabels(data['val']), names, name='val') # valset | |
# Update data.yaml with artifact links | |
data['train'] = WANDB_ARTIFACT_PREFIX + str(Path(opt.project) / 'train') | |
data['val'] = WANDB_ARTIFACT_PREFIX + str(Path(opt.project) / 'val') | |
path = opt.data if opt.overwrite_config else opt.data.replace('.', '_wandb.') # updated data.yaml path | |
data.pop('download', None) # download via artifact instead of predefined field 'download:' | |
with open(path, 'w') as f: | |
yaml.dump(data, f) | |
print("New Config file => ", path) | |
if __name__ == '__main__': | |
parser = argparse.ArgumentParser() | |
parser.add_argument('--data', type=str, default='data/coco128.yaml', help='data.yaml path') | |
parser.add_argument('--single-cls', action='store_true', help='train as single-class dataset') | |
parser.add_argument('--project', type=str, default='YOLOv5', help='name of W&B Project') | |
parser.add_argument('--overwrite_config', action='store_true', help='overwrite data.yaml') | |
opt = parser.parse_args() | |
create_dataset_artifact(opt) | |