import argparse from pathlib import Path import yaml from wandb_utils import WandbLogger from utils.datasets import LoadImagesAndLabels WANDB_ARTIFACT_PREFIX = 'wandb-artifact://' def create_dataset_artifact(opt): with open(opt.data) as f: data = yaml.load(f, Loader=yaml.SafeLoader) # data dict logger = WandbLogger(opt, '', None, data, job_type='create_dataset') nc, names = (1, ['item']) if opt.single_cls else (int(data['nc']), data['names']) names = {k: v for k, v in enumerate(names)} # to index dictionary logger.log_dataset_artifact(LoadImagesAndLabels(data['train']), names, name='train') # trainset logger.log_dataset_artifact(LoadImagesAndLabels(data['val']), names, name='val') # valset # Update data.yaml with artifact links data['train'] = WANDB_ARTIFACT_PREFIX + str(Path(opt.project) / 'train') data['val'] = WANDB_ARTIFACT_PREFIX + str(Path(opt.project) / 'val') path = opt.data if opt.overwrite_config else opt.data.replace('.', '_wandb.') # updated data.yaml path data.pop('download', None) # download via artifact instead of predefined field 'download:' with open(path, 'w') as f: yaml.dump(data, f) print("New Config file => ", path) if __name__ == '__main__': parser = argparse.ArgumentParser() parser.add_argument('--data', type=str, default='data/coco128.yaml', help='data.yaml path') parser.add_argument('--single-cls', action='store_true', help='train as single-class dataset') parser.add_argument('--project', type=str, default='YOLOv5', help='name of W&B Project') parser.add_argument('--overwrite_config', action='store_true', help='overwrite data.yaml') opt = parser.parse_args() create_dataset_artifact(opt)