File size: 1,750 Bytes
73a0669
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
import argparse
from pathlib import Path

import yaml

from wandb_utils import WandbLogger
from utils.datasets import LoadImagesAndLabels

WANDB_ARTIFACT_PREFIX = 'wandb-artifact://'


def create_dataset_artifact(opt):
    with open(opt.data) as f:
        data = yaml.load(f, Loader=yaml.SafeLoader)  # data dict
    logger = WandbLogger(opt, '', None, data, job_type='create_dataset')
    nc, names = (1, ['item']) if opt.single_cls else (int(data['nc']), data['names'])
    names = {k: v for k, v in enumerate(names)}  # to index dictionary
    logger.log_dataset_artifact(LoadImagesAndLabels(data['train']), names, name='train')  # trainset
    logger.log_dataset_artifact(LoadImagesAndLabels(data['val']), names, name='val')  # valset

    # Update data.yaml with artifact links
    data['train'] = WANDB_ARTIFACT_PREFIX + str(Path(opt.project) / 'train')
    data['val'] = WANDB_ARTIFACT_PREFIX + str(Path(opt.project) / 'val')
    path = opt.data if opt.overwrite_config else opt.data.replace('.', '_wandb.')  # updated data.yaml path
    data.pop('download', None)  # download via artifact instead of predefined field 'download:'
    with open(path, 'w') as f:
        yaml.dump(data, f)
    print("New Config file => ", path)


if __name__ == '__main__':
    parser = argparse.ArgumentParser()
    parser.add_argument('--data', type=str, default='data/coco128.yaml', help='data.yaml path')
    parser.add_argument('--single-cls', action='store_true', help='train as single-class dataset')
    parser.add_argument('--project', type=str, default='YOLOv5', help='name of W&B Project')
    parser.add_argument('--overwrite_config', action='store_true', help='overwrite data.yaml')
    opt = parser.parse_args()

    create_dataset_artifact(opt)