"""Prepare Cityscapes dataset""" import os import sys import argparse import zipfile # TODO: optim code cur_path = os.path.abspath(os.path.dirname(__file__)) root_path = os.path.split(os.path.split(os.path.split(cur_path)[0])[0])[0] sys.path.append(root_path) from core.utils import download, makedirs, check_sha1 _TARGET_DIR = os.path.expanduser('~/.torch/datasets/citys') def parse_args(): parser = argparse.ArgumentParser( description='Initialize ADE20K dataset.', epilog='Example: python prepare_cityscapes.py', formatter_class=argparse.ArgumentDefaultsHelpFormatter) parser.add_argument('--download-dir', default=None, help='dataset directory on disk') args = parser.parse_args() return args def download_city(path, overwrite=False): _CITY_DOWNLOAD_URLS = [ ('gtFine_trainvaltest.zip', '99f532cb1af174f5fcc4c5bc8feea8c66246ddbc'), ('leftImg8bit_trainvaltest.zip', '2c0b77ce9933cc635adda307fbba5566f5d9d404')] download_dir = os.path.join(path, 'downloads') makedirs(download_dir) for filename, checksum in _CITY_DOWNLOAD_URLS: if not check_sha1(filename, checksum): raise UserWarning('File {} is downloaded but the content hash does not match. ' \ 'The repo may be outdated or download may be incomplete. ' \ 'If the "repo_url" is overridden, consider switching to ' \ 'the default repo.'.format(filename)) # extract with zipfile.ZipFile(filename, "r") as zip_ref: zip_ref.extractall(path=path) print("Extracted", filename) if __name__ == '__main__': args = parse_args() makedirs(os.path.expanduser('~/.torch/datasets')) if args.download_dir is not None: if os.path.isdir(_TARGET_DIR): os.remove(_TARGET_DIR) # make symlink os.symlink(args.download_dir, _TARGET_DIR) else: download_city(_TARGET_DIR, overwrite=False)