# Copyright (c) OpenMMLab. All rights reserved.
import argparse
import os
import os.path as osp
import tempfile
import zipfile

import mmcv
from mmengine.utils import mkdir_or_exist
# Number of entries expected in the extracted archive; main() refuses to
# continue when the count differs.
# NOTE(review): presumably 28 images x 3 files each (one .jpg plus two
# annotation images) -- confirm against the dataset.
CHASE_DB1_LEN = 28 * 3

# Number of entries, taken from the front of the name-sorted file list, that
# go to the training split; the remaining entries form the validation split.
TRAINING_LEN = 60
def parse_args(argv=None):
    """Parse the command-line options of the CHASE_DB1 converter.

    Args:
        argv (list[str] | None): Argument strings to parse. ``None`` (the
            default) makes argparse read ``sys.argv[1:]``, which is what a
            plain ``parse_args()`` call did before this parameter existed.

    Returns:
        argparse.Namespace: Namespace with ``dataset_path`` (required
        positional), ``tmp_dir`` and ``out_dir`` (both ``None`` when the
        option is not given).
    """
    parser = argparse.ArgumentParser(
        description='Convert CHASE_DB1 dataset to mmsegmentation format')
    parser.add_argument('dataset_path', help='path of CHASEDB1.zip')
    parser.add_argument('--tmp_dir', help='path of the temporary directory')
    parser.add_argument('-o', '--out_dir', help='output path')
    return parser.parse_args(argv)
def _convert_split(tmp_dir, out_dir, img_names, split):
    """Convert the extracted files of one split into PNGs under ``out_dir``.

    Files ending in ``.jpg`` are re-written as PNG into ``images/<split>``;
    every other file is treated as an annotation image and written to
    ``annotations/<split>``.

    Args:
        tmp_dir (str): Directory that holds the extracted archive files.
        out_dir (str): Root directory of the converted dataset.
        img_names (list[str]): File names, relative to ``tmp_dir``.
        split (str): Split sub-directory name (``'training'`` or
            ``'validation'``).
    """
    for img_name in img_names:
        img = mmcv.imread(osp.join(tmp_dir, img_name))
        stem, ext = osp.splitext(img_name)
        if ext == '.jpg':
            mmcv.imwrite(img,
                         osp.join(out_dir, 'images', split, stem + '.png'))
        else:
            # The annotation img should be divided by 128, because some of
            # the annotation imgs are not standard. We should set a
            # threshold to convert the nonstandard annotation imgs. The
            # value divided by 128 is equivalent to '1 if value >= 128
            # else 0'
            mmcv.imwrite(
                img[:, :, 0] // 128,
                osp.join(out_dir, 'annotations', split, stem + '.png'))


def main():
    """Convert ``CHASEDB1.zip`` into the images/annotations directory layout.

    Creates ``images/{training,validation}`` and
    ``annotations/{training,validation}`` below the output directory
    (``data/CHASE_DB1`` unless ``--out_dir`` is given), extracts the archive
    into a temporary directory and writes every extracted file as a PNG. The
    first ``TRAINING_LEN`` entries of the name-sorted listing form the
    training split; the rest form the validation split.

    Raises:
        AssertionError: If the extracted archive does not contain exactly
            ``CHASE_DB1_LEN`` entries.
    """
    args = parse_args()
    dataset_path = args.dataset_path
    if args.out_dir is None:
        out_dir = osp.join('data', 'CHASE_DB1')
    else:
        out_dir = args.out_dir

    print('Making directories...')
    mkdir_or_exist(out_dir)
    for kind in ('images', 'annotations'):
        mkdir_or_exist(osp.join(out_dir, kind))
        for split in ('training', 'validation'):
            mkdir_or_exist(osp.join(out_dir, kind, split))

    with tempfile.TemporaryDirectory(dir=args.tmp_dir) as tmp_dir:
        print('Extracting CHASEDB1.zip...')
        # Context manager so the archive handle is closed even when
        # extraction fails.
        with zipfile.ZipFile(dataset_path) as zip_file:
            zip_file.extractall(tmp_dir)

        print('Generating training dataset...')

        # List and sort once; both splits are slices of the same ordering.
        img_names = sorted(os.listdir(tmp_dir))
        # Raised explicitly (rather than via ``assert``) so the check still
        # runs under ``python -O``; exception type and message are unchanged.
        if len(img_names) != CHASE_DB1_LEN:
            raise AssertionError(
                f'len(os.listdir(tmp_dir)) != {CHASE_DB1_LEN}')

        _convert_split(tmp_dir, out_dir, img_names[:TRAINING_LEN],
                       'training')
        _convert_split(tmp_dir, out_dir, img_names[TRAINING_LEN:],
                       'validation')

        # The temporary directory is deleted when the ``with`` block exits.
        print('Removing the temporary files...')

    print('Done!')
# Run the conversion only when executed as a script, not on import.
if __name__ == '__main__':
    main()