-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathdata.py
91 lines (78 loc) · 3.1 KB
/
data.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
from __future__ import print_function
import argparse
import cv2
import lmdb
import numpy
import os
from os.path import exists, join
__author__ = 'Fisher Yu'
__email__ = 'fy@cs.princeton.edu'
__license__ = 'MIT'
def view(db_path):
    """Show every image stored in an LMDB database, one at a time.

    Each record's value is decoded as an encoded image and displayed in an
    OpenCV window named 'LSUN'. After each image the function blocks until
    a key is pressed: ESC stops the viewer, any other key moves on to the
    next record. Records whose bytes cannot be decoded are reported and
    skipped.

    Args:
        db_path: Path of the LMDB database, opened read-only.
    """
    print('Viewing', db_path)
    print('Press ESC to exit or SPACE to advance.')
    window_name = 'LSUN'
    env = lmdb.open(db_path, map_size=1099511627776,
                    max_readers=100, readonly=True)
    cv2.namedWindow(window_name)
    try:
        with env.begin(write=False) as txn:
            for key, val in txn.cursor():
                print('Current key:', key)
                # frombuffer wraps the record bytes without copying them;
                # flag 1 asks imdecode for a 3-channel color image.
                img = cv2.imdecode(
                    numpy.frombuffer(val, dtype=numpy.uint8), 1)
                if img is None:
                    # imdecode yields None for bytes it cannot decode, and
                    # imshow would raise if handed that None.
                    print('Skipping undecodable image:', key)
                    continue
                cv2.imshow(window_name, img)
                # Keep only the low byte: some builds set extra bits above
                # it, which would hide the ESC code (27).
                if cv2.waitKey() & 0xFF == 27:
                    break
    finally:
        # Release the environment and the window even when decoding or
        # display fails part-way through.
        env.close()
        cv2.destroyWindow(window_name)
def export_images(db_path, out_dir, flat=False, limit=-1):
    """Write every image stored in an LMDB database to its own file.

    Each record's value is written verbatim to ``<key>.webp``. Unless
    ``flat`` is set, files are grouped into nested sub-directories named
    after the first six characters of the key, one character per level.
    Progress is printed after every 1000 images.

    Args:
        db_path: Path of the LMDB database, opened read-only.
        out_dir: Directory that receives the exported files. An empty
            string makes the output paths relative to the current working
            directory.
        flat: If true, write all files directly into ``out_dir``.
        limit: Stop once this many images have been written. Values below
            1 never match the running count, so every image is exported.
    """
    print('Exporting', db_path, 'to', out_dir)
    env = lmdb.open(db_path, map_size=1099511627776,
                    max_readers=100, readonly=True)
    count = 0
    try:
        with env.begin(write=False) as txn:
            for key, val in txn.cursor():
                # latin-1 maps every byte to exactly one character, so any
                # key decodes without raising.
                key_str = key.decode('latin-1')
                if flat:
                    image_out_dir = out_dir
                else:
                    image_out_dir = join(out_dir, '/'.join(key_str[:6]))
                # An empty directory name means "current directory", which
                # already exists; os.makedirs('') would raise instead.
                if image_out_dir and not exists(image_out_dir):
                    os.makedirs(image_out_dir)
                image_out_path = join(image_out_dir, key_str + '.webp')
                with open(image_out_path, 'wb') as fp:
                    fp.write(val)
                count += 1
                if count == limit:
                    break
                if count % 1000 == 0:
                    print('Finished', count, 'images')
    finally:
        # Close the environment even when writing a file fails.
        env.close()
def main():
    """Parse the command line and run the chosen command on each database.

    The first positional argument selects the command ('view' or 'export')
    and every following positional argument is an LMDB database path. The
    command is applied to the paths in the order given. If no command is
    supplied, the parser reports a usage error and exits instead of
    silently doing nothing.
    """
    parser = argparse.ArgumentParser()
    parser.add_argument('command', nargs='?', type=str,
                        choices=['view', 'export'],
                        help='view: view the images in the lmdb database '
                             'interactively.\n'
                             'export: Export the images in the lmdb databases '
                             'to a folder. The images are grouped in subfolders'
                             ' determined by the prefix of image key.')
    parser.add_argument('lmdb_path', nargs='+', type=str,
                        help='The path to the lmdb database folder. '
                             'Support multiple database paths.')
    parser.add_argument('--out_dir', type=str, default='',
                        help='Folder that receives the images written by '
                             'the export command.')
    parser.add_argument('--flat', action='store_true',
                        help='If enabled, the images are exported into output '
                             'directory directly instead of hierarchical '
                             'directories.')
    args = parser.parse_args()

    command = args.command
    if command is None:
        # 'command' is declared optional (nargs='?'), so a lone path is
        # parsed as lmdb_path and command stays None; report it rather
        # than falling through the loop without doing any work.
        parser.error('a command is required: choose "view" or "export"')

    for lmdb_path in args.lmdb_path:
        if command == 'view':
            view(lmdb_path)
        elif command == 'export':
            export_images(lmdb_path, args.out_dir, args.flat)


# Run the command-line interface only when executed as a script.
if __name__ == '__main__':
    main()