-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmain.py
70 lines (55 loc) · 2.14 KB
/
main.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
import os
import shutil
from argparse import ArgumentParser
import numpy as np
from sklearn.cluster import KMeans
from keras.preprocessing import image
from extractor import XceptionExtractor, WHashExtractor
np.random.seed(0)
EXTENSTIONS = ['.png', '.jpg']
os.environ['TF_CPP_MIN_LOG_LEVEL'] = '3'
def target_list(input_dir):
targets = []
for root, dirs, files in os.walk(input_dir):
for fname in files:
_, file_extension = os.path.splitext(fname)
if not file_extension in EXTENSTIONS:
continue
targets.append(os.path.join(root, fname))
return targets
def sampling(vec, sampled_data_num):
kmeans = KMeans(n_clusters=sampled_data_num, random_state=0).fit(vec)
labels = kmeans.labels_
out = []
for ind in range(sampled_data_num):
out.extend(np.random.choice((np.where(labels == ind)[0]), 1))
return out
def argparser():
parser = ArgumentParser()
parser.add_argument("INPUT_DIR", help="input image directory")
parser.add_argument("OUTPUT_DIR", help="output image directory")
parser.add_argument("NUM_SAMPLE", type=int, help="number of sample")
parser.add_argument("--extractor", default="Xception",
choices=["Xception", "whash"],
help="choise of extractor")
args = parser.parse_args()
return args
def main():
args = argparser()
targets = target_list(args.INPUT_DIR)
images = [image.img_to_array(image.load_img(target, target_size=(299, 299)))
for target in targets]
images = np.array(images)
if args.extractor == "Xception":
extractor = XceptionExtractor()
elif args.extractor == "whash":
extractor = WHashExtractor()
feature_vectors = extractor.feature_extraction(images)
sampled_index = sampling(feature_vectors, args.NUM_SAMPLE)
output_targets = [targets[index] for index in sampled_index]
for output_target in output_targets:
basename = os.path.basename(output_target)
shutil.copy(output_target, os.path.join(args.OUTPUT_DIR, basename))
print('done.')
if __name__ == "__main__":
main()