Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
Tetragramm
GitHub Repository: Tetragramm/opencv
Path: blob/master/modules/dnn/test/pascal_semsegm_test_fcn.py
16356 views
1
from __future__ import print_function
2
from abc import ABCMeta, abstractmethod
3
import numpy as np
4
import sys
5
import argparse
6
import time
7
8
from imagenet_cls_test_alexnet import CaffeModel, DnnCaffeModel
9
try:
10
import cv2 as cv
11
except ImportError:
12
raise ImportError('Can\'t find OpenCV Python module. If you\'ve built it from sources without installation, '
13
'configure environment variable PYTHONPATH to "opencv_build_dir/lib" directory (with "python3" subdirectory if required)')
14
15
16
def get_metrics(conf_mat):
17
pix_accuracy = np.trace(conf_mat) / np.sum(conf_mat)
18
t = np.sum(conf_mat, 1)
19
num_cl = np.count_nonzero(t)
20
assert num_cl
21
mean_accuracy = np.sum(np.nan_to_num(np.divide(np.diagonal(conf_mat), t))) / num_cl
22
col_sum = np.sum(conf_mat, 0)
23
mean_iou = np.sum(
24
np.nan_to_num(np.divide(np.diagonal(conf_mat), (t + col_sum - np.diagonal(conf_mat))))) / num_cl
25
return pix_accuracy, mean_accuracy, mean_iou
26
27
28
def eval_segm_result(net_out):
29
assert type(net_out) is np.ndarray
30
assert len(net_out.shape) == 4
31
32
channels_dim = 1
33
y_dim = channels_dim + 1
34
x_dim = y_dim + 1
35
res = np.zeros(net_out.shape).astype(np.int)
36
for i in range(net_out.shape[y_dim]):
37
for j in range(net_out.shape[x_dim]):
38
max_ch = np.argmax(net_out[..., i, j])
39
res[0, max_ch, i, j] = 1
40
return res
41
42
43
def get_conf_mat(gt, prob):
44
assert type(gt) is np.ndarray
45
assert type(prob) is np.ndarray
46
47
conf_mat = np.zeros((gt.shape[0], gt.shape[0]))
48
for ch_gt in range(conf_mat.shape[0]):
49
gt_channel = gt[ch_gt, ...]
50
for ch_pr in range(conf_mat.shape[1]):
51
prob_channel = prob[ch_pr, ...]
52
conf_mat[ch_gt][ch_pr] = np.count_nonzero(np.multiply(gt_channel, prob_channel))
53
return conf_mat
54
55
56
class MeanChannelsPreproc:
57
def __init__(self):
58
pass
59
60
@staticmethod
61
def process(img):
62
image_data = np.array(img).transpose(2, 0, 1).astype(np.float32)
63
mean = np.ones(image_data.shape)
64
mean[0] *= 104
65
mean[1] *= 117
66
mean[2] *= 123
67
image_data -= mean
68
image_data = np.expand_dims(image_data, 0)
69
return image_data
70
71
72
class DatasetImageFetch(object):
73
__metaclass__ = ABCMeta
74
data_prepoc = object
75
76
@abstractmethod
77
def __iter__(self):
78
pass
79
80
@abstractmethod
81
def next(self):
82
pass
83
84
@staticmethod
85
def pix_to_c(pix):
86
return pix[0] * 256 * 256 + pix[1] * 256 + pix[2]
87
88
@staticmethod
89
def color_to_gt(color_img, colors):
90
num_classes = len(colors)
91
gt = np.zeros((num_classes, color_img.shape[0], color_img.shape[1])).astype(np.int)
92
for img_y in range(color_img.shape[0]):
93
for img_x in range(color_img.shape[1]):
94
c = DatasetImageFetch.pix_to_c(color_img[img_y][img_x])
95
if c in colors:
96
cls = colors.index(c)
97
gt[cls][img_y][img_x] = 1
98
return gt
99
100
101
class PASCALDataFetch(DatasetImageFetch):
102
img_dir = ''
103
segm_dir = ''
104
names = []
105
colors = []
106
i = 0
107
108
def __init__(self, img_dir, segm_dir, names_file, segm_cls_colors_file, preproc):
109
self.img_dir = img_dir
110
self.segm_dir = segm_dir
111
self.colors = self.read_colors(segm_cls_colors_file)
112
self.data_prepoc = preproc
113
self.i = 0
114
115
with open(names_file) as f:
116
for l in f.readlines():
117
self.names.append(l.rstrip())
118
119
@staticmethod
120
def read_colors(img_classes_file):
121
result = []
122
with open(img_classes_file) as f:
123
for l in f.readlines():
124
color = np.array(map(int, l.split()[1:]))
125
result.append(DatasetImageFetch.pix_to_c(color))
126
return result
127
128
def __iter__(self):
129
return self
130
131
def next(self):
132
if self.i < len(self.names):
133
name = self.names[self.i]
134
self.i += 1
135
segm_file = self.segm_dir + name + ".png"
136
img_file = self.img_dir + name + ".jpg"
137
gt = self.color_to_gt(cv.imread(segm_file, cv.IMREAD_COLOR)[:, :, ::-1], self.colors)
138
img = self.data_prepoc.process(cv.imread(img_file, cv.IMREAD_COLOR)[:, :, ::-1])
139
return img, gt
140
else:
141
self.i = 0
142
raise StopIteration
143
144
def get_num_classes(self):
145
return len(self.colors)
146
147
148
class SemSegmEvaluation:
149
log = sys.stdout
150
151
def __init__(self, log_path,):
152
self.log = open(log_path, 'w')
153
154
def process(self, frameworks, data_fetcher):
155
samples_handled = 0
156
157
conf_mats = [np.zeros((data_fetcher.get_num_classes(), data_fetcher.get_num_classes())) for i in range(len(frameworks))]
158
blobs_l1_diff = [0] * len(frameworks)
159
blobs_l1_diff_count = [0] * len(frameworks)
160
blobs_l_inf_diff = [sys.float_info.min] * len(frameworks)
161
inference_time = [0.0] * len(frameworks)
162
163
for in_blob, gt in data_fetcher:
164
frameworks_out = []
165
samples_handled += 1
166
for i in range(len(frameworks)):
167
start = time.time()
168
out = frameworks[i].get_output(in_blob)
169
end = time.time()
170
segm = eval_segm_result(out)
171
conf_mats[i] += get_conf_mat(gt, segm[0])
172
frameworks_out.append(out)
173
inference_time[i] += end - start
174
175
pix_acc, mean_acc, miou = get_metrics(conf_mats[i])
176
177
name = frameworks[i].get_name()
178
print(samples_handled, 'Pixel accuracy, %s:' % name, 100 * pix_acc, file=self.log)
179
print(samples_handled, 'Mean accuracy, %s:' % name, 100 * mean_acc, file=self.log)
180
print(samples_handled, 'Mean IOU, %s:' % name, 100 * miou, file=self.log)
181
print("Inference time, ms ", \
182
frameworks[i].get_name(), inference_time[i] / samples_handled * 1000, file=self.log)
183
184
for i in range(1, len(frameworks)):
185
log_str = frameworks[0].get_name() + " vs " + frameworks[i].get_name() + ':'
186
diff = np.abs(frameworks_out[0] - frameworks_out[i])
187
l1_diff = np.sum(diff) / diff.size
188
print(samples_handled, "L1 difference", log_str, l1_diff, file=self.log)
189
blobs_l1_diff[i] += l1_diff
190
blobs_l1_diff_count[i] += 1
191
if np.max(diff) > blobs_l_inf_diff[i]:
192
blobs_l_inf_diff[i] = np.max(diff)
193
print(samples_handled, "L_INF difference", log_str, blobs_l_inf_diff[i], file=self.log)
194
195
self.log.flush()
196
197
for i in range(1, len(blobs_l1_diff)):
198
log_str = frameworks[0].get_name() + " vs " + frameworks[i].get_name() + ':'
199
print('Final l1 diff', log_str, blobs_l1_diff[i] / blobs_l1_diff_count[i], file=self.log)
200
201
if __name__ == "__main__":
202
parser = argparse.ArgumentParser()
203
parser.add_argument("--imgs_dir", help="path to PASCAL VOC 2012 images dir, data/VOC2012/JPEGImages")
204
parser.add_argument("--segm_dir", help="path to PASCAL VOC 2012 segmentation dir, data/VOC2012/SegmentationClass/")
205
parser.add_argument("--val_names", help="path to file with validation set image names, download it here: "
206
"https://github.com/shelhamer/fcn.berkeleyvision.org/blob/master/data/pascal/seg11valid.txt")
207
parser.add_argument("--cls_file", help="path to file with colors for classes, download it here: "
208
"https://github.com/opencv/opencv/blob/master/samples/data/dnn/pascal-classes.txt")
209
parser.add_argument("--prototxt", help="path to caffe prototxt, download it here: "
210
"https://github.com/opencv/opencv/blob/master/samples/data/dnn/fcn8s-heavy-pascal.prototxt")
211
parser.add_argument("--caffemodel", help="path to caffemodel file, download it here: "
212
"http://dl.caffe.berkeleyvision.org/fcn8s-heavy-pascal.caffemodel")
213
parser.add_argument("--log", help="path to logging file")
214
parser.add_argument("--in_blob", help="name for input blob", default='data')
215
parser.add_argument("--out_blob", help="name for output blob", default='score')
216
args = parser.parse_args()
217
218
prep = MeanChannelsPreproc()
219
df = PASCALDataFetch(args.imgs_dir, args.segm_dir, args.val_names, args.cls_file, prep)
220
221
fw = [CaffeModel(args.prototxt, args.caffemodel, args.in_blob, args.out_blob, True),
222
DnnCaffeModel(args.prototxt, args.caffemodel, '', args.out_blob)]
223
224
segm_eval = SemSegmEvaluation(args.log)
225
segm_eval.process(fw, df)
226
227