-
Notifications
You must be signed in to change notification settings - Fork 46
/
Copy pathfuse_validate_data.py
205 lines (163 loc) · 7.15 KB
/
fuse_validate_data.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
"""
Class for managing our data.
"""
import csv
import numpy as np
import os.path
import random
import threading
from keras.utils import to_categorical
import cv2
class DataSet():
def __init__(self, class_limit=None, image_shape=(224, 224), original_image_shape=(341, 256), n_snip=5, opt_flow_len=10, batch_size=16):
"""Constructor.
opt_flow_len = (int) the number of optical flow frames to consider
class_limit = (int) number of classes to limit the data to.
None = no limit.
"""
self.class_limit = class_limit
self.image_shape = image_shape
self.original_image_shape = original_image_shape
self.n_snip = n_snip
self.opt_flow_len = opt_flow_len
self.batch_size = batch_size
self.static_frame_path = os.path.join('/data/test')
self.opt_flow_path = os.path.join('/data', 'opt_flow')
# Get the data.
self.data_list = self.get_data_list()
# Get the classes.
self.classes = self.get_classes()
# Now do some minor data cleaning
self.data_list = self.clean_data_list()
# Get the right dataset for the generator.
train, test = self.split_train_test()
self.data_list = test
# number of batches in 1 epoch
self.n_batch = len(self.data_list) // self.batch_size
@staticmethod
def get_data_list():
"""Load our data list from file."""
with open(os.path.join('/data', 'data_list.csv'), 'r') as fin:
reader = csv.reader(fin)
data_list = list(reader)
return data_list
def clean_data_list(self):
data_list_clean = []
for item in self.data_list:
if item[1] in self.classes:
data_list_clean.append(item)
return data_list_clean
def get_classes(self):
"""Extract the classes from our data, '\n'. If we want to limit them,
only return the classes we need."""
classes = []
for item in self.data_list:
if item[1] not in classes:
classes.append(item[1])
# Sort them.
classes = sorted(classes)
# Return.
if self.class_limit is not None:
return classes[:self.class_limit]
else:
return classes
def get_class_one_hot(self, class_str):
"""Given a class as a string, return its number in the classes
list. This lets us encode and one-hot it for training."""
# Encode it first.
label_encoded = self.classes.index(class_str)
# Now one-hot it.
label_hot = to_categorical(label_encoded, len(self.classes))
assert label_hot.shape[0] == len(self.classes)
return label_hot
def split_train_test(self):
"""Split the data into train and test groups."""
train = []
test = []
for item in self.data_list:
if item[0] == 'train':
train.append(item)
else:
test.append(item)
return train, test
def validation_generator(self):
"""Return a generator of optical frame stacks that we can use to test."""
print("\nCreating validation generator with %d samples.\n" % len(self.data_list))
idx = 0
while 1:
idx += 1
idx = idx % self.n_batch
print("\nGenerating batch number {0}/{1} ...".format(idx, self.n_batch))
X_spatial_batch = []
X_temporal_batch = []
y_batch = []
# Get a list of batch-size samples.
batch_list = self.data_list[idx * self.batch_size: (idx + 1) * self.batch_size]
for row in batch_list:
# Get the stacked optical flows from disk.
X_spatial, X_temporal = self.get_static_frame_and_stacked_opt_flows(row)
# Get the corresponding labels
y = self.get_class_one_hot(row[1])
y = np.array(y)
y = np.squeeze(y)
X_spatial_batch.append(X_spatial)
X_temporal_batch.append(X_temporal)
y_batch.append(y)
X_batch = [np.array(X_spatial_batch), np.array(X_temporal_batch)]
y_batch = np.array(y_batch)
yield X_batch, y_batch
def get_static_frame_and_stacked_opt_flows(self, row):
static_frames = []
opt_flow_stacks = []
static_frame_dir = os.path.join(self.static_frame_path, row[1], row[2])
opt_flow_dir_x = os.path.join(self.opt_flow_path, 'u', row[2])
opt_flow_dir_y = os.path.join(self.opt_flow_path, 'v', row[2])
# spatial parameters (crop at center for validation)
left = int((self.original_image_shape[0] - self.image_shape[0]) * 0.5)
top = int((self.original_image_shape[1] - self.image_shape[1]) * 0.5)
right = left + self.image_shape[0]
bottom = top + self.image_shape[1]
# temporal parameters
total_frames = len(os.listdir(opt_flow_dir_x))
if total_frames - self.opt_flow_len + 1 < self.n_snip:
loop = True
start_frame_window_len = 1
else:
loop = False
start_frame_window_len = (total_frames - self.opt_flow_len + 1) // self.n_snip # starting frame selection window length
# loop over snippets
for i_snip in range(self.n_snip):
if loop:
start_frame = i_snip % (total_frames - self.opt_flow_len + 1) + 1
else:
start_frame = int(0.5 * start_frame_window_len + 0.5) + start_frame_window_len * i_snip
# Get the static frame
static_frame = cv2.imread(static_frame_dir + '-%04d' % start_frame + '.jpg')
static_frame = static_frame / 255.0
static_frame = cv2.resize(static_frame, self.image_shape)
static_frames.append(static_frame)
# Get the optical flow stack
frames = range(start_frame, start_frame + self.opt_flow_len) # selected optical flow frames
opt_flow_stack = []
# loop over frames
for i_frame in frames:
# horizontal components
img = None # reset to be safe
img = cv2.imread(opt_flow_dir_x + '/frame' + "%06d"%i_frame + '.jpg', 0)
img = np.array(img)
img = img - np.mean(img) # mean substraction
img = img[top: bottom, left: right]
img = img / 255.0 # normalize pixels
opt_flow_stack.append(img)
# vertical components
img2 = None # reset to be safe
img2 = cv2.imread(opt_flow_dir_y + '/frame' + "%06d"%i_frame + '.jpg', 0)
img2 = np.array(img2)
img2 = img2 - np.mean(img2) # mean substraction
img2 = img2[top: bottom, left: right]
img2 = img2 / 255.0 # normalize pixels
opt_flow_stack.append(img2)
opt_flow_stack = np.array(opt_flow_stack)
opt_flow_stack = np.swapaxes(opt_flow_stack, 0, 2)
opt_flow_stacks.append(opt_flow_stack)
return np.array(static_frames), np.array(opt_flow_stacks)