-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathfeature_packager.py
87 lines (73 loc) · 3.9 KB
/
feature_packager.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
import glob
import os
import h5py
import numpy as np
from configs.preprocess_configs import (FEATURE_PACKAGE_ROOT,
GRID_FEATURE_ROOT_QUERY, GRID_FEATURE_ROOT_CLIP,
TEXT_FEATURE_ROOT_QUERY, TEXT_FEATURE_ROOT_CLIP)
def load_from_feature_package(group_handle):
feature_dict = dict()
vids = group_handle.keys()
for vid in vids:
feature_dict[vid] = dict()
sub_groups = group_handle[vid].keys()
for sub_group in sub_groups:
if '.jpg' in sub_group:
regions = group_handle[vid][sub_group].keys()
region_feature_list = [[] for r in regions]
for region in regions:
if region == 'image':
region_feature_list[0] = group_handle[vid][sub_group][region][0].squeeze()
elif region == 'bbox' or region == 'box':
region_feature_list[1] = group_handle[vid][sub_group][region][0].squeeze()
else:
bbox_idx = int(region[4:])
region_feature_list[bbox_idx] = group_handle[vid][sub_group][region][0].squeeze()
feature_dict[vid][sub_group] = np.array(region_feature_list)
else:
feature_dict[vid][sub_group] = dict()
datas = group_handle[vid][sub_group].keys()
for data in datas:
if data == 'img_alignment':
img_alignment_rows = group_handle[vid][sub_group][data].keys()
feature_dict[vid][sub_group][data] = [[] for i in img_alignment_rows]
for img_alignment_row in img_alignment_rows:
int(img_alignment_row)
feature_dict[vid][sub_group][data][int(img_alignment_row)] = \
group_handle[vid][sub_group][data][img_alignment_row][:].tolist()
elif data == 'token':
token_list = group_handle[vid][sub_group][data][:].tolist()
feature_dict[vid][sub_group][data] = [str(token)[2:-1] for token in token_list]
else:
if len(group_handle[vid][sub_group][data][:]) == 4:
feature_dict[vid][sub_group][data] = group_handle[vid][sub_group][data][:].squeeze()
else:
feature_dict[vid][sub_group][data] = group_handle[vid][sub_group][data][:]
return feature_dict
def copy_all_group(root, feature_group):
frame_grid_h5_list = glob.glob(os.path.join(root, '*.hdf5'))
for frame_grid_h5 in frame_grid_h5_list:
with h5py.File(frame_grid_h5, 'r') as sub_f:
vid = frame_grid_h5.split('/')[-1][:11]
feature_group.create_group(vid)
for key in sub_f.keys():
sub_f.copy(key, feature_group[vid])
def package_all_feature(save_path=FEATURE_PACKAGE_ROOT,
query_grid_root=GRID_FEATURE_ROOT_QUERY, frame_grid_root=GRID_FEATURE_ROOT_CLIP,
query_text_root=TEXT_FEATURE_ROOT_QUERY, subtitle_text_root=TEXT_FEATURE_ROOT_CLIP):
f = h5py.File(os.path.join(save_path, 'feature.hdf5'), 'w')
# query_grid_feature
query_grid_feature = f.create_group('query_grid_feature')
copy_all_group(query_grid_root, query_grid_feature)
# frame_grid_feature
frame_grid_feature = f.create_group('frame_grid_feature')
copy_all_group(frame_grid_root, frame_grid_feature)
# query_text_feature
query_text_feature = f.create_group('query_text_feature')
copy_all_group(query_text_root, query_text_feature)
# subtitle_text_feature
subtitle_text_feature = f.create_group('subtitle_text_feature')
copy_all_group(subtitle_text_root, subtitle_text_feature)
f.close()
if __name__ == '__main__':
package_all_feature()