-
Notifications
You must be signed in to change notification settings - Fork 71
/
Copy pathinference_memory_bank.py
86 lines (64 loc) · 2.33 KB
/
inference_memory_bank.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
import math
import torch
def softmax_w_top(x, top):
values, indices = torch.topk(x, k=top, dim=1)
x_exp = values.exp_()
x_exp /= torch.sum(x_exp, dim=1, keepdim=True)
# The types should be the same already
# some people report an error here so an additional guard is added
x.zero_().scatter_(1, indices, x_exp.type(x.dtype)) # B * THW * HW
return x
class MemoryBank:
def __init__(self, k, top_k=20):
self.top_k = top_k
self.CK = None
self.CV = None
self.mem_k = None
self.mem_v = None
self.num_objects = k
def _global_matching(self, mk, qk):
# NE means number of elements -- typically T*H*W
B, CK, NE = mk.shape
# See supplementary material
a_sq = mk.pow(2).sum(1).unsqueeze(2)
ab = mk.transpose(1, 2) @ qk
affinity = (2*ab-a_sq) / math.sqrt(CK) # B, NE, HW
affinity = softmax_w_top(affinity, top=self.top_k) # B, NE, HW
return affinity
def _readout(self, affinity, mv):
return torch.bmm(mv, affinity)
def match_memory(self, qk):
k = self.num_objects
_, _, h, w = qk.shape
qk = qk.flatten(start_dim=2)
if self.temp_k is not None:
mk = torch.cat([self.mem_k, self.temp_k], 2)
mv = torch.cat([self.mem_v, self.temp_v], 2)
else:
mk = self.mem_k
mv = self.mem_v
affinity = self._global_matching(mk, qk)
# One affinity for all
readout_mem = self._readout(affinity.expand(k,-1,-1), mv)
return readout_mem.view(k, self.CV, h, w)
def add_memory(self, key, value, is_temp=False):
# Temp is for "last frame"
# Not always used
# But can always be flushed
self.temp_k = None
self.temp_v = None
key = key.flatten(start_dim=2)
value = value.flatten(start_dim=2)
if self.mem_k is None:
# First frame, just shove it in
self.mem_k = key
self.mem_v = value
self.CK = key.shape[1]
self.CV = value.shape[1]
else:
if is_temp:
self.temp_k = key
self.temp_v = value
else:
self.mem_k = torch.cat([self.mem_k, key], 2)
self.mem_v = torch.cat([self.mem_v, value], 2)