forked from palver7/CFLPytorch
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathoffsetcalculator.py
211 lines (174 loc) · 8.45 KB
/
offsetcalculator.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
import math
import torch
import argparse
from torch import nn, Tensor
from torch.nn import init
from torch.nn.parameter import Parameter
from torch.nn.modules.utils import _pair
from torch.jit.annotations import Optional, Tuple
#from torchvision.ops.deform_conv import deform_conv2d
import time
def offcalc(batchsize=4, paramlist=None):
    """Precompute distortion-aware sampling offsets for equirectangular convolutions.

    Implements the offset computation for the Equirectangular Convolution
    described in "Corners for Layout: End to End Layout Recovery from 360
    Images". For every requested (feature-map size, kernel size, stride)
    combination, each kernel tap is projected onto the sphere at every visited
    pixel and the displacement from its regular grid position is stored.

    Arguments:
        batchsize (int): number of times each offset map is repeated along the
            leading (batch) dimension. Default: 4
        paramlist (iterable, optional): configurations to compute, each a
            hashable triple ``((pano_H, pano_W), (k_H, k_W), (stride_h, stride_w))``.
            Default: None, meaning the built-in list of 16 configurations.

    Returns:
        (layerdict, offsetdict):
            layerdict (dict): maps a layer index (0..26) to the configuration
                triple that layer uses. It is a fixed table and does not depend
                on ``paramlist``; with a custom ``paramlist`` it may name
                configurations that are absent from ``offsetdict``.
            offsetdict (dict): maps each configuration triple to a float CPU
                tensor of shape ``[batchsize, 2 * k_H * k_W, pano_H, pano_W]``.
                Channels are interleaved ``(dy, dx)`` pairs, one pair per kernel
                tap in row-major order. Pixels skipped by the stride keep a
                zero offset.

    NOTE(review): the layout looks like the ``offset`` argument of
    torchvision's ``deform_conv2d`` -- confirm against the consumer.

    Examples::
        >>> cfg = ((4, 8), (3, 3), (1, 1))
        >>> layerdict, offsetdict = offcalc(batchsize=2, paramlist=[cfg])
        >>> print(offsetdict[cfg].shape)
        >>> # returns
        >>>  torch.Size([2, 18, 4, 8])
    """

    def rotation_matrix(axis, theta):
        """ code by cfernandez and jmfacil

        Return the rotation matrix associated with counterclockwise rotation about
        the given axis by theta radians.
        """
        axis = torch.as_tensor(axis, device='cpu', dtype=torch.float)
        axis = axis / math.sqrt(torch.dot(axis, axis))
        # Euler-Rodrigues parameters of the rotation.
        a = math.cos(theta / 2.0)
        b, c, d = -axis * math.sin(theta / 2.0)
        aa, bb, cc, dd = a * a, b * b, c * c, d * d
        bc, ad, ac, ab, bd, cd = b * c, a * d, a * c, a * b, b * d, c * d
        return torch.tensor(
            [[aa + bb - cc - dd, 2 * (bc + ad), 2 * (bd - ac)],
             [2 * (bc - ad), aa + cc - bb - dd, 2 * (cd + ab)],
             [2 * (bd + ac), 2 * (cd - ab), aa + dd - bb - cc]],
            device='cpu', dtype=torch.float)

    def kernel_rays(pano_W, k_W, k_H):
        """Build the kernel grid and its unit viewing rays (pixel-independent).

        Returns ``(h_grid, w_grid, rays)``: the centred row/column coordinates
        of every kernel tap, each of shape ``[k_H, k_W]``, and the normalised
        rays through those taps, of shape ``[3, k_H * k_W]``, before any
        rotation is applied.
        """
        # The kernel is treated as a small pinhole camera whose horizontal
        # field of view spans k_W pixels of the panorama.
        fov_w = k_W * math.radians(360. / float(pano_W))
        focal = (float(k_W) / 2) / math.tan(fov_w / 2)
        c_x = 0
        c_y = 0
        h_centered = torch.arange(k_H, device='cpu', dtype=torch.float) + 0.5 - float(k_H) / 2
        w_centered = torch.arange(k_W, device='cpu', dtype=torch.float) + 0.5 - float(k_W) / 2
        h_grid = h_centered.unsqueeze(1).expand(k_H, k_W)
        w_grid = w_centered.unsqueeze(0).expand(k_H, k_W)
        K = torch.tensor([[focal, 0, c_x], [0, focal, c_y], [0., 0., 1.]],
                         device='cpu', dtype=torch.float)
        inv_K = torch.inverse(K)
        rays = torch.stack(
            [w_grid, h_grid, torch.ones(k_H, k_W, device='cpu', dtype=torch.float)], 0)
        rays = torch.matmul(inv_K, rays.reshape(3, k_H * k_W))
        rays /= torch.norm(rays, dim=0, keepdim=True)
        return h_grid, w_grid, rays

    def equi_coord(pano_W, pano_H, u, v, h_grid, w_grid, rays):
        """ code by cfernandez and jmfacil

        Return ``(offsets_x, offsets_y)``, each of shape ``[k_H, k_W]``: the
        displacement of every kernel tap from its regular grid position when
        the kernel is centred on panorama pixel ``(u, v)``.
        """
        k_H, k_W = h_grid.shape
        u_r, v_r = u - float(pano_W) / 2., v - float(pano_H) / 2.
        # Longitude / latitude of the pixel the kernel is centred on.
        phi, theta = u_r / (pano_W) * (math.pi) * 2, -v_r / (pano_H) * (math.pi)
        ROT = rotation_matrix((0, 1, 0), phi)
        ROT = torch.matmul(ROT, rotation_matrix((1, 0, 0), theta))
        # matmul allocates a new tensor, so the shared `rays` is never mutated.
        rotated = torch.matmul(ROT, rays).reshape(3, k_H, k_W)
        ray_phi = torch.atan2(rotated[0, ...], rotated[2, ...])
        ray_theta = torch.asin(torch.clamp(rotated[1, ...], -1, 1))
        # Back from spherical angles to equirectangular pixel coordinates.
        x = (pano_W) / (2. * math.pi) * ray_phi + float(pano_W) / 2.
        y = (pano_H) / (math.pi) * ray_theta + float(pano_H) / 2.
        # Where a regular (undistorted) kernel would have sampled.
        roi_y = h_grid + v_r + float(pano_H) / 2.
        roi_x = w_grid + u_r + float(pano_W) / 2.
        return x - roi_x, y - roi_y

    def distortion_aware_map(pano_W, pano_H, k_W, k_H, s_width=1, s_height=1, bs=16):
        """ code by cfernandez and jmfacil

        Return the ``[bs, 2 * k_H * k_W, pano_H, pano_W]`` offset tensor for
        one configuration. Only pixels on the stride grid are filled.
        """
        # The kernel rays do not depend on the pixel, so build them once here
        # instead of once per (u, v).
        h_grid, w_grid, rays = kernel_rays(pano_W, k_W, k_H)
        offset = torch.zeros(2 * k_H * k_W, pano_H, pano_W, device='cpu', dtype=torch.float)
        for v in range(0, pano_H, s_height):
            for u in range(0, pano_W, s_width):
                offsets_x, offsets_y = equi_coord(pano_W, pano_H, u, v, h_grid, w_grid, rays)
                # Interleave as (dy, dx) per kernel tap, row-major over taps.
                offset[:, v, u] = torch.stack((offsets_y, offsets_x), dim=-1).flatten()
        offset = offset.unsqueeze(0).repeat(bs, 1, 1, 1)
        offset.requires_grad_(False)
        return offset

    # Layer index -> ((pano_H, pano_W), (k_H, k_W), (stride_h, stride_w)).
    layerdict = {0: ((64, 128), (3, 3), (2, 2)),
                 1: ((64, 128), (3, 3), (1, 1)),
                 2: ((32, 64), (3, 3), (2, 2)),
                 3: ((32, 64), (3, 3), (1, 1)),
                 4: ((16, 32), (5, 5), (2, 2)),
                 5: ((16, 32), (5, 5), (1, 1)),
                 6: ((8, 16), (3, 3), (2, 2)),
                 7: ((8, 16), (3, 3), (1, 1)),
                 8: ((8, 16), (3, 3), (1, 1)),
                 9: ((8, 16), (5, 5), (1, 1)),
                 10: ((8, 16), (5, 5), (1, 1)),
                 11: ((8, 16), (5, 5), (1, 1)),
                 12: ((4, 8), (5, 5), (2, 2)),
                 13: ((4, 8), (5, 5), (1, 1)),
                 14: ((4, 8), (5, 5), (1, 1)),
                 15: ((4, 8), (5, 5), (1, 1)),
                 16: ((4, 8), (3, 3), (1, 1)),
                 17: ((4, 8), (1, 1), (1, 1)),
                 18: ((4, 8), (3, 3), (1, 1)),
                 19: ((8, 16), (3, 3), (1, 1)),
                 20: ((16, 32), (3, 3), (1, 1)),
                 21: ((16, 32), (3, 3), (1, 1)),
                 22: ((32, 64), (3, 3), (1, 1)),
                 23: ((32, 64), (5, 5), (1, 1)),
                 24: ((64, 128), (3, 3), (1, 1)),
                 25: ((64, 128), (5, 5), (1, 1)),
                 26: ((64, 128), (3, 3), (1, 1)),
                 }
    if paramlist is None:
        # Built-in list of configurations to precompute.
        paramlist = [((64, 128), (5, 5), (1, 1)),
                     ((64, 128), (3, 3), (2, 2)),
                     ((64, 128), (3, 3), (1, 1)),
                     ((32, 64), (5, 5), (1, 1)),
                     ((32, 64), (3, 3), (2, 2)),
                     ((32, 64), (3, 3), (1, 1)),
                     ((16, 32), (5, 5), (2, 2)),
                     ((16, 32), (5, 5), (1, 1)),
                     ((16, 32), (3, 3), (1, 1)),
                     ((8, 16), (3, 3), (2, 2)),
                     ((8, 16), (3, 3), (1, 1)),
                     ((8, 16), (5, 5), (1, 1)),
                     ((4, 8), (5, 5), (2, 2)),
                     ((4, 8), (5, 5), (1, 1)),
                     ((4, 8), (3, 3), (1, 1)),
                     ((4, 8), (1, 1), (1, 1))]
    offsetdict = {}
    for key in paramlist:
        (pano_H, pano_W), (k_H, k_W), (stride_h, stride_w) = key
        offsetdict[key] = distortion_aware_map(
            pano_W, pano_H, k_W, k_H,
            s_width=stride_w, s_height=stride_h, bs=batchsize)
    return layerdict, offsetdict
if __name__ == '__main__':
    # Script entry point: compute the layer and offset tables for the
    # requested batch size and write each to its own file in the current
    # directory, with the --mode value embedded in the file name.
    cli = argparse.ArgumentParser()
    cli.add_argument(
        '--batchsize', type=int, default=4, metavar='B',
        help='size of minibatches (default: 4)',
    )
    cli.add_argument(
        '--mode', type=str, default='train', metavar='M',
        help='append to the saved dict file either train or test (default: train)',
    )
    options = cli.parse_args()

    layer_table, offset_table = offcalc(batchsize=options.batchsize)
    layer_path = './layer{}.pt'.format(options.mode)
    offset_path = './offset{}.pt'.format(options.mode)
    torch.save(layer_table, layer_path)
    torch.save(offset_table, offset_path)