in vision_charts/models.py [0:0]
def __init__(self, args):
    """Assemble the encoder's layer stack and a fixed 3x4 matrix.

    The layer stack is a flat ``nn.ModuleList`` of ``CNN_layer`` modules.
    Each of the ``args.num_img_blocks`` blocks starts with one layer built
    with ``stride=2`` that goes from the current size to the next size,
    followed by ``args.num_img_layers - 1`` layers that keep the size.
    Sizes start at 6 -> 16 and the target size doubles after every block.

    Args:
        args: Configuration object; this constructor reads
            ``num_img_blocks``, ``num_img_layers`` and ``size_img_ker``
            from it and stores it as ``self.args``.
    """
    super(Image_Encoder, self).__init__()

    # Sizes handed to CNN_layer as its first two arguments
    # (presumably input/output channel counts -- confirm against CNN_layer).
    in_size, out_size = 6, 16
    stack = []
    for _ in range(args.num_img_blocks):
        # Block opener: the only layer per block created with stride=2.
        stack.append(
            CNN_layer(in_size, out_size, args.size_img_ker, stride=2)
        )
        in_size, out_size = out_size, out_size * 2
        # NOTE(review): the same-size layers are taken to belong to each
        # block (nested loop); the reviewed text had lost its indentation,
        # so confirm this nesting against the repository version.
        stack.extend(
            CNN_layer(in_size, in_size, args.size_img_ker)
            for _ in range(args.num_img_layers - 1)
        )

    self.args = args
    self.layers = nn.ModuleList(stack)

    # Constant 3x3 and 3x4 matrices; their product is stored on the GPU.
    # Presumably camera intrinsics (K) and extrinsics (RT) forming a
    # projection matrix -- TODO confirm with the code that uses self.matrix.
    focal = 221.7025
    k_mat = np.array([[focal, 0, 128.], [0, focal, 128.], [0, 0, 1]])
    rt_mat = np.array([[-0.0000, -1.0000, 0.0000, -0.0000],
                       [-0.7071, 0.0000, -0.7071, 0.4243],
                       [0.7071, 0.0000, -0.7071, 1.1314]])
    # .cuda() is unconditional: constructing this module requires CUDA.
    self.matrix = torch.FloatTensor(np.dot(k_mat, rt_mat)).cuda()