spectral-lib/LearnableInterp2D.lua at master · mbhenaff/spectral-lib · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
-- General interpolation module. Images and weights are resized to be n^2 and k^2 respectively.
-- The interpolation map is a n^2 x k^2 matrix.
require 'nn'

local LearnableInterp2D, parent = torch.class('nn.LearnableInterp2D', 'nn.Module')

function LearnableInterp2D:__init(iH, iW, oH, oW, interpType)
   parent.__init(self)
   assert(iH == iW and oH == oW)
   self.iH = iH
   self.iW = iW
   self.oH = oH
   self.oW = oW
   self.interpType = interpType
   self.cntr = 0
   if self.interpType == 'spatial' then
      self.weight = torch.load('/misc/vlgscratch3/LecunGroup/mbhenaff/spectralnet/interp_kernels/spatial_kernel_' .. iH .. '_' .. oH .. '.th'):float()
   else
      self.weight = compute_interpolation_matrix(iH, oH, interpType)
   end
   self.gradWeight = torch.Tensor(self.weight:size()):zero()
   if false then
   self.mask = torch.Tensor(self.weight:size()):fill(1)
   for i = 1,self.weight:size(1) do
      for j = 1,self.weight:size(2) do
         if math.abs(self.weight[i][j]) < 1e-5 then
            self.mask[i][j] = 0
         end
      end
   end
else
   self.mask = compute_mask(iH, oH)
end
   self.originalKernel = self.weight:clone()
end

--[[
function LearnableInterp2D:reset()
   if self.interpType == 'spatial' then
      self.weight = torch.load('/misc/vlgscratch3/LecunGroup/mbhenaff/spectralnet/interp_kernels/spatial_kernel_' .. iH .. '_' .. oH .. '.th'):float()
   else
      self.weight = compute_interpolation_matrix(iH, oH, interpType)
   end
   self.gradWeight = torch.Tensor(self.weight:size()):zero()
   self.mask = torch.Tensor(self.weight:size()):fill(1)
   for i = 1,self.weight:size(1) do
      for j = 1,self.weight:size(2) do
         if math.abs(self.weight[i][j]) < 1e-5 then
            self.mask[i][j] = 0
         end
      end
   end
end
--]]


function LearnableInterp2D:updateOutput(input)

   self.cntr = self.cntr + 1
   -- rescale the weights to the right nuclear norm
   if self.cntr % 100 == 0 then
      local s = estimate_scaling(self.originalKernel, self.weight)
      print('rescaling, s = ' .. s)
      print(self.weight:norm())
      self.weight:mul(s)
      collectgarbage()
   end
   self.weight:cmul(self.mask)
   local d1 = input:size(1)
   local d2 = input:size(2)
   input:resize(d1*d2, self.iH*self.iW*2)
   self.output:resize(d1*d2, self.oH*self.oW*2)
   self.output:zero()
   self.output:addmm(input,self.weight)
   input:resize(d1,d2,self.iH,self.iW,2)
   self.output:resize(d1,d2,self.oH,self.oW,2)
   return self.output
end

function LearnableInterp2D:updateGradInput(input, gradOutput)
   self.weight:cmul(self.mask)
   local d1 = input:size(1)
   local d2 = input:size(2)
   gradOutput:resize(d1*d2, self.oH*self.oW*2)
   self.gradInput:resize(d1*d2, self.iH*self.iW*2)
   self.gradInput:zero()
   self.gradInput:addmm(gradOutput, self.weight:t())
   self.gradInput:resize(d1,d2,self.iH,self.iW,2)
   gradOutput:resize(d1,d2,self.oH,self.oW,2)
   return self.gradInput
end

function LearnableInterp2D:accGradParameters(input, gradOutput, scale)
   local scale = scale or 1
   local d1 = input:size(1)
   local d2 = input:size(2)
   gradOutput:resize(d1*d2, self.oH*self.oW*2)
   input:resize(d1*d2,self.iH*self.iW*2)
   self.gradWeight:zero()
   self.gradWeight:addmm(scale, input:t(), gradOutput)
   self.gradWeight:cmul(self.mask)
   input:resize(d1, d2, self.iH, self.iW, 2)
   gradOutput:resize(d1, d2, self.oH, self.oW, 2)
end

function compute_interpolation_matrix(k,n,interpType)
   local K = torch.FloatTensor(2*k^2, 2*n^2)
   local model = nn.ComplexInterp(k,k,n,n,interpType):float()
   local input = torch.FloatTensor(1,k,k,2)
   local cntr = 1
   for i = 1,k do
      for j = 1,k do
         for l = 1,2 do
            input:zero()
            input[1][i][j][l] = 1
            out = model:forward(input)
            K[{cntr,{}}]:copy(out:resize(2*n^2))
            cntr = cntr + 1
         end
      end
   end
   -- scale so it has similar norm to FFT matrix
   local FFTmat = interpKernel(k,n,'spatial2D')
   local scale = estimate_scaling(FFTmat, K)
   print('scaling factor: ' .. scale)
   K:mul(scale)
   return K,scale
end


function compute_mask(k,n)
   local K = torch.FloatTensor(2*k^2, 2*n^2)
   local model = nn.ComplexInterp(k,k,n,n,'bilinear'):float()
   model.kernelRows:fill(1)
   model.kernelCols:fill(1)
   local input = torch.FloatTensor(1,k,k,2)
   local cntr = 1
   for i = 1,k do
      for j = 1,k do
         for l = 1,2 do
            input:zero()
            input[1][i][j][l] = 1
            out = model:forward(input)
            K[{cntr,{}}]:copy(out:resize(2*n^2))
            cntr = cntr + 1
         end
      end
   end

   for i = 1,2*k^2 do
      for j = 1,2*n^2 do
         if math.abs(K[i][j]) < 1e-5 then
            K[i][j] = 0
         else
            K[i][j] = 1
         end
      end
   end
   return K
end


-- estimate a scaling factor for matrix M2 so that it has a similar matrix norm as M1
function estimate_scaling(M1, M2, npts)
   local npts = npts or 1000
   local k = M1:size(1)
   local n = M1:size(2)
   local out1
   local out2
   local input
   if M2:type() == 'torch.CudaTensor' then
      input = torch.rand(npts,k):cuda()
      out1 = torch.CudaTensor(npts,n):zero()
      out2 = torch.CudaTensor(npts,n):zero()
   else
      input = torch.rand(npts,k):float()
      out1 = torch.FloatTensor(npts,n):zero()
      out2 = torch.FloatTensor(npts,n):zero()
   end

   for i = 1,npts do
      input[i]:mul(1/input[i]:norm())
   end
   out1:addmm(input,M1)
   out2:addmm(input,M2)

   local d1 = out1:norm(2,2)
   local d2 = out2:norm(2,2)
   return torch.max(d1) / torch.max(d2)
end