forked from ayanc/mdepth
-
Notifications
You must be signed in to change notification settings - Fork 0
/
loadModel.m
153 lines (120 loc) · 3.98 KB
/
loadModel.m
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
% function net = loadModel(path_to_model_file)
%
% Load kernels, bins, and network weights from trained model.
%
% path = Full path of trained caffemodel.h5 file
%
%-- Ayan Chakrabarti <[email protected]>
function net = loadModel(mh5)
% Network Definition
layers = {{ 'conv1', 1, 1}, { 'conv2', 1, 1}, { 'conv3', 1, 1}, { 'conv4', 2, 1}, { 'conv5', 4, 1}, { 'conv6', 8, 1}, { 'conv7', 16, 1}, { 'conv8', 16, 1}, { 'conv9', 16, 1}, { 'pred0', 16, 0}, };
% Build struct with all details
net = struct;
% Get filters and bin centers
k = squeeze(h5read(mh5,'/data/derFilt/0'));
net.numk = size(k,3);
k = k(end:-1:1,end:-1:1,:);
k = permute(k,[2 1 3]);
net.bins = -squeeze(h5read(mh5,'/data/fBins/1'));
net.nbins = length(net.bins) / net.numk;
net.bins = reshape(net.bins,[net.nbins net.numk]);
scales = squeeze(h5read(mh5,'/data/fBins/0'));
scales = scales(1:net.nbins:end);
scales = reshape(scales,[1 1 net.numk]);
net.k = bsxfun(@times,k,scales);
% Set up local path
net.layers = {}; rsize = 1;
for i = 1:length(layers)
l = layers{i};
dil = l{2}; relu = l{3};
wts = h5read(mh5,['/data/' l{1} '/0']);
wts = permute(wts,[2 1 3 4]);
bias = h5read(mh5,['/data/' l{1} '/1']);
net.layers{end+1} = {wts, bias, dil, relu};
rsize = rsize + (size(wts,1)-1)*dil;
end;
net.rsize = rsize;
% Set up VGG-19 path
net.vconvs = [2 2 4 4 4];
net.vlayers = {};
for i = 1:length(net.vconvs)
for j = 1:net.vconvs(i)
w = h5read(mh5,sprintf('/data/conv%d_%d/0',i,j));
b = h5read(mh5,sprintf('/data/conv%d_%d/1',i,j));
net.vlayers{end+1} = {w,b};
end;
end;
w = h5read(mh5,'/data/vgg_fc1/0');
b = h5read(mh5,'/data/vgg_fc1/1');
net.vgg_fc1 = {w',b};
w = h5read(mh5,'/data/vgg_fc2/0');
b = h5read(mh5,'/data/vgg_fc2/1');
net.vgg_gfp = {w',b};
fac = 32;
bw = ceil(560/fac)+1; bh = ceil(426/fac)+1;
nUnits = length(b)/bw/bh;
net.gsz = [bw bh nUnits fac];
% Move everything to gpu
if 1 > 2
for i = 1:length(net.layers)
net.layers{i}{1} = gpuArray(single(net.layers{i}{1}));
net.layers{i}{2} = gpuArray(single(net.layers{i}{2}));
end;
for i = 1:length(net.vlayers)
net.vlayers{i}{1} = gpuArray(single(net.vlayers{i}{1}));
net.vlayers{i}{2} = gpuArray(single(net.vlayers{i}{2}));
end;
net.vgg_fc1{1} = gpuArray(single(net.vgg_fc1{1}));
net.vgg_fc1{2} = gpuArray(single(net.vgg_fc1{2}));
net.vgg_gfp{1} = gpuArray(single(net.vgg_gfp{1}));
net.vgg_gfp{2} = gpuArray(single(net.vgg_gfp{2}));
end;
%%%% Precompute things for consensus
%%% Choose regularizer
rfilt = [-1 2 -1];
rf1 = [0 0 0; rfilt; 0 0 0]; rf2 = diag(rfilt);
regf = cat(3,rf1,rf1',rf2,fliplr(rf2));
% set up sizes
filt_x = (size(net.k,1)-1)/2; % Filter size
tot_x = 2*filt_x; % Increase FFT size by this much
Zht = 427+2*tot_x;
Zwd = 561+2*tot_x;
% Pad, shift and DFT of filters
Kf = padarray(net.k,[Zht Zwd] - size(net.k,1),'post');
Kf = circshift(Kf,-filt_x*[1 1]);
Kf = gpuArray(single(Kf));
% Scale everything
ksc = sqrt(1./sum(sum(net.k.^2,1),2));
% Downweight 0th derivs
zdidx = min(min(net.k,[],1),[],2);
zdidx = find(zdidx >= 0);
ksc(zdidx) = ksc(zdidx)/4;
ksc = gpuArray(single(ksc));
Kf = bsxfun(@times,Kf,ksc);
Kf = fft2(Kf); Kfc = conj(Kf); Kfm = sum(Kf.*Kfc,3);
net.Kf = Kf; net.Kfc = Kfc; net.Kfm = Kfm;
% Add regularizer
Rf = padarray(regf,[Zht Zwd]-size(regf,1),'post');
Rf = circshift(Rf,-(size(regf,1)-1)/2*[1 1]);
Rf = gpuArray(single(Rf));
Rf = fft2(Rf); Rf = sum(Rf.*conj(Rf),3);
net.Rf = Rf;
% Move bin-centers to gpu
bins = net.bins'; bins = reshape(bins,[1 1 size(bins)]);
bins = gpuArray(single(bins));
net.bins = bsxfun(@times,bins,ksc);
% Fix last layer to give scaled log-likelihoods, permuted to be
% HxWxKxB
wts = net.layers{end}{1}; bias = net.layers{end}{2};
osz = size(wts);
wts = reshape(wts, [prod(osz)/net.numk/net.nbins ...
net.nbins net.numk]);
wts = permute(wts,[1 3 2]);
wts = reshape(wts,osz); net.layers{end}{1} = wts;
osz = size(bias);
bias = reshape(bias, [1 net.nbins net.numk]);
bias = permute(bias,[1 3 2]);
bias = reshape(bias,osz);
net.layers{end}{2} = bias;
% Store multiplier for doForward output
net.ksc = -2*ksc.^2;