Caffe-DeepBinaryCode/src/caffe/layers/spp_layer.cpp at master · feiyuhug/Caffe-DeepBinaryCode

History

193 lines (164 loc) · 6.65 KB

Raw

100

101

102

103

104

105

106

107

108

109

110

111

112

113

114

115

116

117

118

119

120

121

122

123

124

125

126

127

128

129

130

131

132

133

134

135

136

137

138

139

140

141

142

143

144

145

146

147

148

149

150

151

152

153

154

155

156

157

158

159

160

161

162

163

164

165

166

167

168

169

170

171

172

173

174

175

176

177

178

179

180

181

182

183

184

185

186

187

188

189

190

191

192

193

#include <algorithm>

#include <cfloat>

#include <vector>

#include "caffe/common.hpp"

#include "caffe/layer.hpp"

#include "caffe/syncedmem.hpp"

#include "caffe/util/math_functions.hpp"

#include "caffe/vision_layers.hpp"

namespace caffe {

using std::min;

using std::max;

/**
 * @brief Builds the LayerParameter for the pooling layer of one pyramid level.
 *
 * Level @p pyramid_level splits the input into 2^pyramid_level bins along each
 * spatial axis. Kernel and stride are both ceil(dim / num_bins), and the
 * padding is chosen so that num_bins windows cover the whole (padded) input.
 *
 * @param pyramid_level zero-based pyramid level; must lie in [0, 31)
 * @param bottom_h      input height (expected to be non-negative)
 * @param bottom_w      input width (expected to be non-negative)
 * @param spp_param     SPP configuration; only pool() is read here
 * @return LayerParameter whose pooling_param has pad, kernel, stride and the
 *         pooling method filled in
 *
 * Aborts via CHECK / LOG(FATAL) on an out-of-range level or an unknown
 * pooling method.
 */
template <typename Dtype>
LayerParameter SPPLayer<Dtype>::GetPoolingParam(const int pyramid_level,
      const int bottom_h, const int bottom_w, const SPPParameter spp_param) {
  // Guard the shift below: a negative or >= 31 shift of an int is undefined.
  CHECK_GE(pyramid_level, 0) << "Pyramid level cannot be negative.";
  CHECK_LT(pyramid_level, 31) << "Pyramid level is too large.";

  // Exact integer power of two. The previous pow(2, level) went through
  // floating point and was truncated on conversion back to int.
  const int num_bins = 1 << pyramid_level;

  // Find padding and kernel size so that the pooling is performed across the
  // entire image. Integer ceiling division: ceil(bottom_h / num_bins).
  const int kernel_h =
      bottom_h / num_bins + ((bottom_h % num_bins != 0) ? 1 : 0);
  // remainder_h is the min number of pixels that need to be padded before the
  // entire image height is pooled over with the chosen kernel dimension.
  const int remainder_h = kernel_h * num_bins - bottom_h;
  // The pooling layer applies pad_h to both the top and the bottom of the
  // image (2 * pad_h rows in total), so halve the remainder, rounding up.
  const int pad_h = (remainder_h + 1) / 2;

  // Same logic for the width.
  const int kernel_w =
      bottom_w / num_bins + ((bottom_w % num_bins != 0) ? 1 : 0);
  const int remainder_w = kernel_w * num_bins - bottom_w;
  const int pad_w = (remainder_w + 1) / 2;

  LayerParameter pooling_param;
  PoolingParameter* pool = pooling_param.mutable_pooling_param();
  pool->set_pad_h(pad_h);
  pool->set_pad_w(pad_w);
  pool->set_kernel_h(kernel_h);
  pool->set_kernel_w(kernel_w);
  // Stride equals kernel size, so the pooling windows do not overlap.
  pool->set_stride_h(kernel_h);
  pool->set_stride_w(kernel_w);

  // Translate the SPP pooling method into the matching PoolingParameter one.
  switch (spp_param.pool()) {
  case SPPParameter_PoolMethod_MAX:
    pool->set_pool(PoolingParameter_PoolMethod_MAX);
    break;
  case SPPParameter_PoolMethod_AVE:
    pool->set_pool(PoolingParameter_PoolMethod_AVE);
    break;
  case SPPParameter_PoolMethod_STOCHASTIC:
    pool->set_pool(PoolingParameter_PoolMethod_STOCHASTIC);
    break;
  default:
    LOG(FATAL) << "Unknown pooling method.";
  }

  return pooling_param;
}

namespace {

// Deletes every object owned through the raw pointers in *owned, then
// empties the vector.
template <typename T>
void DeleteAndClear(std::vector<T*>* owned) {
  for (size_t i = 0; i < owned->size(); ++i) {
    delete (*owned)[i];
  }
  owned->clear();
}

}  // namespace

/**
 * @brief Creates the internal split -> (pooling -> flatten) x N -> concat
 *        pipeline, where N is the configured pyramid height.
 *
 * One pooling/flatten pair is created per pyramid level; every pair reads one
 * output of the split layer and all flattened results feed the concat layer,
 * which writes into @p top.
 *
 * @param bottom input blobs; bottom[0] supplies the height and width
 * @param top    output blobs, set up by the internal concat layer
 *
 * Aborts via CHECK if the input height/width or the pyramid height is not
 * positive.
 */
template <typename Dtype>
void SPPLayer<Dtype>::LayerSetUp(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top) {
  const SPPParameter& spp_param = this->layer_param_.spp_param();

  bottom_h_ = bottom[0]->height();
  bottom_w_ = bottom[0]->width();
  CHECK_GT(bottom_h_, 0) << "Input dimensions cannot be zero.";
  CHECK_GT(bottom_w_, 0) << "Input dimensions cannot be zero.";

  pyramid_height_ = spp_param.pyramid_height();
  // With zero levels the concat layer below would be handed an empty bottom
  // vector, so fail early with a readable message instead.
  CHECK_GT(pyramid_height_, 0) << "Pyramid height must be positive.";

  // Release anything left over from a previous setup before rebuilding.
  // The non-owning views go first; each heap object is then deleted exactly
  // once through the vector that allocated it. The holder vectors
  // (pooling_bottom_vecs_, pooling_top_vecs_, flatten_top_vecs_) own only the
  // inner vector objects, not the blobs those vectors point to.
  concat_bottom_vec_.clear();
  pooling_layers_.clear();
  DeleteAndClear(&flatten_layers_);
  DeleteAndClear(&flatten_top_vecs_);
  DeleteAndClear(&flatten_outputs_);
  DeleteAndClear(&pooling_top_vecs_);
  DeleteAndClear(&pooling_outputs_);
  DeleteAndClear(&pooling_bottom_vecs_);
  DeleteAndClear(&split_top_vec_);

  // split layer output holders setup
  for (int i = 0; i < pyramid_height_; ++i) {
    split_top_vec_.push_back(new Blob<Dtype>());
  }

  // split layer setup
  LayerParameter split_param;
  split_layer_.reset(new SplitLayer<Dtype>(split_param));
  split_layer_->SetUp(bottom, split_top_vec_);

  for (int i = 0; i < pyramid_height_; ++i) {
    // pooling layer input holders setup
    pooling_bottom_vecs_.push_back(new vector<Blob<Dtype>*>);
    pooling_bottom_vecs_[i]->push_back(split_top_vec_[i]);

    // pooling layer output holders setup
    pooling_outputs_.push_back(new Blob<Dtype>());
    pooling_top_vecs_.push_back(new vector<Blob<Dtype>*>);
    pooling_top_vecs_[i]->push_back(pooling_outputs_[i]);

    // pooling layer setup
    LayerParameter pooling_param = GetPoolingParam(
        i, bottom_h_, bottom_w_, spp_param);
    pooling_layers_.push_back(shared_ptr<PoolingLayer<Dtype> > (
        new PoolingLayer<Dtype>(pooling_param)));
    pooling_layers_[i]->SetUp(*pooling_bottom_vecs_[i], *pooling_top_vecs_[i]);

    // flatten layer output holders setup
    flatten_outputs_.push_back(new Blob<Dtype>());
    flatten_top_vecs_.push_back(new vector<Blob<Dtype>*>);
    flatten_top_vecs_[i]->push_back(flatten_outputs_[i]);

    // flatten layer setup
    LayerParameter flatten_param;
    flatten_layers_.push_back(new FlattenLayer<Dtype>(flatten_param));
    flatten_layers_[i]->SetUp(*pooling_top_vecs_[i], *flatten_top_vecs_[i]);

    // concat layer input holders setup
    concat_bottom_vec_.push_back(flatten_outputs_[i]);
  }

  // concat layer setup
  LayerParameter concat_param;
  concat_layer_.reset(new ConcatLayer<Dtype>(concat_param));
  concat_layer_->SetUp(concat_bottom_vec_, top);
}

/**
 * @brief Re-derives every internal blob shape from the current input shape.
 *
 * Caches the channel count, height and width of bottom[0], reshapes the split
 * layer, then for each pyramid level replaces the pooling layer with one
 * built for the current height/width and reshapes the pooling and flatten
 * stages. The concat layer is reshaped last and shapes @p top.
 *
 * @param bottom input blobs; bottom[0] must have exactly 4 axes
 * @param top    output blobs, reshaped by the internal concat layer
 */
template <typename Dtype>
void SPPLayer<Dtype>::Reshape(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top) {
  CHECK_EQ(4, bottom[0]->num_axes()) << "Input must have 4 axes, "
      << "corresponding to (num, channels, height, width)";

  const Blob<Dtype>* const input = bottom[0];
  channels_ = input->channels();
  bottom_h_ = input->height();
  bottom_w_ = input->width();

  const SPPParameter spp_param = this->layer_param_.spp_param();
  split_layer_->Reshape(bottom, split_top_vec_);

  for (int level = 0; level < pyramid_height_; ++level) {
    const vector<Blob<Dtype>*>& pool_in = *pooling_bottom_vecs_[level];
    const vector<Blob<Dtype>*>& pool_out = *pooling_top_vecs_[level];
    const vector<Blob<Dtype>*>& flat_out = *flatten_top_vecs_[level];

    // The kernel, stride and pad depend on the input size, so the pooling
    // layer is rebuilt from fresh parameters rather than reshaped in place.
    const LayerParameter level_param =
        GetPoolingParam(level, bottom_h_, bottom_w_, spp_param);
    pooling_layers_[level].reset(new PoolingLayer<Dtype>(level_param));
    pooling_layers_[level]->SetUp(pool_in, pool_out);
    pooling_layers_[level]->Reshape(pool_in, pool_out);

    flatten_layers_[level]->Reshape(pool_out, flat_out);
  }

  concat_layer_->Reshape(concat_bottom_vec_, top);
}

/**
 * @brief Runs the forward pass through the internal pipeline.
 *
 * The split layer forwards @p bottom into one blob per pyramid level; each
 * level is pooled and then flattened; the concat layer finally joins all
 * flattened outputs into @p top.
 *
 * @param bottom input blobs
 * @param top    output blobs, written by the internal concat layer
 */
template <typename Dtype>
void SPPLayer<Dtype>::Forward_cpu(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top) {
  split_layer_->Forward(bottom, split_top_vec_);

  for (int level = 0; level < pyramid_height_; ++level) {
    const vector<Blob<Dtype>*>& pool_in = *pooling_bottom_vecs_[level];
    const vector<Blob<Dtype>*>& pool_out = *pooling_top_vecs_[level];
    const vector<Blob<Dtype>*>& flat_out = *flatten_top_vecs_[level];

    pooling_layers_[level]->Forward(pool_in, pool_out);
    flatten_layers_[level]->Forward(pool_out, flat_out);
  }

  concat_layer_->Forward(concat_bottom_vec_, top);
}

/**
 * @brief Runs the backward pass through the internal pipeline, visiting the
 *        stages in the reverse of the forward order.
 *
 * Does nothing when propagate_down[0] is false. Otherwise the concat layer
 * is run backward with propagation enabled for every pyramid level, then each
 * level's flatten and pooling layers, and finally the split layer into
 * @p bottom.
 *
 * @param top            output blobs, passed to the concat layer's Backward
 * @param propagate_down only element 0 is inspected here; the whole vector is
 *                       forwarded to the flatten, pooling and split layers
 * @param bottom         input blobs, passed to the split layer's Backward
 */
template <typename Dtype>
void SPPLayer<Dtype>::Backward_cpu(const vector<Blob<Dtype>*>& top,
      const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom) {
  if (propagate_down[0]) {
    // Every pyramid level feeds the concat layer, so all of its inputs need
    // to receive gradients.
    const vector<bool> every_level(pyramid_height_, true);
    concat_layer_->Backward(top, every_level, concat_bottom_vec_);

    for (int level = 0; level < pyramid_height_; ++level) {
      const vector<Blob<Dtype>*>& pool_in = *pooling_bottom_vecs_[level];
      const vector<Blob<Dtype>*>& pool_out = *pooling_top_vecs_[level];
      const vector<Blob<Dtype>*>& flat_out = *flatten_top_vecs_[level];

      flatten_layers_[level]->Backward(flat_out, propagate_down, pool_out);
      pooling_layers_[level]->Backward(pool_out, propagate_down, pool_in);
    }

    split_layer_->Backward(split_top_vec_, propagate_down, bottom);
  }
}

// NOTE(review): INSTANTIATE_CLASS is defined outside this file; presumably it
// emits the explicit template instantiations of SPPLayer for the supported
// Dtype(s) -- confirm against its definition.
INSTANTIATE_CLASS(SPPLayer);

// NOTE(review): REGISTER_LAYER_CLASS is defined outside this file; presumably
// it registers SPPLayer with the layer factory under the type name "SPP" --
// confirm against its definition.
REGISTER_LAYER_CLASS(SPP);

} // namespace caffe

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

spp_layer.cpp

Latest commit

History

spp_layer.cpp

File metadata and controls