Caffe-DeepBinaryCode/src/caffe/layers/pooling_layer.cpp at master · feiyuhug/Caffe-DeepBinaryCode

History

319 lines (308 loc) · 11.3 KB

Raw

100

101

102

103

104

105

106

107

108

109

110

111

112

113

114

115

116

117

118

119

120

121

122

123

124

125

126

127

128

129

130

131

132

133

134

135

136

137

138

139

140

141

142

143

144

145

146

147

148

149

150

151

152

153

154

155

156

157

158

159

160

161

162

163

164

165

166

167

168

169

170

171

172

173

174

175

176

177

178

179

180

181

182

183

184

185

186

187

188

189

190

191

192

193

194

195

196

197

198

199

200

201

202

203

204

205

206

207

208

209

210

211

212

213

214

215

216

217

218

219

220

221

222

223

224

225

226

227

228

229

230

231

232

233

234

235

236

237

238

239

240

241

242

243

244

245

246

247

248

249

250

251

252

253

254

255

256

257

258

259

260

261

262

263

264

265

266

267

268

269

270

271

272

273

274

275

276

277

278

279

280

281

282

283

284

285

286

287

288

289

290

291

292

293

294

295

296

297

298

299

300

301

302

303

304

305

306

307

308

309

310

311

312

313

314

315

316

317

318

319

#include <algorithm>

#include <cfloat>

#include <vector>

#include "caffe/common.hpp"

#include "caffe/layer.hpp"

#include "caffe/syncedmem.hpp"

#include "caffe/util/math_functions.hpp"

#include "caffe/vision_layers.hpp"

namespace caffe {

using std::min;

using std::max;

// Reads this layer's PoolingParameter, validates it, and caches the pooling
// geometry (kernel, pad and stride sizes plus the global-pooling flag) in the
// corresponding member variables.
//
// bottom: input blobs. Only bottom[0] is consulted, and only for its
//         height/width when global pooling is requested.
// top:    output blobs. Not touched here.
//
// Any violated constraint fails the corresponding CHECK.
template <typename Dtype>
void PoolingLayer<Dtype>::LayerSetUp(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top) {
  const PoolingParameter& pool_param = this->layer_param_.pooling_param();

  // --- Kernel specification -------------------------------------------------
  if (pool_param.global_pooling()) {
    // The kernel is derived from the input size, so no explicit kernel field
    // may be present.
    CHECK(!(pool_param.has_kernel_size() ||
      pool_param.has_kernel_h() || pool_param.has_kernel_w()))
      << "With Global_pooling: true Filter size cannot specified";
  } else {
    // Exactly one of {kernel_size} or {kernel_h AND kernel_w} must be given.
    CHECK(!pool_param.has_kernel_size() !=
      !(pool_param.has_kernel_h() && pool_param.has_kernel_w()))
      << "Filter size is kernel_size OR kernel_h and kernel_w; not both";
    CHECK(pool_param.has_kernel_size() ||
      (pool_param.has_kernel_h() && pool_param.has_kernel_w()))
      << "For non-square filters both kernel_h and kernel_w are required.";
  }

  // --- Pad / stride specification --------------------------------------------
  // Either both per-axis values are given (and the square shorthand is not),
  // or neither per-axis value is given.
  CHECK((!pool_param.has_pad() && pool_param.has_pad_h()
      && pool_param.has_pad_w())
      || (!pool_param.has_pad_h() && !pool_param.has_pad_w()))
      << "pad is pad OR pad_h and pad_w are required.";
  CHECK((!pool_param.has_stride() && pool_param.has_stride_h()
      && pool_param.has_stride_w())
      || (!pool_param.has_stride_h() && !pool_param.has_stride_w()))
      << "Stride is stride OR stride_h and stride_w are required.";

  // --- Cache the kernel size -------------------------------------------------
  global_pooling_ = pool_param.global_pooling();
  if (global_pooling_) {
    // Global pooling: one window covering the whole input plane.
    kernel_h_ = bottom[0]->height();
    kernel_w_ = bottom[0]->width();
  } else {
    if (pool_param.has_kernel_size()) {
      kernel_h_ = kernel_w_ = pool_param.kernel_size();
    } else {
      kernel_h_ = pool_param.kernel_h();
      kernel_w_ = pool_param.kernel_w();
    }
  }
  CHECK_GT(kernel_h_, 0) << "Filter dimensions cannot be zero.";
  CHECK_GT(kernel_w_, 0) << "Filter dimensions cannot be zero.";

  // --- Cache the padding -----------------------------------------------------
  if (!pool_param.has_pad_h()) {
    pad_h_ = pad_w_ = pool_param.pad();
  } else {
    pad_h_ = pool_param.pad_h();
    pad_w_ = pool_param.pad_w();
  }

  // --- Cache the stride ------------------------------------------------------
  if (!pool_param.has_stride_h()) {
    stride_h_ = stride_w_ = pool_param.stride();
  } else {
    stride_h_ = pool_param.stride_h();
    stride_w_ = pool_param.stride_w();
  }
  // Reshape() divides by the stride when computing the pooled size, so a
  // zero stride must be rejected here rather than surfacing as a bad shape.
  CHECK_GT(stride_h_, 0) << "Stride cannot be zero.";
  CHECK_GT(stride_w_, 0) << "Stride cannot be zero.";

  if (global_pooling_) {
    CHECK(pad_h_ == 0 && pad_w_ == 0 && stride_h_ == 1 && stride_w_ == 1)
      << "With Global_pooling: true; only pad = 0 and stride = 1";
  }

  if (pad_h_ != 0 || pad_w_ != 0) {
    CHECK(pool_param.pool() == PoolingParameter_PoolMethod_AVE
        || pool_param.pool() == PoolingParameter_PoolMethod_MAX)
        << "Padding implemented only for average and max pooling.";
    // The padding must be smaller than the kernel along each axis.
    CHECK_LT(pad_h_, kernel_h_);
    CHECK_LT(pad_w_, kernel_w_);
  }
}

// Computes the pooled output size from the current input shape and resizes
// the top blob(s) and the auxiliary index buffers accordingly.
//
// bottom: input blobs; bottom[0] must have exactly 4 axes
//         (num, channels, height, width).
// top:    output blobs; top[0] receives the pooled shape and, when present,
//         top[1] is reshaped to match top[0].
template <typename Dtype>
void PoolingLayer<Dtype>::Reshape(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top) {
  CHECK_EQ(4, bottom[0]->num_axes()) << "Input must have 4 axes, "
      << "corresponding to (num, channels, height, width)";
  channels_ = bottom[0]->channels();
  height_ = bottom[0]->height();
  width_ = bottom[0]->width();
  if (global_pooling_) {
    // The input size may differ from the one seen in LayerSetUp, so the
    // whole-plane kernel is refreshed on every reshape.
    kernel_h_ = bottom[0]->height();
    kernel_w_ = bottom[0]->width();
  }

  // pooled = ceil((input + 2 * pad - kernel) / stride) + 1
  pooled_height_ = static_cast<int>(ceil(static_cast<float>(
      height_ + 2 * pad_h_ - kernel_h_) / stride_h_)) + 1;
  pooled_width_ = static_cast<int>(ceil(static_cast<float>(
      width_ + 2 * pad_w_ - kernel_w_) / stride_w_)) + 1;

  if (pad_h_ || pad_w_) {
    // If we have padding, ensure that the last pooling starts strictly
    // inside the image (instead of at the padding); otherwise clip the last.
    if ((pooled_height_ - 1) * stride_h_ >= height_ + pad_h_) {
      --pooled_height_;
    }
    if ((pooled_width_ - 1) * stride_w_ >= width_ + pad_w_) {
      --pooled_width_;
    }
    CHECK_LT((pooled_height_ - 1) * stride_h_, height_ + pad_h_);
    CHECK_LT((pooled_width_ - 1) * stride_w_, width_ + pad_w_);
  }

  top[0]->Reshape(bottom[0]->num(), channels_, pooled_height_,
      pooled_width_);
  if (top.size() > 1) {
    top[1]->ReshapeLike(*top[0]);
  }

  // If max pooling, we will initialize the vector index part. The internal
  // buffer is only needed when no second top blob is supplied.
  if (this->layer_param_.pooling_param().pool() ==
      PoolingParameter_PoolMethod_MAX && top.size() == 1) {
    max_idx_.Reshape(bottom[0]->num(), channels_, pooled_height_,
        pooled_width_);
  }

  // If stochastic pooling, we will initialize the random index part.
  if (this->layer_param_.pooling_param().pool() ==
      PoolingParameter_PoolMethod_STOCHASTIC) {
    rand_idx_.Reshape(bottom[0]->num(), channels_, pooled_height_,
        pooled_width_);
  }
}

// TODO(Yangqing): Is there a faster way to do pooling in the channel-first
// case?
//
// CPU forward pass: pools bottom[0] into top[0] using the method selected in
// the layer's pooling_param.
//
// MAX: every output is the maximum over its window, clipped to the image.
//      The index of the winning input, relative to the start of its channel
//      plane (h * width_ + w), is stored in top[1] when a second top blob
//      exists and in max_idx_ otherwise. Index slots start at -1 and outputs
//      start at -FLT_MAX; both keep those values if no input in the window
//      compares greater than the running maximum.
// AVE: every output is the sum over the window clipped to the image, divided
//      by the window area clipped only to the padded extent, so padded
//      positions count towards the divisor.
// STOCHASTIC: not implemented on the CPU.
template <typename Dtype>
void PoolingLayer<Dtype>::Forward_cpu(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top) {
  const Dtype* bottom_data = bottom[0]->cpu_data();
  Dtype* top_data = top[0]->mutable_cpu_data();
  const int top_count = top[0]->count();
  // We'll output the mask to top[1] if it's of size >1.
  const bool use_top_mask = top.size() > 1;
  int* mask = NULL;  // suppress warnings about uninitialized variables
  Dtype* top_mask = NULL;
  // Different pooling methods. We explicitly do the switch outside the for
  // loop to save time, although this results in more code.
  switch (this->layer_param_.pooling_param().pool()) {
  case PoolingParameter_PoolMethod_MAX:
    // Initialize
    if (use_top_mask) {
      top_mask = top[1]->mutable_cpu_data();
      caffe_set(top_count, Dtype(-1), top_mask);
    } else {
      mask = max_idx_.mutable_cpu_data();
      caffe_set(top_count, -1, mask);
    }
    caffe_set(top_count, Dtype(-FLT_MAX), top_data);
    // The main loop
    for (int n = 0; n < bottom[0]->num(); ++n) {
      for (int c = 0; c < channels_; ++c) {
        for (int ph = 0; ph < pooled_height_; ++ph) {
          for (int pw = 0; pw < pooled_width_; ++pw) {
            // Window in input coordinates, then clipped to the image.
            int hstart = ph * stride_h_ - pad_h_;
            int wstart = pw * stride_w_ - pad_w_;
            int hend = min(hstart + kernel_h_, height_);
            int wend = min(wstart + kernel_w_, width_);
            hstart = max(hstart, 0);
            wstart = max(wstart, 0);
            const int pool_index = ph * pooled_width_ + pw;
            for (int h = hstart; h < hend; ++h) {
              for (int w = wstart; w < wend; ++w) {
                const int index = h * width_ + w;
                if (bottom_data[index] > top_data[pool_index]) {
                  top_data[pool_index] = bottom_data[index];
                  if (use_top_mask) {
                    top_mask[pool_index] = static_cast<Dtype>(index);
                  } else {
                    mask[pool_index] = index;
                  }
                }
              }
            }
          }
        }
        // compute offset: advance every pointer to the next channel plane
        bottom_data += bottom[0]->offset(0, 1);
        top_data += top[0]->offset(0, 1);
        if (use_top_mask) {
          top_mask += top[0]->offset(0, 1);
        } else {
          mask += top[0]->offset(0, 1);
        }
      }
    }
    break;
  case PoolingParameter_PoolMethod_AVE:
    // Outputs are accumulated in place, so start from zero.
    caffe_set(top_count, Dtype(0), top_data);
    // The main loop
    for (int n = 0; n < bottom[0]->num(); ++n) {
      for (int c = 0; c < channels_; ++c) {
        for (int ph = 0; ph < pooled_height_; ++ph) {
          for (int pw = 0; pw < pooled_width_; ++pw) {
            int hstart = ph * stride_h_ - pad_h_;
            int wstart = pw * stride_w_ - pad_w_;
            int hend = min(hstart + kernel_h_, height_ + pad_h_);
            int wend = min(wstart + kernel_w_, width_ + pad_w_);
            // The divisor is taken before clipping to the image, so it
            // includes the padded part of the window.
            int pool_size = (hend - hstart) * (wend - wstart);
            hstart = max(hstart, 0);
            wstart = max(wstart, 0);
            hend = min(hend, height_);
            wend = min(wend, width_);
            for (int h = hstart; h < hend; ++h) {
              for (int w = wstart; w < wend; ++w) {
                top_data[ph * pooled_width_ + pw] +=
                    bottom_data[h * width_ + w];
              }
            }
            top_data[ph * pooled_width_ + pw] /= pool_size;
          }
        }
        // compute offset: advance both pointers to the next channel plane
        bottom_data += bottom[0]->offset(0, 1);
        top_data += top[0]->offset(0, 1);
      }
    }
    break;
  case PoolingParameter_PoolMethod_STOCHASTIC:
    NOT_IMPLEMENTED;
    break;
  default:
    LOG(FATAL) << "Unknown pooling method.";
  }
}

// CPU backward pass: scatters the gradient in top[0] back into bottom[0]'s
// diff.
//
// top:            top[0] supplies the incoming gradient; for MAX pooling,
//                 top[1] (when present) supplies the argmax indices,
//                 otherwise max_idx_ is used.
// propagate_down: nothing is done unless propagate_down[0] is true.
// bottom:         bottom[0]'s diff is zeroed and then accumulated into.
//
// MAX: each output's gradient is added to the single input recorded as its
//      maximum.
// AVE: each output's gradient is divided by the same padded window area the
//      forward pass used and added to every in-image input of the window.
// STOCHASTIC: not implemented on the CPU.
template <typename Dtype>
void PoolingLayer<Dtype>::Backward_cpu(const vector<Blob<Dtype>*>& top,
      const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom) {
  if (!propagate_down[0]) {
    return;
  }
  const Dtype* top_diff = top[0]->cpu_diff();
  Dtype* bottom_diff = bottom[0]->mutable_cpu_diff();
  // Different pooling methods. We explicitly do the switch outside the for
  // loop to save time, although this results in more codes.
  caffe_set(bottom[0]->count(), Dtype(0), bottom_diff);
  // We'll output the mask to top[1] if it's of size >1.
  const bool use_top_mask = top.size() > 1;
  const int* mask = NULL;  // suppress warnings about uninitialized variables
  const Dtype* top_mask = NULL;
  switch (this->layer_param_.pooling_param().pool()) {
  case PoolingParameter_PoolMethod_MAX:
    // The main loop
    if (use_top_mask) {
      top_mask = top[1]->cpu_data();
    } else {
      mask = max_idx_.cpu_data();
    }
    for (int n = 0; n < top[0]->num(); ++n) {
      for (int c = 0; c < channels_; ++c) {
        for (int ph = 0; ph < pooled_height_; ++ph) {
          for (int pw = 0; pw < pooled_width_; ++pw) {
            const int index = ph * pooled_width_ + pw;
            const int bottom_index = use_top_mask ?
                static_cast<int>(top_mask[index]) : mask[index];
            // Forward_cpu leaves the index at -1 when no input in the window
            // exceeded the running maximum; such an output has no input to
            // route its gradient to, and indexing with -1 would write before
            // the start of the channel plane.
            if (bottom_index >= 0) {
              bottom_diff[bottom_index] += top_diff[index];
            }
          }
        }
        // advance every pointer to the next channel plane
        bottom_diff += bottom[0]->offset(0, 1);
        top_diff += top[0]->offset(0, 1);
        if (use_top_mask) {
          top_mask += top[0]->offset(0, 1);
        } else {
          mask += top[0]->offset(0, 1);
        }
      }
    }
    break;
  case PoolingParameter_PoolMethod_AVE:
    // The main loop
    for (int n = 0; n < top[0]->num(); ++n) {
      for (int c = 0; c < channels_; ++c) {
        for (int ph = 0; ph < pooled_height_; ++ph) {
          for (int pw = 0; pw < pooled_width_; ++pw) {
            int hstart = ph * stride_h_ - pad_h_;
            int wstart = pw * stride_w_ - pad_w_;
            int hend = min(hstart + kernel_h_, height_ + pad_h_);
            int wend = min(wstart + kernel_w_, width_ + pad_w_);
            // Same divisor as the forward pass: the window area before it is
            // clipped to the image.
            int pool_size = (hend - hstart) * (wend - wstart);
            hstart = max(hstart, 0);
            wstart = max(wstart, 0);
            hend = min(hend, height_);
            wend = min(wend, width_);
            for (int h = hstart; h < hend; ++h) {
              for (int w = wstart; w < wend; ++w) {
                bottom_diff[h * width_ + w] +=
                    top_diff[ph * pooled_width_ + pw] / pool_size;
              }
            }
          }
        }
        // offset: advance both pointers to the next channel plane
        bottom_diff += bottom[0]->offset(0, 1);
        top_diff += top[0]->offset(0, 1);
      }
    }
    break;
  case PoolingParameter_PoolMethod_STOCHASTIC:
    NOT_IMPLEMENTED;
    break;
  default:
    LOG(FATAL) << "Unknown pooling method.";
  }
}

// NOTE(review): STUB_GPU is defined outside this file; presumably it supplies
// placeholder GPU forward/backward definitions for builds made with CPU_ONLY
// -- confirm against the header that defines it.
#ifdef CPU_ONLY

STUB_GPU(PoolingLayer);

#endif

// NOTE(review): INSTANTIATE_CLASS is defined outside this file; presumably it
// explicitly instantiates the PoolingLayer template for the supported Dtype
// values so the definitions above are emitted in this translation unit --
// confirm against the macro definition.
INSTANTIATE_CLASS(PoolingLayer);

} // namespace caffe

Provide feedback

Saved searches

Use saved searches to filter your results more quickly

FilesExpand file tree

pooling_layer.cpp

Latest commit

History

pooling_layer.cpp

File metadata and controls