r-cnn學習（五）：SmoothL1LossLayer論文與代碼的結合理解

本文轉載自查看原文 2016-12-06 11:41 11108 R-CNN

A Loss Function for Learning Region Proposals

訓練RPN時，只對兩種anchor給予正標簽：和gt_box有着最高的IoU && IoU超過0.7。如果對於

所有的gt_box，其IoU都小於0.3，則標記為負。損失函數定義如下：

其中i為一個mini-batch中某anchor的索引，p_i表示其為目標的預測概率,p_i*表示gt_box（正為1，否則為0）。

t_i和t_i*分別表示預測框的位置和gt_box框的位置。L_reg如下：

bound-box regression中各參數的計算方式為：

（4）

其對應的SmoothL1LossLayer代碼如下，整個過程分為兩部分：前向計算以及后向計算（1）式的后半部分：

// ------------------------------------------------------------------  
// Fast R-CNN  
// Copyright (c) 2015 Microsoft  
// Licensed under The MIT License [see fast-rcnn/LICENSE for details]  
// Written by Ross Girshick  
// ------------------------------------------------------------------  
  
#include "caffe/fast_rcnn_layers.hpp" 
 namespace caffe { //SmoothL1前向計算（3）式  template <typename Dtype>  
__global__ void SmoothL1Forward(const int n, const Dtype* in, Dtype* out, Dtype sigma2) { // f(x) = 0.5 * (sigma * x)^2          if |x| < 1 / sigma / sigma //        |x| - 0.5 / sigma / sigma otherwise CUDA_KERNEL_LOOP(index, n) { Dtype val = in[index]; Dtype abs_val = abs(val); if (abs_val < 1.0 / sigma2) { out[index] = 0.5 * val * val * sigma2; } else { out[index] = abs_val - 0.5 / sigma2; } } } // template <typename Dtype> void SmoothL1LossLayer<Dtype>::Forward_gpu(const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top) { int count = bottom[0]->count(); caffe_gpu_sub( count, bottom[0]->gpu_data(), //t_i bottom[1]->gpu_data(), //t_i* diff_.mutable_gpu_data()); // d := t_i-t_i^* if (has_weights_) { //乘上相關的權重，對應於（1）式中的p_i*,有目標時為1 // apply "inside" weights caffe_gpu_mul( count, bottom[2]->gpu_data(), //p_i* diff_.gpu_data(), diff_.mutable_gpu_data()); // d := w_in * (b0 - b1) } 
 //代入計算SmoothL1 SmoothL1Forward<Dtype><<<CAFFE_GET_BLOCKS(count), CAFFE_CUDA_NUM_THREADS>>>( count, diff_.gpu_data(), errors_.mutable_gpu_data(), sigma2_); CUDA_POST_KERNEL_CHECK; if (has_weights_) { //乘上相關的權重 // apply "outside" weights caffe_gpu_mul( count, bottom[3]->gpu_data(), // 1/N_reg  errors_.gpu_data(), errors_.mutable_gpu_data()); // d := w_out * SmoothL1(w_in * (b0 - b1)) } Dtype loss; caffe_gpu_dot(count, ones_.gpu_data(), errors_.gpu_data(), &loss); top[0]->mutable_cpu_data()[0] = loss / bottom[0]->num(); } //反向計算，對smoothLoss求導  template <typename Dtype>  
__global__ void SmoothL1Backward(const int n, const Dtype* in, Dtype* out, Dtype sigma2) { // f'(x) = sigma * sigma * x if |x| < 1 / sigma / sigma 
  //       = sign(x) otherwise CUDA_KERNEL_LOOP(index, n) { Dtype val = in[index]; Dtype abs_val = abs(val); if (abs_val < 1.0 / sigma2) { out[index] = sigma2 * val; } else { out[index] = (Dtype(0) < val) - (val < Dtype(0)); } } } // template <typename Dtype> void SmoothL1LossLayer<Dtype>::Backward_gpu(const vector<Blob<Dtype>*>& top, const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom) { // after forwards, diff_ holds w_in * (b0 - b1) int count = diff_.count(); 
 //調用反向smoothloss，diff_.gpu_data()表示x，diff_.mutable_gpu_data()表示smoothloss的導數 SmoothL1Backward<Dtype><<<CAFFE_GET_BLOCKS(count), CAFFE_CUDA_NUM_THREADS>>>( count, diff_.gpu_data(), diff_.mutable_gpu_data(), sigma2_); 
 
 //類似於前向 CUDA_POST_KERNEL_CHECK; for (int i = 0; i < 2; ++i) { if (propagate_down[i]) { const Dtype sign = (i == 0) ? 1 : -1; const Dtype alpha = sign * top[0]->cpu_diff()[0] / bottom[i]->num(); caffe_gpu_axpby( count, // count alpha, // alpha diff_.gpu_data(), // x Dtype(0), // beta bottom[i]->mutable_gpu_diff());  // y if (has_weights_) { // Scale by "inside" weight caffe_gpu_mul( count, bottom[2]->gpu_data(), bottom[i]->gpu_diff(), bottom[i]->mutable_gpu_diff()); // Scale by "outside" weight caffe_gpu_mul( count, bottom[3]->gpu_data(), bottom[i]->gpu_diff(), bottom[i]->mutable_gpu_diff()); } } } } INSTANTIATE_LAYER_GPU_FUNCS(SmoothL1LossLayer); } // namespace caffe

免責聲明！

本站轉載的文章為個人學習借鑒使用，本站對版權不負任何法律責任。如果侵犯了您的隱私權益，請聯系本站郵箱yoyou2525@163.com刪除。

猜您在找 Mask R-CNN論文理解學習Faster R-CNN代碼rpn（六）學習Faster R-CNN代碼nms（七） R-CNN論文翻譯學習Faster R-CNN代碼demo（一）深度學習論文翻譯解析（十二）：Fast R-CNN r-cnn學習（二） r-cnn學習(一) Fast R-CNN（理解）學習Faster R-CNN代碼roi_pooling（三）