Caffe Framework Source Code Analysis (3): The Data Layer (DataLayer)
阿新 · Published 2018-10-31
When a Caffe network runs its forward pass, the DataLayer is the first layer to execute: it reads samples from the data source and feeds them to the next layer up, for example a convolution layer. On the backward pass there is nothing to propagate into a data layer, so its Backward_cpu() and Backward_gpu() are empty functions. The class hierarchy is BaseDataLayer → BasePrefetchingDataLayer → DataLayer, with BasePrefetchingDataLayer additionally inheriting from InternalThread.
We start with the parent class BaseDataLayer, declared in the base_data_layer.hpp header:
template <typename Dtype>
class BaseDataLayer : public Layer<Dtype> {
 public:
  // Constructor
  explicit BaseDataLayer(const LayerParameter& param);
  // Performs the common data-layer setup, then calls DataLayerSetUp()
  virtual void LayerSetUp(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top);
  // Data layers can be shared by multiple solvers running in parallel
  virtual inline bool ShareInParallel() const { return true; }
  // Empty setup hook (virtual; subclasses override it)
  virtual void DataLayerSetUp(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top) {}
  // Data layers have no bottom blobs, so Reshape is a no-op
  virtual void Reshape(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top) {}
  // Backward passes are empty functions
  virtual void Backward_cpu(const vector<Blob<Dtype>*>& top,
      const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom) {}
  virtual void Backward_gpu(const vector<Blob<Dtype>*>& top,
      const vector<bool>& propagate_down, const vector<Blob<Dtype>*>& bottom) {}

 protected:
  TransformationParameter transform_param_;
  shared_ptr<DataTransformer<Dtype> > data_transformer_;
  // Whether the layer also outputs labels
  bool output_labels_;
};
The corresponding base_data_layer.cpp implementation:
// Constructor
template <typename Dtype>
BaseDataLayer<Dtype>::BaseDataLayer(const LayerParameter& param)
    : Layer<Dtype>(param),
      transform_param_(param.transform_param()) {
}

template <typename Dtype>
void BaseDataLayer<Dtype>::LayerSetUp(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top) {
  // If there is more than one top blob, the second one carries labels
  if (top.size() == 1) {
    output_labels_ = false;
  } else {
    output_labels_ = true;
  }
  data_transformer_.reset(
      new DataTransformer<Dtype>(transform_param_, this->phase_));
  // Initialize the random number generator
  data_transformer_->InitRand();
  // Call the setup hook overridden by subclasses
  DataLayerSetUp(bottom, top);
}
Next comes the subclass BasePrefetchingDataLayer. It inherits not only from BaseDataLayer but also from InternalThread, and therefore overrides InternalThread's virtual function InternalThreadEntry(). Its two BlockingQueue members implement a producer-consumer hand-off between the prefetch thread and the forward pass, as sketched right after the class declaration below.
template <typename Dtype>
class BasePrefetchingDataLayer :
    public BaseDataLayer<Dtype>, public InternalThread {
 public:
  explicit BasePrefetchingDataLayer(const LayerParameter& param);
  // Setup function
  void LayerSetUp(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top);
  // CPU forward pass
  virtual void Forward_cpu(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top);
  // GPU forward pass
  virtual void Forward_gpu(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top);
  // Number of batches to prefetch
  static const int PREFETCH_COUNT = 3;

 protected:
  // Thread function, overriding the InternalThread virtual
  virtual void InternalThreadEntry();
  // Loads one batch; pure virtual, implemented by the subclass DataLayer
  virtual void load_batch(Batch<Dtype>* batch) = 0;

  Batch<Dtype> prefetch_[PREFETCH_COUNT];
  BlockingQueue<Batch<Dtype>*> prefetch_free_;
  BlockingQueue<Batch<Dtype>*> prefetch_full_;
  Blob<Dtype> transformed_data_;
};
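The two queues implement a producer-consumer hand-off: the prefetch thread pops an empty Batch from prefetch_free_, fills it, and pushes it onto prefetch_full_; the forward pass pops a filled Batch from prefetch_full_ and, once its contents have been copied out, returns it to prefetch_free_. For intuition, here is a minimal sketch of what such a blocking queue does, written with std::mutex and std::condition_variable. It is not Caffe's implementation (the real BlockingQueue in caffe/util/blocking_queue.hpp is boost-based and also offers peek() and wait logging), just the underlying idea:

#include <condition_variable>
#include <mutex>
#include <queue>

// Minimal blocking-queue sketch: push() never blocks,
// pop() blocks until an element is available.
template <typename T>
class SimpleBlockingQueue {
 public:
  void push(const T& t) {
    {
      std::lock_guard<std::mutex> lock(mutex_);
      queue_.push(t);
    }
    cond_.notify_one();  // wake one waiting consumer
  }
  T pop() {
    std::unique_lock<std::mutex> lock(mutex_);
    cond_.wait(lock, [this] { return !queue_.empty(); });  // block while empty
    T t = queue_.front();
    queue_.pop();
    return t;
  }

 private:
  std::queue<T> queue_;
  std::mutex mutex_;
  std::condition_variable cond_;
};

Because PREFETCH_COUNT is 3, at most three batches circulate between the two queues, so loading can run ahead of computation while memory use stays bounded.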
The implementation, again in base_data_layer.cpp:
template <typename Dtype>
BasePrefetchingDataLayer<Dtype>::BasePrefetchingDataLayer(
    const LayerParameter& param)
    : BaseDataLayer<Dtype>(param),
      prefetch_free_(), prefetch_full_() {
  // Initially, every preallocated Batch is free
  for (int i = 0; i < PREFETCH_COUNT; ++i) {
    prefetch_free_.push(&prefetch_[i]);
  }
}

template <typename Dtype>
void BasePrefetchingDataLayer<Dtype>::LayerSetUp(
    const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top) {
  // Call the parent class LayerSetUp first
  BaseDataLayer<Dtype>::LayerSetUp(bottom, top);
  // Allocate CPU and GPU memory before the thread starts,
  // to prevent failures on some GPUs
  for (int i = 0; i < PREFETCH_COUNT; ++i) {
    prefetch_[i].data_.mutable_cpu_data();
    if (this->output_labels_) {
      prefetch_[i].label_.mutable_cpu_data();
    }
  }
#ifndef CPU_ONLY
  if (Caffe::mode() == Caffe::GPU) {
    for (int i = 0; i < PREFETCH_COUNT; ++i) {
      prefetch_[i].data_.mutable_gpu_data();
      if (this->output_labels_) {
        prefetch_[i].label_.mutable_gpu_data();
      }
    }
  }
#endif
  DLOG(INFO) << "Initializing prefetch";
  // Initialize the random number generator
  this->data_transformer_->InitRand();
  // Start the prefetch thread
  StartInternalThread();
  DLOG(INFO) << "Prefetch initialized.";
}
// Thread body, started by StartInternalThread()
template <typename Dtype>
void BasePrefetchingDataLayer<Dtype>::InternalThreadEntry() {
#ifndef CPU_ONLY
  // On the GPU, use a CUDA stream for asynchronous loading
  cudaStream_t stream;
  if (Caffe::mode() == Caffe::GPU) {
    CUDA_CHECK(cudaStreamCreateWithFlags(&stream, cudaStreamNonBlocking));
  }
#endif

  try {
    while (!must_stop()) {
      // Take an empty batch from the free queue
      Batch<Dtype>* batch = prefetch_free_.pop();
      // Fill it; load_batch() is implemented by the subclass DataLayer
      load_batch(batch);
#ifndef CPU_ONLY
      if (Caffe::mode() == Caffe::GPU) {
        // data() returns the blob's shared_ptr<SyncedMemory>; async_gpu_push()
        // enqueues an asynchronous host-to-device copy on the stream
        batch->data_.data().get()->async_gpu_push(stream);
        CUDA_CHECK(cudaStreamSynchronize(stream));
      }
#endif
      // Hand the filled batch to the consumer
      prefetch_full_.push(batch);
    }
  } catch (boost::thread_interrupted&) {
    // Interrupted exception is expected on shutdown
  }
#ifndef CPU_ONLY
  if (Caffe::mode() == Caffe::GPU) {
    CUDA_CHECK(cudaStreamDestroy(stream));
  }
#endif
}
// CPU forward pass
template <typename Dtype>
void BasePrefetchingDataLayer<Dtype>::Forward_cpu(
    const vector<Blob<Dtype>*>& bottom, const vector<Blob<Dtype>*>& top) {
  // Block until the prefetch thread has produced a filled batch
  Batch<Dtype>* batch = prefetch_full_.pop("Data layer prefetch queue empty");
  // Reshape top[0] to the dimensions of the batch data
  top[0]->ReshapeLike(batch->data_);
  // Copy the batch data into top blob[0]
  caffe_copy(batch->data_.count(), batch->data_.cpu_data(),
             top[0]->mutable_cpu_data());
  DLOG(INFO) << "Prefetch copied";
  // If the layer also outputs labels
  if (this->output_labels_) {
    // Reshape top[1] to the dimensions of the batch labels
    top[1]->ReshapeLike(batch->label_);
    // Copy the batch labels into top blob[1]
    caffe_copy(batch->label_.count(), batch->label_.cpu_data(),
               top[1]->mutable_cpu_data());
  }
  // Return the consumed batch to the free queue for reuse
  prefetch_free_.push(batch);
}

// In CPU_ONLY mode, stub out Forward_gpu
// (Backward_gpu is already an empty function in BaseDataLayer)
#ifdef CPU_ONLY
STUB_GPU_FORWARD(BasePrefetchingDataLayer, Forward);
#endif
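STUB_GPU_FORWARD comes from caffe/util/device_alternate.hpp: in a CPU_ONLY build it generates a Forward_gpu() body that aborts with a fatal log message if anyone tries to run the layer on the GPU. Roughly, paraphrasing the macros from memory (check the header for the exact definitions):

// Sketch of the macros in caffe/util/device_alternate.hpp (CPU_ONLY build)
#define NO_GPU LOG(FATAL) << "Cannot use GPU in CPU-only Caffe: check mode."

#define STUB_GPU_FORWARD(classname, funcname) \
template <typename Dtype> \
void classname<Dtype>::funcname##_##gpu(const vector<Blob<Dtype>*>& bottom, \
    const vector<Blob<Dtype>*>& top) { NO_GPU; }

No stub is needed for Backward_gpu because BaseDataLayer already defines it as an empty function.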
Finally, the concrete subclass DataLayer. Since most of the machinery lives in its parent classes, this class is simple: it overrides only two virtual functions, DataLayerSetUp() and load_batch(). Rather than reading the database itself, it pulls Datum protobufs from a DataReader, which exposes the same free/full pair of blocking queues seen above, this time holding Datum* rather than Batch*.
template <typename Dtype>
class DataLayer : public BasePrefetchingDataLayer<Dtype> {
 public:
  explicit DataLayer(const LayerParameter& param);
  virtual ~DataLayer();
  // Setup hook, overriding the virtual function
  virtual void DataLayerSetUp(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top);
  // DataLayer uses DataReader instead for sharing for parallelism
  virtual inline bool ShareInParallel() const { return false; }
  virtual inline const char* type() const { return "Data"; }
  virtual inline int ExactNumBottomBlobs() const { return 0; }
  virtual inline int MinTopBlobs() const { return 1; }
  virtual inline int MaxTopBlobs() const { return 2; }

 protected:
  // Loads one batch, overriding the pure virtual function
  virtual void load_batch(Batch<Dtype>* batch);
  // DataReader object
  DataReader reader_;
};
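Note the blob-count constraints declared here: ExactNumBottomBlobs() returning 0 means the layer takes no input blobs at all, and MinTopBlobs()/MaxTopBlobs() allow either one top ("data" alone) or two ("data" plus "label"), which is exactly the top.size() distinction that BaseDataLayer::LayerSetUp() used to set output_labels_.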
The corresponding data_layer.cpp file:
// Constructor
template <typename Dtype>
DataLayer<Dtype>::DataLayer(const LayerParameter& param)
    : BasePrefetchingDataLayer<Dtype>(param),
      reader_(param) {
}

// Destructor
template <typename Dtype>
DataLayer<Dtype>::~DataLayer() {
  // Stop the prefetch thread
  this->StopInternalThread();
}

template <typename Dtype>
void DataLayer<Dtype>::DataLayerSetUp(const vector<Blob<Dtype>*>& bottom,
      const vector<Blob<Dtype>*>& top) {
  const int batch_size = this->layer_param_.data_param().batch_size();
  // Peek at one datum to initialize the top blob dimensions
  Datum& datum = *(reader_.full().peek());
  // Infer the shape of a single data item from the datum
  vector<int> top_shape = this->data_transformer_->InferBlobShape(datum);
  this->transformed_data_.Reshape(top_shape);
  // Set the batch dimension
  top_shape[0] = batch_size;
  // Reshape
  top[0]->Reshape(top_shape);
  for (int i = 0; i < this->PREFETCH_COUNT; ++i) {
    // Reshape, allocating data memory
    this->prefetch_[i].data_.Reshape(top_shape);
  }
  // Log the output dimensions
  LOG(INFO) << "output data size: " << top[0]->num() << ","
      << top[0]->channels() << "," << top[0]->height() << ","
      << top[0]->width();
  // label
  if (this->output_labels_) {
    vector<int> label_shape(1, batch_size);
    top[1]->Reshape(label_shape);
    for (int i = 0; i < this->PREFETCH_COUNT; ++i) {
      // Reshape, allocating label memory
      this->prefetch_[i].label_.Reshape(label_shape);
    }
  }
}
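To make the shape bookkeeping concrete, here is a small self-contained example with hypothetical numbers (28×28 grayscale data and a batch_size of 64; neither value comes from the code above). InferBlobShape() returns the shape of a single item, and overwriting index 0 with the batch size gives the final top blob shape:

#include <cassert>
#include <vector>

int main() {
  // Shape of one 28x28 grayscale datum, as InferBlobShape() would return it
  std::vector<int> top_shape = {1, 1, 28, 28};  // {num, channels, height, width}
  const int batch_size = 64;   // hypothetical data_param().batch_size()
  top_shape[0] = batch_size;   // -> {64, 1, 28, 28}
  int count = 1;
  for (int d : top_shape) count *= d;
  assert(count == 64 * 1 * 28 * 28);  // 50176 values per batch
  return 0;
}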
// Called from the InternalThreadEntry thread function
template<typename Dtype>
void DataLayer<Dtype>::load_batch(Batch<Dtype>* batch) {
  CPUTimer batch_timer;
  batch_timer.Start();
  double read_time = 0;
  double trans_time = 0;
  CPUTimer timer;
  CHECK(batch->data_.count());
  CHECK(this->transformed_data_.count());
  // Peek at one datum to initialize the top blob dimensions, as above
  const int batch_size = this->layer_param_.data_param().batch_size();
  Datum& datum = *(reader_.full().peek());
  vector<int> top_shape = this->data_transformer_->InferBlobShape(datum);
  this->transformed_data_.Reshape(top_shape);
  top_shape[0] = batch_size;
  batch->data_.Reshape(top_shape);

  Dtype* top_data = batch->data_.mutable_cpu_data();
  Dtype* top_label = NULL;  // suppress warnings about uninitialized variables
  if (this->output_labels_) {
    top_label = batch->label_.mutable_cpu_data();
  }
  // Load the batch item by item
  for (int item_id = 0; item_id < batch_size; ++item_id) {
    timer.Start();
    // Pop one datum from the reader (blocks until data is ready)
    Datum& datum = *(reader_.full().pop("Waiting for data"));
    // Accumulate read time
    read_time += timer.MicroSeconds();
    timer.Start();
    // Compute the pointer offset of this item within the batch
    int offset = batch->data_.offset(item_id);
    this->transformed_data_.set_cpu_data(top_data + offset);
    // Transform the datum and write it into the batch
    this->data_transformer_->Transform(datum, &(this->transformed_data_));
    // Copy the label
    if (this->output_labels_) {
      top_label[item_id] = datum.label();
    }
    // Accumulate transform time
    trans_time += timer.MicroSeconds();
    // Return the datum to the reader's free queue for reuse
    reader_.free().push(const_cast<Datum*>(&datum));
  }
  timer.Stop();
  // Total time spent loading the batch
  batch_timer.Stop();
  // Log the timing breakdown
  DLOG(INFO) << "Prefetch batch: " << batch_timer.MilliSeconds() << " ms.";
  DLOG(INFO) << "     Read time: " << read_time / 1000 << " ms.";
  DLOG(INFO) << "Transform time: " << trans_time / 1000 << " ms.";
}