MFC/Qt下呼叫caffe原始碼（一）---將caffe原始碼生成動態連結庫dll

阿新 • • 發佈：2018-12-21

本人研一，最近想將用caffe訓出的模型，通過MFC做出一個介面，扔進一張圖片，點選預測，即可呼叫預測分類函式完成測試，並且通過MessageBox彈出最終分類的資訊。

首先通過查資料總結出兩種方法，第一：直接呼叫編譯好的caffe原始碼；（本次用到的原始碼是classification.cpp）

第二：將caffe原始碼生成動態連結庫dll,然後在其它工程專案下進行呼叫。由於caffe的原始碼依賴項太多，稍微錯一點就編譯不通過，故本次操作採用呼叫dll的方式。

1.win7 vs2013,新建win32控制檯程式，如下所示：

2.首先將專案的屬性改成release和x64編譯模式，新增兩個.h檔案和一個cpp檔案：

（1）我採用的是dllexport方式匯出的，採用了條件編譯，要將DLL_EXPORTS巨集定義加入到前處理器中以及_SCL_SECURE_NO_WARNINGS

Tip:.h檔案

#ifndef CAFFE_CLASSIFY_H_
#define CAFFE_CLASSIFY_H_
#define CPU_ONLY 1

#include <caffe/caffe.hpp>  
#include <opencv2/core/core.hpp>  
#include <opencv2/highgui/highgui.hpp>  
#include <opencv2/imgproc/imgproc.hpp>  
#include <algorithm>  
#include <iosfwd>  
#include <memory>  
#include <string>  
#include <utility>  
#include <vector>  
//#pragma once
using namespace caffe;
using std::string;
using namespace std;
using boost::shared_ptr;

#ifdef DLL_EXPORTS
#define DLL_EXPORTS_API _declspec(dllexport)
#else
#define DLL_EXPORTS_API _declspec(dllimport)
#endif
/* Pair (label, confidence) representing a prediction. */
typedef std::pair<string, float> Prediction;

class DLL_EXPORTS_API  Classifier {
public:
	Classifier(const string& model_file,
		const string& trained_file,
		const string& mean_file,
		const string& label_file);

	std::vector<Prediction> Classify(const cv::Mat& img, int N = 5);
	~Classifier();

private:
	void SetMean(const string& mean_file);


	std::vector<float> Predict(const cv::Mat& img);

	void WrapInputLayer(std::vector<cv::Mat>* input_channels);

	void Preprocess(const cv::Mat& img,
		std::vector<cv::Mat>* input_channels);

private:
	boost::shared_ptr<Net<float> > net_;
	cv::Size input_geometry_;
	int num_channels_;
	cv::Mat mean_;
	std::vector<string> labels_;
};
#endif

（2）.

Tip .h檔案，此檔案是關於層的，缺哪個新增哪個。之前按照網上部落格抄的，後來執行的時候報錯：Unkown Layer 。後來想起來我的網路裡面用到了Concat Layer，後來就自己添加了，特別注意：直接extern 就行，不用REGISTER_LAYER_CLASS(Concat);

#ifndef LAYER_H
#define LAYER_H

#include "caffe/common.hpp"
#include "caffe/layers/input_layer.hpp"
#include "caffe/layers/inner_product_layer.hpp"
#include "caffe/layers/dropout_layer.hpp"
#include "caffe/layers/conv_layer.hpp"
#include "caffe/layers/relu_layer.hpp"

#include "caffe/layers/pooling_layer.hpp"
#include "caffe/layers/lrn_layer.hpp"
#include "caffe/layers/softmax_layer.hpp"
#include "caffe/layers/concat_layer.hpp"


namespace caffe
{

	extern INSTANTIATE_CLASS(InputLayer);
	extern INSTANTIATE_CLASS(InnerProductLayer);
	extern INSTANTIATE_CLASS(DropoutLayer);
	extern INSTANTIATE_CLASS(ConcatLayer);
	extern INSTANTIATE_CLASS(ConvolutionLayer);
	REGISTER_LAYER_CLASS(Convolution);
	extern INSTANTIATE_CLASS(ReLULayer);
	REGISTER_LAYER_CLASS(ReLU);
	extern INSTANTIATE_CLASS(PoolingLayer);
	REGISTER_LAYER_CLASS(Pooling);
	extern INSTANTIATE_CLASS(LRNLayer);
	REGISTER_LAYER_CLASS(LRN);
	extern INSTANTIATE_CLASS(SoftmaxLayer);
	REGISTER_LAYER_CLASS(Softmax);
	//extern INSTANTIATE_CLASS(ConcatLayer);
	//REGISTER_LAYER_CLASS(Concat);


}

#endif

（3）將classification的原始檔賦值到cpp中，注意新增標頭檔案；

.cpp檔案


#include "Header.h"
#include "SingleDll.h"

Classifier::Classifier(const string& model_file,
	const string& trained_file,
	const string& mean_file,
	const string& label_file) {
#ifdef CPU_ONLY
	Caffe::set_mode(Caffe::CPU);
#else
	Caffe::set_mode(Caffe::GPU);
#endif
	//Caffe::set_mode(Caffe::GPU);
	/* Load the network. */
	net_.reset(new Net<float>(model_file, TEST));
	net_->CopyTrainedLayersFrom(trained_file);

	CHECK_EQ(net_->num_inputs(), 1) << "Network should have exactly one input.";
	CHECK_EQ(net_->num_outputs(), 1) << "Network should have exactly one output.";

	Blob<float>* input_layer = net_->input_blobs()[0];
	num_channels_ = input_layer->channels();
	CHECK(num_channels_ == 3 || num_channels_ == 1)
		<< "Input layer should have 1 or 3 channels.";
	input_geometry_ = cv::Size(input_layer->width(), input_layer->height());

	/* Load the binaryproto mean file. */
	SetMean(mean_file);

	/* Load labels. */
	std::ifstream labels(label_file.c_str());
	CHECK(labels) << "Unable to open labels file " << label_file;
	string line;
	while (std::getline(labels, line))
		labels_.push_back(string(line));

	Blob<float>* output_layer = net_->output_blobs()[0];
	CHECK_EQ(labels_.size(), output_layer->channels())
		<< "Number of labels is different from the output layer dimension.";
}
static bool PairCompare(const std::pair<float, int>& lhs,
	const std::pair<float, int>& rhs) {
	return lhs.first > rhs.first;
}

/* Return the indices of the top N values of vector v. */
static std::vector<int> Argmax(const std::vector<float>& v, int N) {
	std::vector<std::pair<float, int> > pairs;
	for (size_t i = 0; i < v.size(); ++i)
		pairs.push_back(std::make_pair(v[i], static_cast<int>(i)));
	std::partial_sort(pairs.begin(), pairs.begin() + N, pairs.end(), PairCompare);

	std::vector<int> result;
	for (int i = 0; i < N; ++i)
		result.push_back(pairs[i].second);
	return result;
}
/* Return the top N predictions. */
std::vector<Prediction> Classifier::Classify(const cv::Mat& img, int N) {
	std::vector<float> output = Predict(img);

	N = std::min<int>(labels_.size(), N);
	std::vector<int> maxN = Argmax(output, N);
	std::vector<Prediction> predictions;
	for (int i = 0; i < N; ++i) {
		int idx = maxN[i];
		predictions.push_back(std::make_pair(labels_[idx], output[idx]));
	}
	return predictions;
}
/* Load the mean file in binaryproto format. */
void Classifier::SetMean(const string& mean_file) {
	BlobProto blob_proto;
	ReadProtoFromBinaryFileOrDie(mean_file.c_str(), &blob_proto);
	/* Convert from BlobProto to Blob<float> */
	Blob<float> mean_blob;
	mean_blob.FromProto(blob_proto);
	CHECK_EQ(mean_blob.channels(), num_channels_)
		<< "Number of channels of mean file doesn't match input layer.";
	/* The format of the mean file is planar 32-bit float BGR or grayscale. */
	std::vector<cv::Mat> channels;
	float* data = mean_blob.mutable_cpu_data();
	for (int i = 0; i < num_channels_; ++i) {
		/* Extract an individual channel. */
		cv::Mat channel(mean_blob.height(), mean_blob.width(), CV_32FC1, data);
		channels.push_back(channel);
		data += mean_blob.height() * mean_blob.width();
	}
	/* Merge the separate channels into a single image. */
	cv::Mat mean;
	cv::merge(channels, mean);
	/* Compute the global mean pixel value and create a mean image
	* filled with this value. */
	cv::Scalar channel_mean = cv::mean(mean);
	mean_ = cv::Mat(input_geometry_, mean.type(), channel_mean);
}
std::vector<float> Classifier::Predict(const cv::Mat& img) {
	Blob<float>* input_layer = net_->input_blobs()[0];
	input_layer->Reshape(1, num_channels_,
		input_geometry_.height, input_geometry_.width);
	/* Forward dimension change to all layers. */
	net_->Reshape();

	std::vector<cv::Mat> input_channels;
	WrapInputLayer(&input_channels);

	Preprocess(img, &input_channels);

	net_->Forward();

	/* Copy the output layer to a std::vector */
	Blob<float>* output_layer = net_->output_blobs()[0];
	const float* begin = output_layer->cpu_data();
	const float* end = begin + output_layer->channels();
	return std::vector<float>(begin, end);
}

/* Wrap the input layer of the network in separate cv::Mat objects
* (one per channel). This way we save one memcpy operation and we
* don't need to rely on cudaMemcpy2D. The last preprocessing
* operation will write the separate channels directly to the input
* layer. */
void Classifier::WrapInputLayer(std::vector<cv::Mat>* input_channels) {
	Blob<float>* input_layer = net_->input_blobs()[0];

	int width = input_layer->width();
	int height = input_layer->height();
	float* input_data = input_layer->mutable_cpu_data();
	for (int i = 0; i < input_layer->channels(); ++i) {
		cv::Mat channel(height, width, CV_32FC1, input_data);
		input_channels->push_back(channel);
		input_data += width * height;
	}
}

void Classifier::Preprocess(const cv::Mat& img,
	std::vector<cv::Mat>* input_channels) {
	/* Convert the input image to the input image format of the network. */
	cv::Mat sample;
	if (img.channels() == 3 && num_channels_ == 1)
		cv::cvtColor(img, sample, cv::COLOR_BGR2GRAY);
	else if (img.channels() == 4 && num_channels_ == 1)
		cv::cvtColor(img, sample, cv::COLOR_BGRA2GRAY);
	else if (img.channels() == 4 && num_channels_ == 3)
		cv::cvtColor(img, sample, cv::COLOR_BGRA2BGR);
	else if (img.channels() == 1 && num_channels_ == 3)
		cv::cvtColor(img, sample, cv::COLOR_GRAY2BGR);
	else
		sample = img;

	cv::Mat sample_resized;
	if (sample.size() != input_geometry_)
		cv::resize(sample, sample_resized, input_geometry_);
	else
		sample_resized = sample;

	cv::Mat sample_float;
	if (num_channels_ == 3)
		sample_resized.convertTo(sample_float, CV_32FC3);
	else
		sample_resized.convertTo(sample_float, CV_32FC1);

	cv::Mat sample_normalized;
	cv::subtract(sample_float, mean_, sample_normalized);

	/* This operation will write the separate BGR planes directly to the
	* input layer of the network because it is wrapped by the cv::Mat
	* objects in input_channels. */
	cv::split(sample_normalized, *input_channels);

	CHECK(reinterpret_cast<float*>(input_channels->at(0).data)
		== net_->input_blobs()[0]->cpu_data())
		<< "Input channels are not wrapping the input layer of the network.";
}
Classifier::~Classifier()
{}

3.開啟屬性管理器，新增caffe相關依賴項。新增完可能會報各種can not open XXX.lib的錯誤。莫著急，這都是由於粗心路徑不對造成的，要注意細節。

包含目錄：

D:\caffe\NugetPackages\gflags.2.1.2.1\build\native\include  
D:\caffe\NugetPackages\glog.0.3.3.0\build\native\include  
D:\caffe\NugetPackages\protobuf-v120.2.6.1\build\native\include  
D:\caffe\NugetPackages\OpenCV.2.4.10\build\native\include  
D:\caffe\NugetPackages\OpenBLAS.0.2.14.1\lib\native\include  
D:\caffe\NugetPackages\boost.1.59.0.0\lib\native\include 
還要加上caffe編譯完生成的include路徑，最好將其複製到該專案下
eg.D:\caffe-class\include

庫目錄：

E:\caffe\NugetPackages\OpenCV.2.4.10\build\native\lib\x64\v120\Release 
E:\caffe\NugetPackages\gflags.2.1.2.1\build\native\x64\v120\dynamic\Lib  
E:\caffe\NugetPackages\glog.0.3.3.0\build\native\lib\x64\v120\Release \dynamic  
E:\caffe\NugetPackages\OpenBLAS.0.2.14.1\lib\native\lib\x64  
E:\caffe\NugetPackages\protobuf-v120.2.6.1\build\native\lib\x64\v120\Release  
E:\caffe\NugetPackages\LevelDB-vc120.1.2.0.0\build\native\lib\x64\v120\Release 
E:\caffe\NugetPackages\hdf5-v120-complete.1.8.15.2\lib\native\lib\x64  
E:\caffe\NugetPackages\boost_date_time-vc120.1.59.0.0\lib\native\address-model-64\lib  
E:\caffe\NugetPackages\boost_filesystem-vc120.1.59.0.0\lib\native\address-model-64\lib  
E:\caffe\NugetPackages\boost_system-vc120.1.59.0.0\lib\native\address-model-64\lib  
E:\caffe\NugetPackages\boost_thread-vc120.1.59.0.0\lib\native\address-model-64\lib  
E:\caffe\NugetPackages\boost_chrono-vc120.1.59.0.0\lib\native\address-model-64\lib  
注意還需新增caffe編譯生成的release檔案

Tip：上述庫目錄中少了lmdb ，自己別忘了

新增依賴項

libglog.lib  
libcaffe.lib  
gflags.lib  
gflags_nothreads.lib  
hdf5.lib  
hdf5_hl.lib  
libprotobuf.lib  
libopenblas.dll.a  
Shlwapi.lib  
LevelDb.lib  
lmdb.lib  
opencv_core2410.lib  
opencv_highgui2410.lib  
opencv_imgproc2410.lib  
opencv_video2410.lib  
opencv_objdetect2410.lib

注意：由於我是cpu條件下編譯的（加了巨集定義CPU_ONLY），若您是GPU 則要新增相應的cudn的路徑，以及

cublas.lib
cuda.lib
curand.lib
cudart.lib
cudnn.lib 這些依賴項！！

4.編譯生成，會發現生成dll lib等檔案，但是沒有ink，不知道為啥，那不重要。

最後第一篇生成dll檔案就講解到這裡，生成完後可以測試一下能不能用。我也是先測試能用，才新建MFC工程進行呼叫的。

下次就為大家講解MFC下呼叫，具體實現MFC呼叫caffemodel實現過程。

若需要help,QQ 1443563995.如有錯誤，多多指教！

MFC/Qt下呼叫caffe原始碼（一）---將caffe原始碼生成動態連結庫dll

本人研一，最近想將用caffe訓出的模型，通過MFC做出一個介面，扔進一張圖片，點選預測，即可呼叫預測分類函式完成測試，並且通過MessageBox彈出最終分類的資訊。首先通過查資料總結出兩種方法，第一：直接呼叫編譯好的caffe原始碼；（本次用到的原始碼是classif

【深度學習之Caffe】將模型測試Classification過程生成動態連結庫dll以方便其他專案呼叫

#include "caffe_classify.h" #include "head.h" Classifier::Classifier(const string& model_file,const string& trained_file,const string& mean

MFC/Qt下呼叫caffe原始碼（二）---MFC下呼叫caffe的動態連線庫dll檔案

首先，先看下最後的效果吧。 win7 vs2013 新建一個MFC 工程注：MFC中如何最簡便的方法將圖片顯示到對話方塊中？大家可以搜下，很多種方法，但是我採用的是最簡單的方法，即將opencv視窗繫結到MFC的PIcture control上。在:

QT框架下的文字操作（一）

簡介檔案操作作為軟體開發中不可或缺的一環，將其獨立出來並形成一個模組就顯得十分必要。這樣不僅易於維護管理，而且易於在專案中整合。文字型別常用的文字型別包括： csv檔案 dbf 檔案 excel 檔案 ini 檔案 json 檔案

Caffe原始碼解讀（一）：caffe.proto（上）

caffe.proto檔案位於 ..\caffe-fast-rcnn\src\caffe\proto檔案目錄下，根目錄為 py_faster_rcnn資料夾 syntax = "proto2"; package caffe; // repeated require

菜鳥讀caffe原始碼（一）：protoc.exe的使用

caffe感覺都是別人玩剩下的東西，但是結合目前專案和以後對工作的設想，caffe原始碼還是有很好的學習價值。參考入門書籍《深度學習21天實戰caffe-趙永科》學習protobuffer相關知識，瞭解如何讀取proto.txt等相關引數檔案。路線下載protobu

Python下opencv使用筆記（一）（圖像簡單讀取、顯示與儲存）

操作灰度圖清晰 ren from tty ims 圖像 type 寫在之前從去年開始關註python這個軟件，途中間間斷斷看與學過一些關於python的東西。感覺python確實是一個簡單優美、easy上手的腳本編程語言，眾多的第三方庫使得py

Linux下MySQL的基礎（一）

mysql基於解釋MYSQL的基礎1. MySQL服務器中幫助的使用格式： mysql> help command eg： mysql> help create database Name: ‘CREATE DATABASE‘ Description: Sy

hibernate框架在eclipse下的配置方法（一）

java、 sql數據庫文件目錄測試表 any 配置包名 ive 當我一、ORM O:object 對象 R:Realtion 關系（關系型數據庫） M:Mapping 映射 ORM：對象關系型映射　　目前流行的編程語言，如Java、C# ，它們都是面向對象的編程

【golang-GUI開發】qt之signal和slot（一）

類型取消 htm return 所在 turn hang nbsp type 想了很久，我決定還是先從signal和slot（信號槽）開始講起。 signal和slot大家一定不陌生，先看一段示例（選自文檔）： 1 class Counter : public QOb

windows伺服器下使用nginx 基礎（一）

windows nginx 安裝 nginx 手機端訪問 https 問題：為什麼使用windows伺服器，因為不會linux。為什麼使用node做伺

C# VS2012下的3D顯示（一）

首先，把工具下載齊全。在codeproject中找到的，找資料真的比程式設計還累。 http://www.codeproject.com/Articles/3144/SharpGL-a-C-OpenGL-class-library 這裡需要用到的是：Download the Vis

Linux下的基本指令（一）

文章目錄 1.檔案系統層次結構 1.1根目錄下重要的目錄 2. 對目錄進行操作 2.1 樹狀目錄結構的解釋 2.2 目錄的基本命令 1. cp 指令：複製一個或多個檔案

Linux下使用ElasticSearch教程（一）

一：ElasticSearch在Linux下安裝簡單總結. 1.本次安裝的版本是ES6.3.2.版本.下載到壓縮包.解壓後直接來到當前的解壓目錄. cd config &n

RK3399 Camera呼叫USB攝像頭（一）測試篇

新買的開發板RK3399外接USB攝像頭，查看了下，RK3399 Android系統rom是支援底層UVC驅動的，將一些測試結果和測試demo記錄下來，以免他人踩坑，如果有幫到你，請點個關注和start，謝謝文章目錄一、USB攝像頭連線資

白話Spring原始碼（一）：怎麼閱讀原始碼

跟大家分享Spring原始碼前我想先聊聊：為什麼要閱讀原始碼？怎麼閱讀原始碼？希望大家在學習某個新的知識前多問幾個為什麼，好奇心是我們學習的一大動力。一、為什麼要閱讀原始碼剛入行時，我們會接觸很多框架：spirng，Struts，Hibernate，mybatis等等，

ubuntu 18.04下greenplum安裝筆記（一）Linux下基礎環境的搭建

背景需要構建一個用於資料倉庫的分散式資料庫叢集。每一個節點暫時不需要進行備份，同時也不考慮壞掉的情況。每一個數據節點最好都不用進行過多的配置，安裝起來方便。 Greenplum的Shared-Nothing的設計思路很適合我目前的業務場景。物理環境 4檯安裝了Linux的主機，安裝的作業系統的版本均為

Spring原始碼學習筆記（一）bean是怎麼生成的

bean 實在 bean 重新整理過程中產生的，首先我們看下 bean 的重新整理方法。下面是 AbstractApplicationContext 的 refresh 方法。 @Override public void refresh() throws

手寫一個Linux下的debug工具（一）

寫在前面學習過Linux程式設計的同學都或多或少用過gdb來除錯自己的程式，但是並沒有很多的資源讓我們學習有關偵錯程式的東西。希望通過這篇文章，你可以瞭解基本的除錯原理，更重要的是可以寫出一個自己的簡易除錯工具。更有趣的是，你可以瞭解如何修改記憶體，來“愚弄

呼叫鏈系列（一）：解讀UAVStack中的貪吃蛇-呼叫鏈

背景對於分散式線上服務，一個請求需要經過多個系統中多個模組，可能多達上百臺機器的協作才能完成單次請求。這種場景下單靠人力無法掌握整個請求中各個階段的效能開銷，更無法快速的定位系統中效能瓶頸。當發生故障時通常需要檢視大量日誌跨越多個團隊來確認問題。

MFC/Qt下呼叫caffe原始碼（一）---將caffe原始碼生成動態連結庫dll

相關推薦