使用Caffe和訓練好的model從影象中提取某一層特徵

阿新 • • 發佈：2018-12-20

有時我們並不需要分類結果，而只需要網路某一層的輸出，作為影象的特徵表示。

#encoding=utf8
'''
python2.7
'''
import argparse
import os
import pickle
import struct
import sys

# Make the in-tree pycaffe package importable.  This must run BEFORE
# `import caffe`: inserting the path after the import (as the script used to
# do) cannot influence which caffe module gets loaded.
caffe_root = '../'
sys.path.insert(0, caffe_root + 'python')

import caffe
import cv2
import numpy as np


def set_gpu(gpuID):
    """Select the Caffe compute mode.

    Parameters
    ----------
    gpuID : int
        Device index to run on.  Any negative value selects CPU mode.
    """
    if gpuID >= 0:
        caffe.set_mode_gpu()
        caffe.set_device(gpuID)
    else:
        caffe.set_mode_cpu()


class FeatureExtractor(caffe.Net):
    """
    Net subclass that returns the activations of a chosen blob as features.

    Every input image is resized to `image_dims`, pushed through a
    caffe.io.Transformer configured from the constructor arguments, and
    forwarded through the network in TEST phase.  The blob named by the
    caller is then returned as a flattened vector per image.

    Parameters
    ----------
    model_file : network definition passed to caffe.Net.
    pretrained_file : weights file passed to caffe.Net as `weights`.
    image_dims : (height, width) the images are resized to before
        preprocessing.  Defaults to the spatial size of the net's input blob.
    mean, input_scale, raw_scale, channel_swap : preprocessing options;
        each one is forwarded to the matching Transformer setter when it is
        not None.
    """

    def __init__(self, model_file, pretrained_file, image_dims=None,
                 mean=None, input_scale=None, raw_scale=None,
                 channel_swap=None):
        caffe.Net.__init__(self, model_file, caffe.TEST, weights=pretrained_file)

        # Configure pre-processing for the first (and only used) input blob.
        in_ = self.inputs[0]
        self.transformer = caffe.io.Transformer(
            {in_: self.blobs[in_].data.shape})
        # Images arrive as H x W x C; the net blob is laid out C x H x W.
        self.transformer.set_transpose(in_, (2, 0, 1))
        if mean is not None:
            self.transformer.set_mean(in_, mean)
        if input_scale is not None:
            self.transformer.set_input_scale(in_, input_scale)
        if raw_scale is not None:
            self.transformer.set_raw_scale(in_, raw_scale)
        if channel_swap is not None:
            self.transformer.set_channel_swap(in_, channel_swap)

        # Spatial size (height, width) of the net's input blob.
        self.crop_dims = np.array(self.blobs[in_].data.shape[2:])
        # Explicit None/empty test so a numpy array is accepted as well as a
        # list or tuple (truth-testing a 2-element array raises).
        if image_dims is None or len(image_dims) == 0:
            image_dims = self.crop_dims
        self.image_dims = image_dims

    def _run_net(self, inputs, layer_name):
        """Preprocess `inputs`, forward them, and collect `layer_name`.

        Parameters
        ----------
        inputs : non-empty sequence of H x W x C image arrays.
        layer_name : name of the blob whose activations are wanted.

        Returns
        -------
        (cls_result, features) : `cls_result` is the list of argmax indices
            of the net's first output blob, one per image (also printed);
            `features` is an array with one row of `layer_name` activations
            per input image.
        """
        in_name = self.inputs[0]

        resized = np.zeros(
            (len(inputs), self.image_dims[0], self.image_dims[1],
             inputs[0].shape[2]),
            dtype=np.float32)
        for ix, image in enumerate(inputs):
            resized[ix] = caffe.io.resize_image(image, self.image_dims)

        # Transformer.preprocess emits data at the net's own input size (it
        # rescales when the image size differs), so the batch buffer is sized
        # from crop_dims, not image_dims.  Sizing it from image_dims made the
        # assignment below fail whenever the two differed.
        net_hw = tuple(int(d) for d in self.crop_dims)
        caffe_in = np.zeros((len(inputs), resized.shape[3]) + net_hw,
                            dtype=np.float32)
        for ix, image in enumerate(resized):
            # Always preprocess for the single input blob; indexing
            # self.inputs by image position breaks for the second image.
            caffe_in[ix] = self.transformer.preprocess(in_name, image)

        # Ask forward_all to collect the requested blob as well: it runs the
        # data in net-sized batches, so self.blobs only holds the last batch
        # once it returns.
        out = self.forward_all(blobs=[layer_name], **{in_name: caffe_in})

        predictions = out[self.outputs[0]]
        cls_result = [np.argmax(prediction) for prediction in predictions]
        print(cls_result)
        return cls_result, out[layer_name]

    def _get_feature(self, inputs, layer_name):
        """Forward `inputs` and return the argmax class index per image."""
        return self._run_net(inputs, layer_name)[0]

    def extractFeature(self, input_file, layer_name):
        """Load the image at `input_file` and return the flattened
        `layer_name` activations for it."""
        inputs = [caffe.io.load_image(input_file)]
        _, features = self._run_net(inputs, layer_name)
        return features[0].flatten()

    def extractFeatureFromImage(self, input_image, layer_name):
        """Return the flattened `layer_name` activations for one
        already-loaded image array."""
        _, features = self._run_net([input_image], layer_name)
        return features[0].flatten()

    def extractFeatureFromMultiImage(self, inputs, layer_name):
        """Return a list with the flattened `layer_name` activations of every
        image in `inputs`, in input order.  An empty input gives an empty
        list."""
        if len(inputs) == 0:
            return []
        _, features = self._run_net(inputs, layer_name)
        return [feature.flatten() for feature in features]


def get_args():
    """Parse the process command line and return the argparse namespace.

    Recognised options: --input_file, --layer_name, --model_def,
    --pretrained_model, --gpu, --center_only, --images_dim, --mean_file,
    --input_scale, --raw_scale and --channel_swap.  All of them are optional
    and fall back to the defaults listed in the table below.
    """
    # (flag, add_argument keyword arguments), in the order shown by --help.
    option_table = (
        ("--input_file", dict(
            default='/home/zhangxin/pic/2.png',
            help="Input image, directory, or npy.")),
        ("--layer_name", dict(
            default='pool5/7x7_s1')),
        ("--model_def", dict(
            default="/home/zhangxin/github/caffe/models/bvlc_googlenet/deploy.prototxt",
            help="Model definition file.")),
        ("--pretrained_model", dict(
            default="/home/zhangxin/github/caffe/models/bvlc_googlenet/bvlc_googlenet.caffemodel",
            help="Trained model weights file.")),
        ("--gpu", dict(
            action='store_true',
            help="Switch for gpu computation.")),
        ("--center_only", dict(
            action='store_true',
            help="Switch for prediction from center crop alone instead of "
                 "averaging predictions across crops (default).")),
        ("--images_dim", dict(
            default='256,256',
            help="Canonical 'height,width' dimensions of input images.")),
        ("--mean_file", dict(
            default='/home/zhangxin/github/caffe/python/caffe/imagenet/ilsvrc_2012_mean.npy',
            help="Data set image mean of [Channels x Height x Width] dimensions "
                 "(numpy array). Set to '' for no mean subtraction.")),
        ("--input_scale", dict(
            type=float,
            help="Multiply input features by this scale to finish preprocessing.")),
        ("--raw_scale", dict(
            type=float,
            default=255.0,
            help="Multiply raw input by this scale before preprocessing.")),
        ("--channel_swap", dict(
            default='2,1,0',
            help="Order to permute input channels. The default converts "
                 "RGB -> BGR since BGR is the Caffe default by way of OpenCV.")),
    )

    cli = argparse.ArgumentParser()
    for flag, settings in option_table:
        cli.add_argument(flag, **settings)
    return cli.parse_args()

def main(args):
    """Extract one layer's features for a single image and print them.

    `args` is the namespace produced by get_args(): it supplies the image
    path, the layer name, the model/weights files and the preprocessing
    options.
    """
    # "H,W" -> [H, W]
    dims = [int(token) for token in args.images_dim.split(',')]

    # Averaging twice over axis 1 collapses the mean array's two trailing
    # axes, leaving one mean value per leading index.  An empty --mean_file
    # disables mean subtraction.
    mean = np.load(args.mean_file).mean(1).mean(1) if args.mean_file else None

    # "2,1,0" -> [2, 1, 0]; an empty string leaves the channel order alone.
    channel_swap = (
        [int(token) for token in args.channel_swap.split(',')]
        if args.channel_swap else None
    )

    if not args.gpu:
        caffe.set_mode_cpu()
        print("CPU mode")
    else:
        caffe.set_mode_gpu()
        print("GPU mode")

    extractor = FeatureExtractor(
        args.model_def,
        args.pretrained_model,
        dims,
        mean,
        args.input_scale,
        args.raw_scale,
        channel_swap,
    )

    feature = extractor.extractFeature(args.input_file, args.layer_name)
    print(feature.shape, type(feature), feature)


# Script entry point: parse the command line and run the extraction.
if __name__ == "__main__":
    main(get_args())

使用方法：

python caffe_py_extract_feature.py \
    --input_file /home/zhangxin/pic/2.png \
    --layer_name pool5/7x7_s1 \
    --model_def /home/zhangxin/github/caffe/models/bvlc_googlenet/deploy.prototxt \
    --pretrained_model /home/zhangxin/github/caffe/models/bvlc_googlenet/bvlc_googlenet.caffemodel \
    --mean_file /home/zhangxin/github/caffe/python/caffe/imagenet/ilsvrc_2012_mean.npy \
    --images_dim 224,224

使用Caffe和訓練好的model從影象中提取某一層特徵

有時我們並不是需要分類結果，只要某一層的特徵，作為影象的特徵表示。 #encoding=utf8 ''' python2.7 ''' import numpy as np import os import argparse import caffe import sys impor

按空格和按換行從檔案中提取資料

1，讀取檔案的類為ifstream，其中“i”代表“in”，針對變數而言，ifstream所在的標頭檔案為fstream； 2，ifstream中有open方法，可以開啟檔案； 3，ifstream中有>>方法，可以以空格為分割符，以換行為結束符讀取資料； 4，iostrea

用Python在訓練好的log檔案中提取出資料並畫圖

在caffe框架下，對訓練好的log0檔案用Python中正則表示式進行匹配，提取出每一次顯示的accuracy，並對其進行在Spyder中運用pyplot進行畫圖。程式碼這是拿訓練資料為300

從mysqldump檔案中提取某一天某一表格的sql語句

#!/bin/sh ################################################################# #輸入需要備份的伺服器 fwq="MT2TV_2

Android MediaMetadataRetriever 從視訊中擷取某一幀圖片

從視訊中擷取某一幀圖片儲存到本地最近遇到一個問題，拍攝完視訊後需要在視訊中選擇一幀當作視訊封面在Android中有這樣一個類MediaMetadataRetriever **官方API解釋：MediaMetadataRetriever class pr

SEPC：使用3D卷積從FPN中提取尺度不變特徵，漲點神器 | CVPR 2020

> 論文提出PConv為對特徵金字塔進行3D卷積，配合特定的iBN進行正則化，能夠有效地融合尺度間的內在關係，另外，論文提出SEPC，使用可變形卷積來適應實際特徵間對應的不規律性，保持尺度均衡。PConv和SEPC對SOTA的檢測演算法有顯著地提升，並且沒有帶來過多的額外計算量來源：曉飛的

caffe測試訓練好的caffemodel和記錄每層的執行時間

我用的是ubuntu的caffe。在caffe的目錄下在terminal中執行以下命令用以測試已經訓練好的caffemodel的accuracy：（或者將以下命令放在.sh檔案中執行） ./build/tools/caffe test --model=/example

從訓練好的tensorflow模型中列印訓練變數

從tensorflow 訓練後儲存的模型中列印訓變數：使用tf.train.NewCheckpointReader()import tensorflow as tf reader = tf.train.

caffe 用訓練好的模型提取圖片特徵（使用自帶classify.py和classifier.py）

原材料： 1）訓練好的caffemodel 2) 定義網路結構的deploy.prototxt配置檔案 3）訓練時使用的mean檔案，在/cafferoot/python/classify.py的demo中，要求使用的是.npy格式的meanfile，如果我們手上有的是

Excel怎樣從字串中提取位置和長度不固定的數字

最近上課的時候，常常有學員諮詢怎樣從Excel字元中提取位置和長度都不固定的數字，今天我們分兩種情況來聊一聊對應的解決方案。情況1：數字前後有特定的分隔符如果數字前後有特定的分隔符，比如（）、##等分隔符，那麼我們可以通過查詢這些分隔符的位置，來定位到數字的位置。比如下圖所示的這個

kalibr 如何從bag中提取影象/由影象生成bag

１. 從bag中提取影象使用kalibr自帶的bagextractor工具 ./kalibr_bagextractor --image-topics /cam0/image_raw --bag ./static/output.bag 使用python指令碼２. 由影象生

Matlab從影象中選取矩形區域

imrect a = imread(‘lena8.jpg’); b = imcrop(); % 得到矩形區域的畫素矩陣 imcrop a = imread(‘lena8.jpg’); b = imrect; h = wait(b);%得到矩形的起

DL開源框架Caffe | 用訓練好的模型對資料進行預測

一句話理解Caffe：　　Caffe的萬丈高樓（Net）是按照我們設計的圖紙（prototxt），用很多磚塊（Blob）築成一層層（Layer）樓房，最後通過某些手段（Solver）進行簡裝修（Train）/精裝修（Finetune）實現的，另外每個樓層都可

Caffe用訓練好的模型測試圖片

這是一個python指令碼，用訓練好的caffemodel來測試圖片，接下來直接上程式碼，裡面有詳細解釋，大部分你要修改的只是路徑，另外在這個指令碼的基礎上你可以根據自己的需要進行改動。需要的東西：訓練好的caffemodel，deploy.prototxt

HBase建表高階屬性，hbase應用案例看行鍵設計，HBase和mapreduce結合，從Hbase中讀取資料、分析，寫入hdfs，從hdfs中讀取資料寫入Hbase，協處理器和二級索引

1. Hbase高階應用 1.1建表高階屬性下面幾個shell 命令在hbase操作中可以起到很到的作用，且主要體現在建表的過程中，看下面幾個create 屬性 1、 BLOOMFILTER 預設是NONE 是否使用布隆過慮及使用何種方式布隆

caffe利用訓練好的模型進行實際測試

官方版demo import numpy as np import os import sys import cv2 caffe_root = 'your caffe root' sys.path.insert(0, caffe_root + '/py

Caffe中用訓練好的模型測試，deploy檔案的修改方法

訓練好網路模型後，需要在測試集上驗證模型分類的正確率，這時，就需要把訓練的網路檔案net.prototxt修改為deploy.prototxt，然後再進行測試。輸入資料層改動如下： name: "SpecNet" layer { name: "sp

深度學習tensorflow實戰筆記（5）用預訓練好的VGG-16模型提取影象特徵

上一篇部落格介紹瞭如果使用自己訓練好的模型用於影象分類和特徵提取，但是有時候自己的資料集大小有限，所以更多的時候我們需要用VGG-16預訓練好的模型提取特徵，相關學者預訓練好的模型使用的都是公開的標準資料集，所以我們直接用預訓練的模型提取我們自己影象的特徵，可以用於

用PDFMiner從PDF中提取文本文字

dfp port 下載 span setup 技術分享 code with converter 1、下載並安裝PDFMiner 　　從https://pypi.python.org/pypi/pdfminer/下載PDFMineer wget https://pypi.p

從數組中刪除某一項

index style 刪除 ret indexof span 數組 pan cnblogs function remove(arr,item){ if(arr.length){ var index = arr.indexOf(item);

使用Caffe和訓練好的model從影象中提取某一層特徵

相關推薦