caffe-----使用C++ 提取网络中间层特征数据

最近做实验时，想在 C++ 下查看网络中间某一层输出的特征数据，查找了相关资料，在此记录一下。

其实在caffe框架里面是包含这种操作的，可以模仿tools/extract_features.cpp中的操作来得到网络中间的特征数据。

首先看下extract_features.cpp是如何写的。

template<typename Dtype>

int feature_extraction_pipeline(int argc, char** argv) {

  ::google::InitGoogleLogging(argv[]);

  const int num_required_args = ;

  if (argc < num_required_args) {

    LOG(ERROR)<<

    "This program takes in a trained network and an input data layer, and then"

    " extract features of the input data produced by the net.\n"

    "Usage: extract_features  pretrained_net_param"

    "  feature_extraction_proto_file  extract_feature_blob_name1[,name2,...]"

    "  save_feature_dataset_name1[,name2,...]  num_mini_batches  db_type"

    "  [CPU/GPU] [DEVICE_ID=0]\n"

    "Note: you can extract multiple features in one pass by specifying"

    " multiple feature blob names and dataset names separated by ','."

    " The names cannot contain white space characters and the number of blobs"

    " and datasets must be equal.";

    return ;

  }

  int arg_pos = num_required_args;

  arg_pos = num_required_args;

  if (argc > arg_pos && strcmp(argv[arg_pos], "GPU") == ) {

    LOG(ERROR)<< "Using GPU";

    int device_id = ;

    if (argc > arg_pos + ) {

      device_id = atoi(argv[arg_pos + ]);

      CHECK_GE(device_id, );

    }

    LOG(ERROR) << "Using Device_id=" << device_id;

    Caffe::SetDevice(device_id);

    Caffe::set_mode(Caffe::GPU);

  } else {

    LOG(ERROR) << "Using CPU";

    Caffe::set_mode(Caffe::CPU);

  }

  arg_pos = ;  // the name of the executable

  std::string pretrained_binary_proto(argv[++arg_pos]);

  // Expected prototxt contains at least one data layer such as

  //  the layer data_layer_name and one feature blob such as the

  //  fc7 top blob to extract features.

  /*

   layers {

     name: "data_layer_name"

     type: DATA

     data_param {

       source: "/path/to/your/images/to/extract/feature/images_leveldb"

       mean_file: "/path/to/your/image_mean.binaryproto"

       batch_size: 128

       crop_size: 227

       mirror: false

     }

     top: "data_blob_name"

     top: "label_blob_name"

   }

   layers {

     name: "drop7"

     type: DROPOUT

     dropout_param {

       dropout_ratio: 0.5

     }

     bottom: "fc7"

     top: "fc7"

   }

   */

  std::string feature_extraction_proto(argv[++arg_pos]);

  boost::shared_ptr<Net<Dtype> > feature_extraction_net(

      new Net<Dtype>(feature_extraction_proto, caffe::TEST));

  feature_extraction_net->CopyTrainedLayersFrom(pretrained_binary_proto);//初始化网络

  std::string extract_feature_blob_names(argv[++arg_pos]);

  std::vector<std::string> blob_names;

  boost::split(blob_names, extract_feature_blob_names, boost::is_any_of(","));

  std::string save_feature_dataset_names(argv[++arg_pos]);

  std::vector<std::string> dataset_names;

  boost::split(dataset_names, save_feature_dataset_names,

               boost::is_any_of(","));

  CHECK_EQ(blob_names.size(), dataset_names.size()) <<

      " the number of blob names and dataset names must be equal";

  size_t num_features = blob_names.size();

  for (size_t i = ; i < num_features; i++) {

    CHECK(feature_extraction_net->has_blob(blob_names[i]))

        << "Unknown feature blob name " << blob_names[i]

        << " in the network " << feature_extraction_proto;

  }

  int num_mini_batches = atoi(argv[++arg_pos]);

  std::vector<boost::shared_ptr<db::DB> > feature_dbs;

  std::vector<boost::shared_ptr<db::Transaction> > txns;

  const char* db_type = argv[++arg_pos];

  for (size_t i = ; i < num_features; ++i) {

    LOG(INFO)<< "Opening dataset " << dataset_names[i];

    boost::shared_ptr<db::DB> db(db::GetDB(db_type));

    db->Open(dataset_names.at(i), db::NEW);

    feature_dbs.push_back(db);

    boost::shared_ptr<db::Transaction> txn(db->NewTransaction());

    txns.push_back(txn);

  }

  LOG(ERROR)<< "Extracting Features";

  Datum datum;

  std::vector<int> image_indices(num_features, );

  for (int batch_index = ; batch_index < num_mini_batches; ++batch_index) {

    feature_extraction_net->Forward();//首先进行前传 这样才能有中间数据

    for (int i = ; i < num_features; ++i) {

      const boost::shared_ptr<Blob<Dtype> > feature_blob =

        feature_extraction_net->blob_by_name(blob_names[i]);//通过名字查找blob

      int batch_size = feature_blob->num();

      int dim_features = feature_blob->count() / batch_size;

      const Dtype* feature_blob_data;

      for (int n = ; n < batch_size; ++n) {

        datum.set_height(feature_blob->height());

        datum.set_width(feature_blob->width());

        datum.set_channels(feature_blob->channels());

        datum.clear_data();

        datum.clear_float_data();

        feature_blob_data = feature_blob->cpu_data() +

            feature_blob->offset(n);

        for (int d = ; d < dim_features; ++d) {

          datum.add_float_data(feature_blob_data[d]);//将feature_blob的数据都保存到datum里

        }

        string key_str = caffe::format_int(image_indices[i], );

        string out;

        CHECK(datum.SerializeToString(&out));//将datum保存到本地

        txns.at(i)->Put(key_str, out);

        ++image_indices[i];

        if (image_indices[i] %  == ) {

          txns.at(i)->Commit();

          txns.at(i).reset(feature_dbs.at(i)->NewTransaction());

          LOG(ERROR)<< "Extracted features of " << image_indices[i] <<

              " query images for feature blob " << blob_names[i];

        }

      }  // for (int n = 0; n < batch_size; ++n)

    }  // for (int i = 0; i < num_features; ++i)

  }  // for (int batch_index = 0; batch_index < num_mini_batches; ++batch_index)

  // write the last batch

  for (int i = ; i < num_features; ++i) {

    if (image_indices[i] %  != ) {

      txns.at(i)->Commit();

    }

    LOG(ERROR)<< "Extracted features of " << image_indices[i] <<

        " query images for feature blob " << blob_names[i];

    feature_dbs.at(i)->Close();

  }

  LOG(ERROR)<< "Successfully extracted the features!";

  return ;

}

主要三个核心步骤：

1.初始化网络，并前传，

net->Forward()

2.通过blob的名字（即prototxt中各层 top 字段里写的blob名，而不是层本身的 name；两者同名时才可以混用）来得到blob数据，

const boost::shared_ptr<Blob<Dtype> > feature_blob = net->blob_by_name(blob_names[i])

3.blob里面已经保存了所有的特征数据，按照需求取出来就好了。

// Illustrative fragment: copy the values of item n of feature_blob into a
// temporary float buffer, work on them, then free the buffer.
// Number of values per item: channels * height * width.
// NOTE(review): `count` is not declared in this fragment — presumably an int
// declared earlier; confirm.
count = feature_blob->channels() * feature_blob->height() *  feature_blob->width();

// Temporary buffer for one item's values; released by the delete[] below.
float* feature_array = new float[count];

// Pointer to the first value of item n inside the blob's CPU data.
const float* feature_blob_data = feature_blob->cpu_data() + feature_blob->offset(n); // feature data generated from

                             // the nth input image within a batch

// Copy exactly `count` floats out of the blob into the temporary buffer.
memcpy(feature_array, feature_blob_data, count * sizeof(float));

// Placeholder: whatever processing is needed on feature_array goes here.
...// other operations

delete [] feature_array;

如下是做实验时候的一个例子，提取出了blstm_input中的数据，并保存到了txt里。

// Fragment from the middle of a larger function (m_net, m_channelNum,
// m_inputGeometry, img, wrapInputLayer and preprocess are defined elsewhere).
// It reshapes the input blob, runs one forward pass, prints the shapes of the
// blobs "blstm_input" and "lstm1", and writes the values of "blstm_input" to
// the text file "blstm.txt".
//
// NOTE(review): several integer literals are missing from this listing (the
// index inside `[]`, the first Reshape argument, the shape() arguments, loop
// start values and bounds, and the modulus operands), so it does not compile
// as shown. The original values cannot be determined from this text; restore
// them from the author's source before use.

// NOTE(review): index literal missing — presumably the first input blob; confirm.
Blob<float>* input_layer = m_net->input_blobs()[];

  // NOTE(review): first argument (likely the batch dimension) is missing; confirm.
  input_layer->Reshape(, m_channelNum, m_inputGeometry.height, m_inputGeometry.width);

  // Let the net adapt to the new input shape.
  m_net->Reshape();

  std::vector<cv::Mat> input_channels;

  // NOTE(review): helper not shown here — presumably binds the cv::Mat headers
  // to the input blob's memory; verify against its definition.
  wrapInputLayer(&input_channels);

  // NOTE(review): helper not shown here — presumably converts img and writes it
  // into input_channels; verify against its definition.
  preprocess(img, &input_channels);

  // The forward pass fills the intermediate blobs that are read below.
  m_net->Forward();

  // NOTE(review): index literal missing — presumably the first output blob; confirm.
  Blob<float>* output_layer = m_net->output_blobs()[];

  // NOTE(review): the axis arguments of both shape() calls are missing, and
  // neither alphabet_size nor time_step is used in the visible fragment.
  int alphabet_size=output_layer->shape();

  int time_step=output_layer->shape();

 vector<int> shape;

// Fetch the intermediate blob by name and print each of its dimensions.
const boost::shared_ptr<Blob<float> > blstm_input = m_net->blob_by_name("blstm_input");

    shape = blstm_input->shape();

    // NOTE(review): loop start literal missing — presumably 0; confirm.
    for(int i = ; i < shape.size(); i++)

    {

        cout<<" blstm_input shape:"<<i<<"    :"<<shape[i]<<endl;

    }

    // Same shape dump for the blob named "lstm1".
    const boost::shared_ptr<Blob<float> > lstm1 = m_net->blob_by_name("lstm1");

    shape = lstm1->shape();

    // NOTE(review): loop start literal missing — presumably 0; confirm.
    for(int i = ; i < shape.size(); i++)

    {

        cout<<" lstm1 shape:"<<i<<"    :"<<shape[i]<<endl;

    }

    cout<<"==============blob info======="<<endl;

    // Output text file that receives the values of blstm_input.
    ofstream of("blstm.txt");

    // One iteration per item h of the blob.
    // NOTE(review): both the start value and the upper bound are missing.
    for(int h = ; h < ; h++)

    {

        // Number of values per item: channels * height * width.
        int count = blstm_input->channels() * blstm_input->height() * blstm_input->width();

        // cout<<"blstm_input->channels():"<<blstm_input->channels()<<"    blstm_input->height():"<<blstm_input->height()

        //     <<"    blstm_input->width():"<<blstm_input->width()<<endl;

        // NOTE(review): feature_array is filled by the memcpy below but never
        // read; the output loop prints from feature_blob_data directly.
        float* feature_array = new float[count];

        const float* feature_blob_data = blstm_input->cpu_data() +

            blstm_input->offset(h); // feature data generated from the nth input image within a batch

        memcpy(feature_array, feature_blob_data, count * sizeof(float)); 

        // Write every value of item h, tagged with h and a column index.
        // NOTE(review): loop start literal missing — presumably 0; confirm.
        for(int i = ; i < count; i++ )

        {

            // Start a new output line at a fixed interval.
            // NOTE(review): the interval and the compared value are missing.
            if(i && i %  == )

            {

                of<<endl;

            }

            // NOTE(review): modulus operand missing in the column index.
            of<<"    ["<< h<< ","<<i % << "]:"<<feature_blob_data[i];

        }

        of<<endl;

        delete [] feature_array;

    }

    of.close();

参考：

https://stackoverflow.com/questions/40938372/how-to-get-features-from-several-layers-using-c-in-caffe

caffe-----使用C++ 提取网络中间层特征数据的更多相关文章

Paper | 深度网络中特征的可迁移性
目录 1. 核心贡献 2. 实验设置 2.1. 任务设置 2.2. 网络设置 3. 实验结果 4. 启发论文:How transferable are features in deep neural ...
KDD Cup 99网络入侵检测数据的分析
看论文该数据集是从一个模拟的美国空军局域网上采集来的 9 个星期的网络连接数据, 分成具有标识的训练数据和未加标识的测试数据.测试数据和训练数据有着不同的概率分布, 测试数据包含了一些未出现在训练数 ...
python数据可视化-matplotlib入门(7)-从网络加载数据及数据可视化的小总结
除了从文件加载数据,另一个数据源是互联网,互联网每天产生各种不同的数据,可以用各种各样的方式从互联网加载数据. 一.了解 Web API Web 应用编程接口(API)自动请求网站的特定信息,再对这些 ...
Android之三种网络请求解析数据(最佳案例)
AsyncTask解析数据 AsyncTask主要用来更新UI线程,比较耗时的操作可以在AsyncTask中使用. AsyncTask是个抽象类,使用时需要继承这个类,然后调用execute()方法. ...
ASP.NET提取多层嵌套json数据的方法
本文实例讲述了ASP.NET利用第三方类库Newtonsoft.Json提取多层嵌套json数据的方法,具体例子如下. 假设需要提取的json字符串如下: {"name":&quo ...
NLP用CNN分类Mnist，提取出来的特征训练SVM及Keras的使用（demo）
用CNN分类Mnist http://www.bubuko.com/infodetail-777299.html /DeepLearning Tutorials/keras_usage 提取出来的特征 ...
教你50招提升ASP.NET性能（十）：减少通过网络发送的数据
(16)Reduce the data sent across the network 招数16: 减少通过网络发送的数据 Reducing the amount of data sent acros ...
iOS开发网络篇—JSON数据的解析
iOS开发网络篇—JSON数据的解析 iOS开发网络篇—JSON介绍一.什么是JSON JSON是一种轻量级的数据格式,一般用于数据交互服务器返回给客户端的数据,一般都是JSON格式或者XML格式 ...
分享非常有用的Java程序(关键代码)(八)---Java InputStream读取网络响应Response数据的方法!(重要)
原文:分享非常有用的Java程序(关键代码)(八)---Java InputStream读取网络响应Response数据的方法!(重要) Java InputStream读取数据问题 ======== ...

随机推荐

UVA - 10829 L-Gap Substrings (后缀自动机+线段树启发式合并)
题意:统计一段字符串中形如UVU的子串个数(其中V的长度固定为g). 问题等价于求满足$g+1\leqslant |j-i|\leqslant g+LCP(i,j)$的后缀(i,j)的对数,即$\su ...
C++构造函数实例
#include<iostream> #include <string> using namespace std; class Person { public: //无参(默认 ...
printf计算参数是从右到左压栈的（a++和++a的压栈的区别）
一.问题 c++代码: #include <iostream> #include <stdio.h> using namespace std; int main(){ ; co ...
[洛谷P4072] SDOI2016 征途
问题描述 Pine开始了从S地到T地的征途. 从S地到T地的路可以划分成n段,相邻两段路的分界点设有休息站. Pine计划用m天到达T地.除第m天外,每一天晚上Pine都必须在休息站过夜.所以,一段路 ...
[人物存档]【AI少女】【捏脸数据】现代风格
点击下载:6543d037acaf2edd03b4679f821001e9380193ce.png
如何查看 SQL Server 执行的历史 SQL 语句记录？
SELECT st.text as sql_statement, qs.creation_time as plan_last_compiled, qs.last_execution_time as p ...
react 的className动态修改
https://blog.csdn.net/suwyer/article/details/81481507(copy) <div style={{display: (index===this.s ...
java web文件上传功能实现
核心原理: 该项目核心就是文件分块上传.前后端要高度配合,需要双方约定好一些数据,才能完成大文件分块,我们在项目中要重点解决的以下问题. * 如何分片: * 如何合成一个文件: * 中断了从哪个分片开 ...
poj 3662 Telephone Lines dijkstra+二分搜索
Telephone Lines Time Limit: 1000MS Memory Limit: 65536K Total Submissions: 5696 Accepted: 2071 D ...
ABI与ARM，X86的概念
Android系统目前支持以下七种不同的CPU架构:ARMv5,ARMv7 (从2010年起),x86 (从2011年起),MIPS (从2012年起),ARMv8,MIPS64和x86_64 (从2 ...

caffe-----使用C++ 提取网络中间层特征数据

caffe-----使用C++ 提取网络中间层特征数据的更多相关文章

随机推荐

热门专题