torchnet+VGG16计算patch之间相似度

torch

VGG16

similarity

本来打算使用VGG实现siamese CNN的，但是没想明白怎么使用torchnet对模型进行微调。。。所以只好把VGG的卷积层单独做一个数据预处理模块，后面跟一个网络，将两个VGG输出的结果输入该网络中，仅训练这个浅层网络。

数据：使用了MOTChallenge数据库MOT16-02中的pedestrian

代码：

-- ---------------------------------------------------------------------------------------
-- 读取MOT16-02数据集的groundtruth，分成训练集和测试集
-- ---------------------------------------------------------------------------------------
require 'torch'
require 'cutorch'
torch.setdefaulttensortype('torch.FloatTensor')
data_type = 'torch.CudaTensor' -- 设置数据类型，不适用GPU可以设置为torch.FloatTensor
require 'image'
local datapath = '/home/zwzhou/programFiles/2DMOT2015/MOT16/train/MOT16-02/'
local tmp = image.load(datapath .. 'img1/000001.jpg',3,'byte')
local width = tmp:size(3)
local height = tmp:size(2)
local num = 600
local imgs = torch.Tensor(num,3,height,width)
local file,_ = io.open('imgs.t7')
if not file then
for i=1,num do -- 读取视频帧
imgs[i]=image.load(datapath .. 'img1/' .. string.format('%06d.jpg',i))
end
torch.save('imgs.t7',imgs)
else
imgs = torch.load('imgs.t7')
end
require'sys'
local gt_path = datapath .. 'gt/gt.txt'
local gt_info={}
local i=0
for line in io.lines(gt_path) do -- pedestrians的patch信息
local v=sys.split(line,',')
if tonumber(v[7]) ==1 and tonumber(v[9]) > 0.8 then -- 筛选有效的patch，是pedestrian且可见度>0.8
table.insert(gt_info,{tonumber(v[1]),tonumber(v[2]),tonumber(v[3]),tonumber(v[4]),tonumber(v[5]),tonumber(v[6])})
-- 对应的是frame index,track index, x, y, w, h
end
end
-- 构建样本对，这里主要是为了正负样本个数相同，每个pedestrian选取25个相同id的patch，25个不同id的patch
local pairwise={}
for i=1,#gt_info do
local count=0
local iter=0
repeat
local j=torch.ceil(torch.rand(1)*(#gt_info))[1]
if gt_info[i][2] == gt_info[j][2] then
count=count+1
table.insert(pairwise,{i,j})
end
iter=iter+1
until(count >25 or iter>100)
repeat
local j=torch.ceil(torch.rand(1)*#gt_info)[1]
if gt_info[i][2] ~= gt_info[j][2] then
count=count-1
table.insert(pairwise,{i,j})
end
until(count <0)
end
local function cast(x) return x:type(data_type) end -- 类型转换
-- 加载pretrained VGG16 model
require 'nn'
require 'loadcaffe'
local function getPretrainedModel()
local proto = '/home/zwzhou/modelZoo/VGG_ILSVRC_16_layers_deploy.prototxt'
local caffemodel = '/home/zwzhou/modelZoo/VGG_ILSVRC_16_layers.caffemodel'
local VGG16 = loadcaffe.load(proto,caffemodel,'nn')
for i = 1,3 do
VGG16.modules[#VGG16.modules]=nil
end
return VGG16
end
-- 为了能够使用VGG，需要定义一些预处理方法
local loadSize = {3,256,256}
local sampleSize={3,224,224}
local function adjustScale(input) -- VGG需要先将输入图片的最小边缩放到256，另一边保持纵横比
if input:size(3) < input:size(2) then
input = image.scale(input,loadSize[2],loadSize[3]*input:size(2)/input:size(3))
else
input = image.scale(input,loadSize[2]*input:size(3)/input:size(2),loadSize[3])
end
return input
end
local bgr_means = {103.939,116.779,123.68} -- VGG使用的均值，注意是BGR通道，image.load()获得的是rgb
local function vggProcessing(img)
local img2 = img:clone() -- 深度拷贝
img2[{{1}}] = img[{{3}}]
img2[{{3}}] = img[{{1}}] -- rgb -> bgr
img2=img2:mul(255)
for i=1,3 do
img2[i]:add(-bgr_means[i])
end
return img2
end
local function centerCrop(input) -- 截取224*224大小
local oH = sampleSize[2]
local oW = sampleSize[3]
local iW = input:size(3)
local iH = input:size(2)
local w1 = math.ceil((iW-oW)/2)
local h1 = math.ceil((iH-oH)/2)
local out = image.crop(input,w1,h1,w1+oW,h1+oH)
return out
end
local file,_ = io.open('vgg_info.t7')
local vgg_info={}
if not file then
local VGG16_model = getPretrainedModel()
if data_type:match'torch.Cuda.*Tensor' then
require 'cudnn'
require 'cunn'
cudnn.convert(VGG16_model,cudnn):cuda()
cudnn.benchmark = true
end
cast(VGG16_model)
for i=1, #gt_info do
local idx=gt_info[i]
local img = imgs[idx[1]]
local x1 = math.max(idx[3],1)
local y1 = math.max(idx[4],1)
local x2 = math.min(idx[3]+idx[5],width)
local y2 = math.min(idx[4]+idx[6],height)
local patch = image.crop(img,x1,y1,x2,y2)
patch = adjustScale(patch)
patch = vggProcessing(patch)
patch = centerCrop(patch)
patch=cast(patch)
table.insert(vgg_info,VGG16_model:forward(patch):float())
end
torch.save('vgg_info.t7',vgg_info)
else
vgg_info=torch.load('vgg_info.t7')
end
local function getPatchPair(tmp) -- 获得patch 对
local pp = {}
pp[1] = vgg_info[tmp[1]]
pp[2] = vgg_info[tmp[2]]
local t=torch.cat(pp[1],pp[2],1)
return t
end
-- 定义datasetiterator
local tnt=require'torchnet'
local function getIterator(mode)
-- 创建model
local fc = nn.Sequential()
fc:add(nn.View(-1,4096*2))
fc:add(nn.Linear(4096*2,500))
fc:add(nn.ReLU(true))
fc:add(nn.Normalize(2))
fc:add(nn.Linear(500,500))
fc:add(nn.ReLU(true))
fc:add(nn.Linear(500,1))
-- print(fc:forward(torch.randn(2,4096*2)))
if data_type:match'torch.Cuda.*Tensor' then
require 'cudnn'
require 'cunn'
cudnn.convert(fc,cudnn):cuda()
cudnn.benchmark = true
end
cast(fc)
-- 构建训练引擎，使用OptimEngine
require 'optim'
local engine = tnt.OptimEngine()
local criterion = cast(nn.MarginCriterion())
-- 创建一些评估值
local train_timer = torch.Timer()
local test_timer = torch.Timer()
local data_timer = torch.Timer()
local meter = tnt.AverageValueMeter() -- 用于统计评估函数的输出
local confusion = optim.ConfusionMatrix(2) -- 2类混淆矩阵
local data_time_meter = tnt.AverageValueMeter()
-- log
local logtext=require 'torchnet.log.view.text'
log = tnt.Log{
keys = {'train_loss','train_acc','data_loading_time','epoch','test_acc','train_time','test_time'},
onFlush={
logtext{keys={'train_loss','train_acc','data_loading_time','epoch','test_acc','train_time','test_time'}}
}
}
local inputs = cast(torch.Tensor())
local targets = cast(torch.Tensor())
-- 填一些hook函数，以便观察训练过程
engine.hooks.onSample = function(state)
if state.training then
data_time_meter:add(data_timer:time().real)
end
inputs:resize(state.sample.input:size()):copy(state.sample.input)
targets:resize(state.sample.target:size()):copy(state.sample.target)
state.sample.input = inputs
state.sample.target = targets
end
engine.hooks.onForwardCriterion = function(state)
meter:add(state.criterion.output)
confusion:batchAdd(state.network.output:gt(0):add(1),state.sample.target:gt(0):add(1))
end
local function test() -- 用于测试
engine:test{
network = fc,
iterator = getIterator('test'),
criterion=criterion,
}
confusion:updateValids()
end
engine.hooks.onStartEpoch = function(state)
local epoch = state.epoch + 1
print('===>' .. ' online epoch # ' .. epoch .. '[batchsize = 256]')
meter:reset()
confusion:zero()
train_timer:reset()
data_time_meter:reset()
end
engine.hooks.onEndEpoch = function(state)
local train_loss = meter:value()
confusion:updateValids()
local train_acc = confusion.totalValid*100
local train_time = train_timer:time().real
meter:reset()
print(confusion)
confusion:zero()
test_timer:reset()
local cache = state.params:clone() -- 保存现场
--state.params:copy(state.optim.ax)
test()
--state.params:copy(cache) -- 恢复现场
log:set{
train_loss = train_loss,
train_acc = train_acc,
data_loading_time = data_time_meter:value(),
epoch = state.epoch,
test_acc = confusion.totalValid*100,
train_time = train_time,
test_time = test_timer:time().real,
}
log:flush()
end
engine.hooks.onUpdate = function(state)
data_timer:reset()
end
engine:train{
network = fc,
criterion = criterion,
iterator = getIterator('train'),
optimMethod = optim.sgd,
config = {learningRate = 0.05,
--weightDecay = 0.05,
momentum = 0.9,
--t0 = 1e+4,
--eta0 =0.1
},
maxepoch = 30,
}
-- 保存模型
local modelpath = 'SiaVGG16_model.t7'
print('Saving to ' .. modelpath)
torch.save(modelpath,fc:float():clearState())
--]]

输出：

1493386765674.jpg

发现网络太容易过拟合，主要一方面是数据太少，另一方面是视频中就那么几个人，所以patch之间的相关性太大，对网络提供的信息太少。所以使用更多的数据测试结果应该会好许多。

这个代码主要是为了熟悉torchnet package，感受呢，

对于数据的预处理，确实方便多了
如果使用提供的Engine，虽然训练过程简单了但是也太模块化了，比如某些层的微调，比如每层设置不同的学习率
使用Iterator时，尤其要小心

torchnet+VGG16计算patch之间相似度的更多相关文章

(转）c# math 计算两点之间的角度公式
计算两点之间的角度公式是: 假设点一(X1,Y1),点二(X2,Y2) double angleOfLine = Math.Atan2((Y2 - Y1), (X2 - X2)) * 180 / Ma ...
python-Levenshtein几个计算字串相似度的函数解析
linux环境下,没有首先安装python_Levenshtein,用法如下: 重点介绍几个该包中的几个计算字串相似度的几个函数实现. 1. Levenshtein.hamming(str1, str ...
sql server2008根据经纬度计算两点之间的距离
--通过经纬度计算两点之间的距离 create FUNCTION [dbo].[fnGetDistanceNew] --LatBegin 开始经度 --LngBegin 开始维度 --29.49029 ...
C#面向对象思想计算两点之间距离
题目为计算两点之间距离. 面向过程的思维方式,两点的横坐标之差,纵坐标之差,平方求和,再开跟,得到两点之间距离. using System; using System.Collections.Gene ...
2D和3D空间中计算两点之间的距离
自己在做游戏的忘记了Unity帮我们提供计算两点之间的距离,在百度搜索了下. 原来有一个公式自己就写了一个方法O(∩_∩)O~,到僵尸到达某一个点之后就向另一个奔跑过去 /// <summary ...
Jquery计算时间戳之间的差值，可返回年，月，日，小时等
/** * 计算时间戳之间的差值 * @param startTime 开始时间戳 * @param endTime 结束时间戳 * @param type 返回指定类型差值(year, month, ...
Levenshtein Distance莱文斯坦距离算法来计算字符串的相似度
Levenshtein Distance莱文斯坦距离定义: 数学上,两个字符串a.b之间的莱文斯坦距离表示为levab(|a|, |b|). levab(i, j) = max(i, j) 如果mi ...
<tf-idf + 余弦相似度> 计算文章的相似度
背景知识: (1)tf-idf 按照词TF-IDF值来衡量该词在该文档中的重要性的指导思想:如果某个词比较少见,但是它在这篇文章中多次出现,那么它很可能就反映了这篇文章的特性,正是我们所需要的关键词. ...
numpy :: 计算特征之间的余弦距离
余弦距离在计算相似度的应用中经常使用,比如: 文本相似度检索人脸识别检索相似图片检索原理简述下面是余弦相似度的计算公式(图来自wikipedia): 但是,余弦相似度和常用的欧式距离的有所区别 ...

随机推荐

无线路由器wan口和lan口ip同网段导致无法上网解决办法
环境本地网段为192.168.0.0/24 路由器默认网段也是192.168.0.0/24 设置好路由器wan口DHCP自动获取ip以后无法上网解决办法把路由器是lan口地址设置为192.168 ...
《挑战程序设计竞赛》2.5 最小生成树 POJ3723 3169 1258 2377 2395 AOJ2224（1）
POJ3723 http://poj.org/problem?id=3723 题意 windy要组建一支军队,召集了N个女孩和M个男孩,每个人要付10000RMB,但是如果一个女孩和一个男孩有关系d的 ...
UnicodeEncodeError: 'gbk' codec can't encode character '\xbb' in position 0: illegal multibyte sequence
使用Python写文件的时候,或者将网络数据流写入到本地文件的时候,大部分情况下会遇到:UnicodeEncodeError: 'gbk' codec can't encode character ' ...
network command assistant
这篇文章收集了久经考验靠谱的命令,也收集了几个比较新的命令.多数命令都可以在图形桌面执行,即使是没什么终端使用经验的Linux用户也会常常执行命令来使用ping或是其它的网络诊断工具. 1.curl ...
Caocao's Bridges---hdu4738（桥）
http://acm.hdu.edu.cn/showproblem.php?pid=4738 题就是求出所有的桥,然后输出桥的权值的最小值. 如果一开始是不连通的,输出0. 图有重边,需要处理, 不能 ...
11.Git分支管理
分支就是科幻电影里面的平行宇宙,当你正在电脑前努力学习Git的时候,另一个你正在另一个平行宇宙里努力学习SVN. 如果两个平行宇宙互不干扰,那对现在的你也没啥影响.不过,在某个时间点,两个平行宇宙合并 ...
005-java的Annotation
一.概述 Annotation,JDK1.5开始提供二.基本定义 public @interface HelloWorld { } 1.使用@Interface定义,名称大写 2.使用@Target ...
Hadoop权限认证的执行流程
Hadoop分布式文件系统实现了一个和POSIX系统类似的文件和目录的权限模型.每个文件和目录有一个所有者(owner)和一个组(group).文件或目录对其所有者.同组的其他用户以及所有其他用户分别 ...
python中的TCP及UDP
python中是通过套接字即socket来实现UDP及TCP通信的.有两种套接字面向连接的及无连接的,也就是TCP套接字及UDP套接字. TCP通信模型创建TCP服务器伪代码: ss = sock ...
机器学习实战python3 K近邻（KNN）算法实现
台大机器技法跟基石都看完了,但是没有编程一直,现在打算结合周志华的<机器学习>,撸一遍机器学习实战, 原书是python2 的,但是本人感觉python3更好用一些,所以打算用python ...

torchnet+VGG16计算patch之间相似度

torchnet+VGG16计算patch之间相似度

torchnet+VGG16计算patch之间相似度的更多相关文章

随机推荐

热门专题