cnn进行端到端的验证码识别改进

keras_cnn.py 训练及建模

#!/usr/bin/env python

# coding=utf-8

"""

利用keras cnn进行端到端的验证码识别， 简单直接暴力。

迭代100次可以达到95%的准确率，但是很容易过拟合，泛化能力糟糕， 除了增加训练数据还没想到更好的方法.

__author__: jkmiao

__email__: miao1202@.com

___date__:--

"""

from keras.models import Model

from keras.layers import Dense, Dropout, Flatten, Input, merge

from keras.layers import Convolution2D, MaxPooling2D

from keras.preprocessing.image import ImageDataGenerator

from PIL import Image

import os, random

import numpy as np

from keras.models import model_from_json

from util import CharacterTable

from keras.callbacks import EarlyStopping

from sklearn.model_selection import train_test_split

# from keras.utils.visualize_util import plot

def load_data(path='img/clearNoise/'):
    """Load labelled captcha images from a directory.

    Every file in ``path`` whose name ends with ``'jpg'`` is collected and
    the list is shuffled in place.  For each file the label is taken from
    the file name (split on ``'/'`` and then on ``'_'``), the image is
    opened as 8-bit grayscale (``'L'``), thresholded, reshaped and appended
    to the data list; the lower-cased label is appended to the label list.
    Files whose label length does not match the expected length are
    reported with ``print`` and skipped.

    Returns a tuple ``(np.array(data), label)`` where ``label`` is a plain
    Python list of lower-case strings.

    NOTE(review): several numeric literals are missing from this copy of
    the source (the two split indexes, the expected label length, the
    binarisation threshold and its scale factor, and the reshape
    dimensions).  The function does not parse as written; restore the
    values from the original script before running.
    """

    fnames = [os.path.join(path, fname) for fname in os.listdir(path) if fname.endswith('jpg')]

    random.shuffle(fnames)

    data, label = [], []

    for i, fname in enumerate(fnames):

        # Label is encoded in the file name; presumably the basename
        # ([-1]) and its first '_'-separated field ([0]) -- TODO confirm.
        imgLabel = fname.split('/')[-].split('_')[]

        # Skip files whose label length is unexpected (expected length is
        # missing here; the model below has six output heads -- confirm).
        if len(imgLabel)!=:

            print 'error: ', fname

            continue

        imgM = np.array(Image.open(fname).convert('L'))

        # Binarise: boolean mask (pixel > threshold) scaled by a constant.
        # Both the scale and the threshold are missing in this copy.
        imgM =  * (imgM>)

        # Reshape to the 3-D layout the network input expects (dims missing).
        data.append(imgM.reshape((, , )))

        label.append(imgLabel.lower())

    return np.array(data), label

# CharacterTable is imported from the project-local `util` module; below it
# is used to encode label strings into vectors and to decode vectors back.
ctable = CharacterTable()

data, label = load_data()

# Sanity check of the pixel value range of one sample (index missing here).
print data[].max(), data[].min()

# One row per sample; the row width (second dimension) is missing in this
# copy -- it must match the length of the vector ctable.encode() returns.
label_onehot = np.zeros((len(label), ))

for i, lb in enumerate(label):

    label_onehot[i,:] = ctable.encode(lb)

print data.shape, data[-].max(), data[-].min()

print label_onehot.shape

# Augmentation: small shear/zoom/shift (and a rotation whose range is
# missing here); horizontal flipping is explicitly disabled.
datagen = ImageDataGenerator(shear_range=0.08, zoom_range=0.08, horizontal_flip=False,

                            rotation_range=, width_shift_range=0.06, height_shift_range=0.06)

# NOTE(review): in Keras, fit() is only required for the featurewise / ZCA
# options, none of which are enabled above -- presumably a no-op; confirm.
datagen.fit(data)

# Hold out 10% of the samples for validation / testing.
x_train, x_test, y_train, y_test = train_test_split(data, label_onehot, test_size=0.1)

# True  -> build the network from scratch (branch below).
# False -> reload the previously saved architecture and weights ("model3")
#          and continue from there.  False is the value set here.
DEBUG = False

# Build the model

if DEBUG:

    # NOTE(review): every layer hyperparameter in this branch (input shape,
    # filter counts, kernel sizes, pool sizes, dense widths, concat axis) is
    # missing from this copy of the source; restore before enabling DEBUG.
    input_img = Input(shape=(, , ))

    # Branch A: conv -> pool -> conv -> conv -> pool -> conv -> flatten,
    # fed directly from the input image.
    inner = Convolution2D(, , , border_mode='same', activation='relu')(input_img)

    inner = MaxPooling2D(pool_size=(,))(inner)

    inner = Convolution2D(, , , border_mode='same')(inner)

    inner = Convolution2D(, , , border_mode='same')(inner)

    inner = MaxPooling2D(pool_size=(,))(inner)

    inner = Convolution2D(, , , border_mode='same')(inner)

    encoder_a = Flatten()(inner)

    # Branch B: same layer sequence, again starting from input_img
    # (presumably with different kernel sizes -- values missing; confirm).
    inner = Convolution2D(, , , border_mode='same', activation='relu')(input_img)

    inner = MaxPooling2D(pool_size=(,))(inner)

    inner = Convolution2D(, , , border_mode='same')(inner)

    inner = Convolution2D(, , , border_mode='same')(inner)

    inner = MaxPooling2D(pool_size=(,))(inner)

    inner = Convolution2D(, , , border_mode='same')(inner)

    encoder_b = Flatten()(inner)

    # Branch C: same layer sequence, again starting from input_img.
    inner = Convolution2D(, , , border_mode='same', activation='relu')(input_img)

    inner = MaxPooling2D(pool_size=(,))(inner)

    inner = Convolution2D(, , , border_mode='same')(inner)

    inner = Convolution2D(, , , border_mode='same')(inner)

    inner = MaxPooling2D(pool_size=(,))(inner)

    inner = Convolution2D(, , , border_mode='same')(inner)

    encoder_c = Flatten()(inner)

    # Concatenate the three flattened branches into one feature vector.
    # NOTE(review): the name `input` shadows the Python builtin.
    input = merge([encoder_a, encoder_b, encoder_c], mode='concat', concat_axis=-)

    drop = Dropout(0.5)(input)

    # Shared fully connected layer (despite the variable name, this is a
    # Dense layer, not a Flatten), followed by dropout.
    flatten = Dense()(drop)

    flatten = Dropout(0.5)(flatten)

    # Six independent softmax heads on the shared features -- presumably one
    # per captcha character position; confirm against CharacterTable.
    fc1 = Dense(, activation='softmax')(flatten)

    fc2 = Dense(, activation='softmax')(flatten)

    fc3 = Dense(, activation='softmax')(flatten)

    fc4 = Dense(, activation='softmax')(flatten)

    fc5 = Dense(, activation='softmax')(flatten)

    fc6 = Dense(, activation='softmax')(flatten)

    # The model output is the concatenation of the six head outputs.
    merged = merge([fc1, fc2, fc3, fc4, fc5, fc6], mode='concat', concat_axis=-)

    model = Model(input=input_img, output=merged)

else:

    # Reload the saved architecture (JSON) and weights (HDF5).
    # NOTE(review): the file object returned by open() is never closed.
    model = model_from_json(open('model/ba_cnn_model3.json').read())

    model.load_weights('model/ba_cnn_model3.h5')

# Compile

# model.compile(loss='categorical_crossentropy', optimizer='sgd', metrics=['accuracy'])

model.summary()

# NOTE(review): in the DEBUG branch the output is a concatenation of several
# softmax heads, so this loss is applied over the concatenated vector --
# confirm that this is the intended objective.
model.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])

# plot(model, to_file='model3.png', show_shapes=True)

# Train

# Stop when validation loss stops improving (patience value missing here).
early_stopping = EarlyStopping(monitor='val_loss', patience=)

# Train on augmented batches from datagen; the held-out split is used as
# validation data.  batch_size and nb_epoch are missing in this copy.
model.fit_generator(datagen.flow(x_train, y_train, batch_size=), samples_per_epoch=len(x_train), nb_epoch=, validation_data=(x_test, y_test), callbacks=[early_stopping] )

# Persist architecture (JSON) and weights (HDF5) under the "model4" name.
json_string = model.to_json()

with open('./model/ba_cnn_model4.json', 'w') as fw:

    fw.write(json_string)

model.save_weights('./model/ba_cnn_model4.h5')

# NOTE(review): the message says "cnn3" but the files written are "model4".
print 'done saved model cnn3'

# Test

# Predict on the held-out split and count exact string matches after
# decoding both prediction and ground truth with ctable.
y_pred = model.predict(x_test, verbose=)

# NOTE(review): the initial value is missing in this copy (presumably 0).
cnt =

for i in range(len(y_pred)):

    guess = ctable.decode(y_pred[i])

    correct = ctable.decode(y_test[i])

    if guess == correct:

        # Increment is missing in this copy (presumably 1).
        cnt +=

    # Periodically print a sample prediction next to its ground truth
    # (the interval and the separator width are missing in this copy).
    if i%==:

        print '--'*, i

        print 'y_pred', guess

        print 'y_test', correct

# Fraction of test samples whose decoded prediction equals the label.
print cnt/float(len(y_pred))

apicode.py 模型使用

#!/usr/bin/env python

# coding=utf-8

from util import CharacterTable

from keras.models import model_from_json

from PIL import Image

import matplotlib.pyplot as plt

import os

import numpy as np

from prepare import clearNoise

def img2vec(fname):
    """Convert one image file into a single-sample batch for the model.

    The file is passed through ``clearNoise`` (imported from the
    project-local ``prepare`` module), converted to 8-bit grayscale
    (``'L'``), thresholded to a 0.0 / 1.0 float array and reshaped.

    Returns ``(batch, imgM)``: ``batch`` is an array holding the one
    reshaped sample, ``imgM`` is the thresholded 2-D image before reshape.

    NOTE(review): the threshold and the reshape dimensions are missing
    from this copy of the source; they must match the preprocessing used
    in training (``load_data`` in keras_cnn.py).
    """

    data = []

    img = clearNoise(fname).convert('L')

    # Binarise: 1.0 where the pixel exceeds the (missing) threshold, else 0.0.
    imgM = 1.0 * (np.array(img)>)

    # Debug output of the value range.
    print imgM.max(), imgM.min()

    data.append(imgM.reshape((, , )))

    return np.array(data), imgM

# Label codec from the project-local `util` module; used by test() to turn
# the model output back into a string.
ctable = CharacterTable()

# Restore the trained network: architecture from JSON, weights from HDF5.
# The JSON file is read inside a `with` block so the handle is closed
# promptly instead of being left to the garbage collector.
with open('model/ba_cnn_model4.json') as model_file:

    model = model_from_json(model_file.read())

model.load_weights('model/ba_cnn_model4.h5')

def test(path):
    """Run the loaded model over the files in ``path`` and print accuracy.

    For each file the image is vectorised with ``img2vec``, predicted with
    the module-level ``model``, decoded with ``ctable`` and compared with
    the label taken from the file name.  A running accuracy is printed
    after every file.  Nothing is returned.

    NOTE(review): several numeric literals are missing from this copy of
    the source (slice bound, counter initial value and increment, the
    enumerate start, the index into ``y_pred``, the split indexes and the
    separator width); restore them before running.
    """

    # Candidate files; the slice presumably caps how many are evaluated
    # (bound missing -- as written `[:]` is just a copy).
    fnames = [ os.path.join(path, fname) for fname in os.listdir(path) ][:]

    correct =

    # NOTE(review): idx is used as the divisor below, so the start value is
    # presumably 1; a start of 0 would divide by zero on the first file.
    for idx, fname in enumerate(fnames, ):

        data, imgM = img2vec(fname)

        y_pred = model.predict(data)

        # The batch holds a single sample; decode its prediction.
        result = ctable.decode(y_pred[])

        # Ground truth comes from the file name.  Unlike load_data() in the
        # training script, the label is not lower-cased here.
        label = fname.split('/')[-].split('_')[]

        if result == label:

            correct +=

            print 'correct', fname

        else:

            print result, label

        # Running accuracy over the files processed so far.
        print 'accuracy: ',idx, float(correct)/idx

        print '=='*

#        plt.subplot()

#        plt.imshow(Image.open(fname).convert('L'), plt.cm.gray)

#        plt.title(fname)

#

#        plt.subplot()

#        plt.imshow(imgM, plt.cm.gray)

#        plt.title(result)

#        plt.show()

# Evaluate on the files in the relative directory 'test'; this runs
# unconditionally whenever the module is executed or imported.
test('test')

cnn进行端到端的验证码识别改进的更多相关文章

基于tensorflow的‘端到端’的字符型验证码识别源码整理(github源码分享)
基于tensorflow的‘端到端’的字符型验证码识别 1 Abstract 验证码(CAPTCHA)的诞生本身是为了自动区分自然人和机器人的一套公开方法, 但是近几年的人工智能技术的发展 ...
基于python语言的tensorflow的‘端到端’的字符型验证码识别源码整理(github源码分享)
基于python语言的tensorflow的‘端到端’的字符型验证码识别 1 Abstract 验证码(CAPTCHA)的诞生本身是为了自动区分自然人和机器人的一套公开方法, 但是近几年的 ...
CNN+BLSTM+CTC的验证码识别从训练到部署
项目地址:https://github.com/kerlomz/captcha_trainer 1. 前言本项目适用于Python3.6,GPU>=NVIDIA GTX1050Ti,原mast ...
【转】CNN+BLSTM+CTC的验证码识别从训练到部署
[转]CNN+BLSTM+CTC的验证码识别从训练到部署转载地址:https://www.jianshu.com/p/80ef04b16efc 项目地址:https://github.com/ker ...
[验证码识别技术] 字符型验证码终结者-CNN+BLSTM+CTC
验证码识别(少样本,高精度)项目地址:https://github.com/kerlomz/captcha_trainer 1. 前言本项目适用于Python3.6,GPU>=NVIDIA G ...
Python实现各类验证码识别
项目地址: https://github.com/kerlomz/captcha_trainer 编译版下载地址: https://github.com/kerlomz/captcha_trainer ...
基于SVM的字母验证码识别
基于SVM的字母验证码识别摘要本文研究的问题是包含数字和字母的字符验证码的识别.我们采用的是传统的字符分割识别方法,首先将图像中的字符分割出来,然后再对单字符进行识别.首先通过图像的初步去噪.滤波 ...
[验证码识别技术]字符验证码杀手--CNN
字符验证码杀手--CNN 1 abstract 目前随着深度学习,越来越蓬勃的发展,在图像识别和语音识别中也表现出了强大的生产力.对于普通的深度学习爱好者来说,一上来就去跑那边公开的大型数据库,比如I ...
强智教务系统验证码识别 Tensorflow CNN
强智教务系统验证码识别 Tensorflow CNN 一直都是使用API取得数据,但是API提供的数据较少,且为了防止API关闭,先把验证码问题解决使用Tensorflow训练模型,强智教务系统的验 ...

随机推荐

《DSP using MATLAB》Problem 5.31
第3小题: 代码: %% ++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++++ %% Out ...
小白python 安装
小白python 安装: https://blog.csdn.net/qq_36667170/article/details/79275605 https://blog.csdn.net/nmjuzi ...
LG4238 【【模板】多项式求逆】
前言学习了Great_Influence的递推实现,我给大家说一下多项式求逆严格的边界条件,因为我发现改动一些很小的边界条件都会使程序出错.怎么办,背代码吗?背代码是不可能,这辈子都不会背代码的.理 ...
day 06云计算的三种服务模式：IaaS，PaaS和SaaS
云计算的三种服务模式:IaaS,PaaS和SaaS ”云服务”现在已经快成了一个家喻户晓的词了.如果你不知道PaaS, IaaS 和SaaS的区别,那么也没啥,因为很多人确实不知道. “云”其实是互联 ...
JS从数组中随机取出几个数组元素的方法
原文链接:http://caibaojian.com/js-get-random-elements-from-array.html js如何从一个数组中随机取出一个元素或者几个元素. 假如数组为· v ...
用Python开发Zeroc Ice应用
Zeroc Ice简介 Zeroc ICE(Internet Communications Engine ,互联网通信引擎)是目前功能比较强大和完善的RPC框架,支持跨平台.跨语言调用.它非常灵活 ...
oracle实用命令入门
登录oracle(需要在oracle用户下) 执行sqlplus,然后输入用户名和密码就可以了,如果是第一次使用oracle的话,可以直接使用sqlplus / as sysdba免密码以管理员的身份 ...
day 53 js学习之
---恢复内容开始--- 1.昨日作业讲解弄一个上图一样的选择器,可以全选,可以反选,取消 <!DOCTYPE html> <html lang="zh-CN" ...
(98)Address already in use: make_sock: could not bind to address 0.0.0.0:80
问题说明80端口被占用,用netstat -nlp |grep :80命令看看有什么进程占用了80端口,发现是httpd进程. 没想到安装了两个apache,我安装apache2.4的时候删除了2.2 ...
REPL
REPL(Read Eval Print Loop:交互式解释器) 表示一个电脑的环境,类似 Window 系统的终端或 Unix/Linux shell,我们可以在终端中输入命令,并接收系统的响应. ...

cnn进行端到端的验证码识别改进

cnn进行端到端的验证码识别改进的更多相关文章

随机推荐

热门专题