如果你最近在考虑OCR的问题，请进来~~~

本文主要是各类ocr的api对比问题，至于app推荐几款：合合信息(扫面全能王)，TextGrabber，白描等等等等

工作需要，搞文字识别技术，对比了几家

百度的OCR:

#!/usr/bin/env python3

# -*- coding: utf-8 -*-

"""

Created on Tue Jun 12 09:37:38 2018

利用百度api实现图片文本识别

@author: XnCSD

"""

import glob

from os import path

import os

from aip import AipOcr

from PIL import Image

def convertimg(picfile, outdir):

    '''

        调整图片大小，对于过大的图片进行压缩

        picfile:    图片路径

        outdir：    图片输出路径

    '''

    img = Image.open(picfile)

    width, height = img.size

    while (width * height > 4000000):  # 该数值压缩后的图片大约 两百多k

        width = width // 2

        height = height // 2

    new_img = img.resize((width, height), Image.BILINEAR)

    new_img.save(path.join(outdir, os.path.basename(picfile)))

def baiduOCR(picfile, outfile):

    """利用百度api识别文本，并保存提取的文字

    picfile:    图片文件名

    outfile:    输出文件

    """

    filename = path.basename(picfile)

    APP_ID = '你自己的appid'  # 刚才获取的 ID，下同

    API_KEY = '创建完实例人家给'

    SECRECT_KEY = '创建完实例人家给'

    client = AipOcr(APP_ID, API_KEY, SECRECT_KEY)

    i = open(picfile, 'rb')

    img = i.read()

    print("正在识别图片：\t" + filename)

    # message = client.basicGeneral(img)  # 通用文字识别，每天 50 000 次免费

    message = client.basicAccurate(img)   # 通用文字高精度识别，每天 800 次免费

    print("识别成功！")

    i.close()

    with open(outfile, 'a+', encoding='utf8') as fo:

        fo.writelines("+" * 60 + '\n')

        fo.writelines("识别图片：\t" + filename + "\n" * 2)

        fo.writelines("文本内容：\n")

        # 输出文本内容

        for text in message.get('words_result'):

            fo.writelines(text.get('words') + '\n')

        fo.writelines('\n' * 2)

    print("文本导出成功！")

    print()

if __name__ == "__main__":

    outfile = '最后写入的文件名'

    outdir ='图片压缩后存储的路径'

    if path.exists(outfile):

        os.remove(outfile)

    if not path.exists(outdir):

        os.mkdir(outdir)

    print("压缩过大的图片...")

    #  首先对过大的图片进行压缩，以提高识别速度，将压缩的图片保存与临时文件夹中

    for picfile in glob.glob("picture\*"):  # 在picture文件夹里放图片

        convertimg(picfile, outdir)

    print("图片识别...")

    for picfile in glob.glob("outdir\*"):

        baiduOCR(picfile, outfile)

        os.remove(picfile)

    print('图片文本提取结束！文本输出结果位于 %s 文件中。' % outfile)

    os.removedirs(outdir)

有道的OCR(加入了自己写的图片压缩以及循环的逻辑，如果有不对的地方请指出)：

#/usr/bin/env python

#coding=utf8

import hashlib

from PIL import Image

import os

import requests

import random

import glob

import json

from os import path

import base64

import time

def convertimg(picfile, outdir):

    '''

        调整图片大小，对于过大的图片进行压缩

        picfile:    图片路径

        outdir：    图片输出路径

    '''

    img = Image.open(picfile)

    width, height = img.size

    while (width * height > 4000000):  # 该数值压缩后的图片大约 两百多k

        width = width // 2

        height = height // 2

    new_img = img.resize((width, height), Image.BILINEAR)

    new_img.save(path.join(outdir, os.path.basename(picfile)))

def youdaoOCR(picfile, outfile):

    """利用有道api识别文本，并保存提取的文字

    picfile:    图片文件名

    outfile:    输出文件

    """

    appKey = '自己的appkey'  # 需要到有道云官网去注册实例

    secretKey = '自己的secretKey'

    httpClient = None

    try:

        filename = path.basename(picfile)

        print('正在识别%s' % filename)

        # print(picfile)

        f = open(picfile, 'rb')  # 二进制方式打开图文件

        img = base64.b64encode(f.read())  # 读取文件内容，转换为base64编码

        f.close()

        img = str(img, 'utf-8')

        detectType = ''

        imageType = ''

        langType = 'auto'

        salt = random.randint(1, 65536)

        sign = appKey + img + str(salt) + secretKey

        m1 = hashlib.md5()

        m1.update(sign.encode('utf-8'))

        sign = m1.hexdigest()

        data = {'appKey': appKey, 'img': img, 'detectType': detectType, 'imageType': imageType,

                'langType': langType, 'salt': str(salt), 'sign': sign}

        req = requests.post('http://openapi.youdao.com/ocrapi', data)

        content = req.text

        j = json.loads(content)

        # print(j)

        # print(j['Result']['regions'])

        lst = []

        for regionstr in j['Result']['regions']:

            for lineStr in regionstr['lines']:

                # print(lineStr['text'])

                lst.append(lineStr['text'])

        result = ','.join(lst)

        print(result)

    except ValueError:

        print("error")

if __name__ == '__main__':

    outfile = 'youdao.txt'  # 最后写入的文件

    outdir = '压缩的图片存储位置'

    if path.exists(outfile):

        os.remove(outfile)  # 如果有要写入的文件,删除

    if not path.exists(outdir):

        os.mkdir(outdir)  # 如果存储压缩后的图片的文件夹，创建

    print("正在压缩过大的图片....")

    for picfile in glob.glob(r"picture\*"):  # 图片存储路径

        convertimg(picfile, outdir)

    print('进行图片识别....')

    for picfile in glob.glob('压缩的图片存储位置\*'):

        youdaoOCR(picfile, outfile)

        os.remove(picfile)

    # print('图片提取结束！文本输出结果位于 %s 文件中。' % outfile)

    os.removedirs(outdir)

阿里的OCR(也加入了图片压缩以及循环功能(官网没有))：

import urllib.request

import urllib.parse

import json

import time

import base64

import glob

import re

from PIL import Image

from os import path

import os

import time

def convertimg(picfile, outdir):

    '''

        调整图片大小，对于过大的图片进行压缩

        picfile:    图片路径

        outdir：    图片输出路径

    '''

    img = Image.open(picfile)

    width, height = img.size

    while (width * height > 4000000):  # 该数值压缩后的图片大约 两百多k

        width = width // 2

        height = height // 2

    new_img = img.resize((width, height), Image.BILINEAR)

    new_img.save(path.join(outdir, os.path.basename(picfile)))

#请求头

headers = {

         'Authorization': 'APPCODE 自己的appcode',  # 阿里云官网上创建实例

         'Content-Type': 'application/json; charset=UTF-8'

    }

def posturl(url,data={}):  # data为第一张的默认参数， data1为第二张的默认参数

  try:

    params = json.dumps(dict).encode(encoding='UTF8')

    req = urllib.request.Request(url, params, headers)

    r = urllib.request.urlopen(req)

    html = r.read()

    r.close()

    return html.decode("utf8")

  except urllib.error.HTTPError as e:

      print(e.code)

      print(e.read().decode("utf8"))

  time.sleep(1)

if __name__=="__main__":

    url_request = "https://ocrapi-document.taobao.com/ocrservice/document"

    outfile = 'ali.txt'

    outdir = '压缩图片的存储位置'

    if path.exists(outfile):

        os.remove(outfile)

    if not path.exists(outdir):

        os.mkdir(outdir)

    print('开始进行图片压缩....')

    for picfile in glob.glob(r"picture\*"):  # 图片的存储位置

        convertimg(picfile, outdir)

    print('开始进行图片识别....')

    for picfile in glob.glob("outdir\*"):

        filename = path.basename(picfile)

        print('正在识别%s' % filename)

        with open(picfile, 'rb') as f:  # 以二进制读取本地图片

            data = f.read()

            encodestr = str(base64.b64encode(data), 'utf-8')

        dict = {'img': encodestr}

        html = posturl(url_request, data=dict)

        os.remove(picfile)

        html1 = json.loads(html)

        # print(html)

        # print(type(html))

        lst = []

        # print(html1['prism_wordsInfo'])

        for i in html1['prism_wordsInfo']:

            if i.get('pos'):

                i.pop('pos')

            for k, v in i.items():

                lst.append(v)

        # print(lst)

        str1 = ','.join(lst)

        print(str1)

    os.removedirs(outdir)

以下仅为个人意见：

我主要考虑的是有道和阿里：在准确度上差别不是很大，阿里稍微准确一丢丢

　　　　　　　　　　　　　价格方面阿里是有道的两倍左右(阿里的为高精度文字识别)

　　　　　　　　　　　　　速度上阿里更快一些。

如果你最近在考虑OCR的问题，请进来~~~的更多相关文章

如果你的unordered_map头文件报错请看这里
请将include<unordered_map>头文件换成下面代码 #if(__cplusplus == 201103L) #include <unordered_map> # ...
谈谈书本《c#物联网程序设计基础》中的技术瑕疵，如果你将要读本书，请进来看看！
今天去书店看到一本名为<c#物联网程序设计基础>的书,对物联网感兴趣的我抓起来就看,书中的项目都是上位机开发项目,较简单,如果物联网开发只是这样,看起来我做物联网开发也是绰绰有余.这边书我 ...
阿里巴巴-OS事业群-OS手机事业部-系统服务部门招聘Java开发工程师，有意者请进来
我是阿里巴巴-OS事业群-OS手机事业部-系统服务部的开发工程师,正在招聘Java开发工程师. 以下是职位描述: 岗位名称:Java开发工程师招聘人数:5人生效日期:2014-03-12 结束日期 ...
说说我在项目中为什么不用实体框架,如果说我在诋毁你所爱的EF,请进来.
1.坑多. 这一点没有人会否定.当然你可以说你很牛,但事实不会因为你牛就可以说不存在.从博客园中的博问中大家关于EF的提问量就问题的怪异程度就可以看出来. 1.Entity Framework 查询历 ...
C\C++各路高手以及操作系统专家请进来杀死这个进程
通常情况下编写一个程序,能够点击关闭button正常结束程序,也能够使用任务管理器结束任务,还能够使用taskkill等命令杀死进程,实在都不行也能够直接重新启动计算机. 可是,这些方法真的都管用吗? ...
【MongoDB】从入门到精通mongdb系列学习宝典，想学mongodb小伙伴请进来
最近一段时间在学习MongoDB,在学习过程中总共编写了四十余篇博客.从mongodb软件下载到分片集群的搭建. 从理论讲解到实例练习.现在把所有博客的内容做个简单目录,方便阅读的小伙伴查询. 一. ...
Postman SMTP 存在跨站脚本（XSS）漏洞，请换用Post SMTP Mailer/Email Log
Postman SMTP 是一个安装量超过10W的WordPress插件,但是已经2年多没有更新,2017年6月29日,被发现存在跨站脚本(XSS)漏洞(查看详情),并且作者一直没有更新,所以被从Wo ...
毕业N年后，请不要像我一样被档案烦死
目录一. 提醒大学生:深刻重视档案,避免以后麻烦! 二.说说我因为档案造成的烦心事! 三.说说档案这档子事: 四.档案如此重要,为什么有些人却成了弃档族? 五.档案该怎么操作才能不当"弃档 ...
[转自老马的文章]用MODI OCR 21种语言
作者:马健邮箱:stronghorse_mj@hotmail.com发布:2007.12.08更新:2012.07.09按照<MODI中的OCR模块>一文相关内容进行修订2012.07.0 ...

随机推荐

mybatis框架入门程序：演示通过mybatis实现数据库的删除操作
1.mybatis的基本配置工作可以在我的这篇博客中查看:https://www.cnblogs.com/wyhluckdog/p/10149480.html 2.删除用户的映射文件: <!-- ...
利率计算v2.0--web版--软件工程
.客户说:帮我开发一个复利计算软件. .如果按照单利计算,本息又是多少呢? .假如30年之后要筹措到300万元的养老金,平均的年回报率是3%,那么,现在必须投入的本金是多少呢? .利率这么低,复利计算 ...
WebClient使用与IIS7最大上传文件--升级&引导窗口&目录同步完整解决方法
IIS7最大上传文件说明:http://www.mzwu.com/article.asp?id=2449 WebClient使用说明使用using 及时回收资源 using(var wc=new W ...
网络中的A、B、C类地址
1.A类ip地址(1.0.0.0到126.255.255.255) A类地址只有第一个8位表示网络地址,最高位一定为0,所以A类地址的网络号范围可以为:64+32+16+8+4+2+1=127,也就是 ...
SDK管理利器——sdkman
SDK管理利器--sdkman 项目使用java的开发者一定会为新配环境变量而头大,sdkman很好的解决了系统sdk管理的痛点,仅需简单的几行命令就可以完成sdk的安装,更改默认版本.再也不用担心环 ...
underscore collections
1._.each(list, iterator, [context]):对集合中每一元素执行处理器方法. 如果传递了context参数,则把iterator绑定到context对象上.每次调用iter ...
handsontable-developer guide-setting options,callback
1.cell数组 cell: [ {row: 0, col: 0, readOnly: true} ] 2.cells函数 cells: function(row, col, prop){ var c ...
[C#]获取当前程序运行路径的方法集合(转)
//获取当前进程的完整路径,包含文件名(进程名).string str = this.GetType().Assembly.Location;result: X:\xxx\xxx\xxx.exe (. ...
通过一个例子感受C# 6.0新特性
微软在Visual Studio 2015中更新C#语言到6.0,添加了很多很好的特性,以使C#语言继续跻身于最优秀语言之行列.下面通过一个例子快速感受一下C# 6.0的新特性,以下程序在VS2015 ...
字体变色详解链接：https://www.cnblogs.com/daofaziran/p/9015284.html
格式:\033[显示方式;前景色;背景色m + 结尾部分:\033[0m 字体色 | 背景色 | 颜色描述 ------------------------------------------- 30 ...

如果你最近在考虑OCR的问题，请进来~~~

如果你最近在考虑OCR的问题，请进来~~~的更多相关文章

随机推荐

热门专题