基于Poco的UTF8、UTF16、GBK、Hex之间的转换

/******Encoding.h*******/

#include "Poco/UnicodeConverter.h"

#include "Poco/Exception.h"

#include "Poco/DigestEngine.h"

#define MyLib_API Foundation_API

using namespace Poco;

POCO_DECLARE_EXCEPTION(MyLib_API, EncodeException, Exception)

class Encoding

{

public:

    enum ByteOrderType

    {

        BIG_ENDIAN_BYTE_ORDER,

        LITTLE_ENDIAN_BYTE_ORDER,

        UNKNOW

    };

    static void GBKToUTF16(const std::string& gbkString, std::wstring& utf16String) throw(EncodeException);

    static void UTF16ToGBK(const std::wstring& utf16String, std::string& gbkString) throw(EncodeException);

    static void UTF8ToUTF16(const std::string& utf8String, std::wstring& utf16String) throw(EncodeException);

    static void UTF16ToUTF8(const std::wstring& utf16String, std::string& utf8String) throw(EncodeException);

    static void UTF8ToGBK(const std::string& utf8String, std::string& gbkString) throw(EncodeException);

    static void GBKToUTF8(const std::string& gbkString, std::string& utf8String) throw(EncodeException);

    static void EncodeHexString(const std::string& bytes, std::string& hexString);

    static void DecodeHexString(const std::string& hexString, std::string& bytes);

    static void EncodeHexString(const std::wstring& bytes, std::string& hexString);

    static void DecodeHexString(const std::string& hexString, std::wstring& bytes);

    static ByteOrderType GetCurrentByteOrder();

private:

    static Poco::UnicodeConverter _unicodeConverter;

    static ByteOrderType _currentByteOrder;

};

/********Encoding.cpp********/#include "Encoding.h"

#include "Poco/NumberParser.h"

Poco::UnicodeConverter Encoding::_unicodeConverter;

Encoding::ByteOrderType Encoding::_currentByteOrder;

POCO_IMPLEMENT_EXCEPTION(EncodeException, Poco::Exception, "Encoding error")

void Encoding::GBKToUTF16(const std::string& gbkString, std::wstring& utf16String)

{

    //获得需要分配的空间大小

    int size = MultiByteToWideChar(, , gbkString.c_str(), -, NULL, );

    std::vector<wchar_t> buff(size);

    if(MultiByteToWideChar(, , gbkString.c_str(), -, buff.data(), size) == )

    {

        //throw a exception

        throw EncodeException("GBK convert to UTF16 failed", GetLastError());

    }

    if(!utf16String.empty())

        utf16String.clear();

    utf16String.append(buff.data(), buff.size());

}

void Encoding::UTF16ToGBK(const std::wstring& utf16String, std::string& gbkString)

{

    int size = ;

    //获得需要分配的空间大小

    size = WideCharToMultiByte(, , utf16String.c_str(), -, NULL, , NULL, NULL);

    std::vector<char> buff(size);

    if(WideCharToMultiByte(, , utf16String.c_str(), -, buff.data(), size, NULL, NULL) == )

        throw EncodeException("UTF16 convert to GBK failed", GetLastError());

    if(!gbkString.empty())

        gbkString.clear();

    gbkString.append(buff.data(), buff.size());

}

void Encoding::UTF8ToUTF16(const std::string& utf8String, std::wstring& utf16String)

{

    std::string errorMessage;

    try

    {

        _unicodeConverter.toUTF16(utf8String, utf16String);

    }

    catch(Poco::Exception &e)

    {

        errorMessage.append("UTF8 convert to UTF16 failed, ");

        errorMessage.append(e.message());

    }

    if(!errorMessage.empty())

        throw EncodeException(errorMessage, GetLastError());

}

void Encoding::UTF16ToUTF8(const std::wstring& utf16String, std::string& utf8String)

{

    std::string errorMessage;

    try

    {

        _unicodeConverter.toUTF8(utf16String, utf8String);

    }

    catch(Poco::Exception &e)

    {

        errorMessage.append("UTF8 convert to UTF16 failed, ");

        errorMessage.append(e.message());

    }

    if(!errorMessage.empty())

        throw EncodeException(errorMessage, GetLastError());

}

void Encoding::UTF8ToGBK(const std::string& utf8String, std::string& gbkString)

{

    std::wstring utf16String;

    std::string errorMessage;

    try

    {

        _unicodeConverter.toUTF16(utf8String, utf16String);

        UTF16ToGBK(utf16String, gbkString);

    }

    catch(EncodeException)

    {

        errorMessage = "UTF8 convert to GBK failed";

    }

    catch(Poco::Exception &e)

    {

        errorMessage.append("UTF8 convert to UTF16 failed, ");

        errorMessage.append(e.message());

    }

    if(!errorMessage.empty())

        throw EncodeException(errorMessage, GetLastError());

}

void Encoding::GBKToUTF8(const std::string& gbkString, std::string& utf8String)

{

    std::wstring utf16String;

    std::string errorMessage;

    try

    {

        GBKToUTF16(gbkString, utf16String);

        _unicodeConverter.toUTF8(utf16String, utf8String);

    }

    catch(EncodeException)

    {

        errorMessage = "GBK convert to UTF8 failed";

    }

    catch(Poco::Exception &e)

    {

        errorMessage.append("UTF8 convert to UTF16 failed, ");

        errorMessage.append(e.message());

    }

    if(!errorMessage.empty())

        throw EncodeException(errorMessage, GetLastError());

}

void Encoding::EncodeHexString(const std::string& bytes, std::string& hexString)

{

    if(!hexString.empty())

        hexString.clear();

    Poco::DigestEngine::Digest digest(bytes.begin(), bytes.end());

    hexString = Poco::DigestEngine::digestToHex(digest);

}

void Encoding::DecodeHexString(const std::string& hexString, std::string& bytes)

{

    unsigned int _value;

    if(!bytes.empty())

        bytes.clear();

    for(std::string::size_type i = , j = ; i <  hexString.length(); i+=)

    {

        if(NumberParser::tryParseHex(hexString.substr(i, ), _value))

            bytes.push_back(_value);

    }

}

void Encoding::EncodeHexString(const std::wstring& utf16String, std::string& hexString)

{

    if(!hexString.empty())

        hexString.clear();

    Poco::DigestEngine::Digest digest;

    for(auto iter = utf16String.begin(); iter != utf16String.end(); ++iter)

    {

        const unsigned char* ptr = (const unsigned char*)&*iter;

        if(GetCurrentByteOrder() == BIG_ENDIAN_BYTE_ORDER)

        {

            digest.push_back(*ptr);

            digest.push_back(*(ptr + ));

        }

        else if(GetCurrentByteOrder() == LITTLE_ENDIAN_BYTE_ORDER)

        {

            digest.push_back(*(ptr + ));

            digest.push_back(*ptr);

        }

        else

            return;

    }

    hexString = Poco::DigestEngine::digestToHex(digest);

}

void Encoding::DecodeHexString(const std::string& hexString, std::wstring& utf16String)

{

    unsigned int _value;

    if(!utf16String.empty())

        utf16String.clear();

    for(std::string::size_type i = , j = ; i <  hexString.length(); i+=)

    {

        if(NumberParser::tryParseHex(hexString.substr(i, ), _value))

            utf16String.push_back(_value);

    }

}

Encoding::ByteOrderType Encoding::GetCurrentByteOrder()

{

    static bool flag = false;

    if(flag)

        return _currentByteOrder;

    union

    {

        char16_t s;

        char c[];

    }un;

    un.s = 0x0102;

    if(un.c[] ==  && un.c[] == )

        _currentByteOrder = BIG_ENDIAN_BYTE_ORDER;

    else if(un.c[] ==  && un.c[] == )

        _currentByteOrder = LITTLE_ENDIAN_BYTE_ORDER;

    else

        _currentByteOrder = UNKNOW;

    flag = true;

    return _currentByteOrder;

}

基于Poco的UTF8、UTF16、GBK、Hex之间的转换的更多相关文章

UTF-8和GBK编码之间的区别(页面编码、数据库编码区别)以及在实际项目中的应用
第一节:UTF-8和GBK编码概述 UTF-8 (8-bit Unicode Transformation Format) 是一种针对Unicode的可变长度字符编码,又称万国码,它包含全世界所有国家 ...
ASC与HEX之间的转换
ASC与HEX之间的转换有这么两个函数: 函数原型功能返回值参数备注 hex2asc __int16 hex2asc(unsigned char *strhex,unsigned char ...
C#中的Byte，String，Int，Hex之间的转换函数。
/// <summary> Convert a string of hex digits (ex: E4 CA B2) to a byte array. </summary> ...
ascii、unicode、utf-8、gbk区别及转换
一.编码 ascii: A:00000010 8位一个字节 unicode: A:00000000 00000001 00000010 00000100 32位四个字节中:00000000 00 ...
ascii、unicode、utf-8、gbk 区别？
发展史: https://www.cnblogs.com/houxt/p/11250878.html python2内容进行编码(默认ascii),而python3对内容进行编码的默认为utf-8. ...
UTF8,UTF16,UTF32,UTF16-LE,UTF16-BE,GBK 之间的转换
Unicode是Unicode.org制定的编码标准,目前得到了绝大部分操作系统和编程语言的支持.Unicode.org官方对Unicode的定义是:Unicode provides a unique ...
字符编码之间的相互转换 UTF8与GBK(转载)
转载自http://www.cnblogs.com/azraelly/archive/2012/06/21/2558360.html UTF8与GBK字符编码之间的相互转换 C++ UTF8编码转换 ...
【miscellaneous】【C/C++语言】UTF8与GBK字符编码之间的相互转换
UTF8与GBK字符编码之间的相互转换 C++ UTF8编码转换 CChineseCode 一预备知识 1,字符:字符是抽象的最小文本单位.它没有固定的形状(可能是一个字形),而且没有值." ...
UNICODE与UTF8和GBK之间的关系
http://wenku.baidu.com/link?url=bheGEzfSjEx-QX-ciME5oKooKYE08_NJZ02l2kKFa7kVZJ4t8Ks2uSNByovgP2QL6btq ...

随机推荐

Clojure 的 Enlive 库尝试
Enlive 是一个 Clojure 下的 html 模板引擎.其特别之处在于,它既没有发明任何 html 内嵌的模板 DSL 语法:也不会混杂代码和表现. 一切的一切,都是按下列模型定义的次序执行的 ...
vim：关于映射和跳出括号
先说如何自动补全. 命令:vim .vimrc inoremap ( ()<ESC>i inoremap [ []<ESC>i inoremap { {}<ESC> ...
Aurora 8B/10B、PCIe 2.0、SRIO 2.0三种协议比较
在高性能雷达信号处理机研制中,高速串行总线正逐步取代并行总线.业界广泛使用的Xilinx公司Virtex-6系列FPGA支持多种高速串行通信协议,本文针对其中较为常用的Aurora 8B/10B和PC ...
linux进程 kipmi0
top 发现负载很低,没有连接的时候,一个进程经常跳到最前面,用户是root, 命令是 kipmi0 , 后来查询了一下,很可能是外部设备要使用到的 IPMI , 智能型平台管理接口(Intell ...
什么是WMS系统金蝶仓库条码管理WMS系统介绍
汉码盘点机-专注于傻瓜式的仓库条码管理系统,是当前出入库工作效率最高.数据最准确的仓库管理办法. "WMS,即q=%E4%BB%93%E5%BA%93%E7%AE%A1%E7%90%86%E ...
ORACLE 多列合并成一行数据 WM_CONCAT函数以及REPLACE
WM_CONCAT()方法注意字符长度 SELECT BERTHCODE,tpf.freedatetype, ( SELECT WM_CONCAT(SBPT.PARKSTIME||'~'||SBPT ...
使用base64:url 来定义背景图片url
普通的背景图片css是这样的: background-image:url(http://www.zhangxinxu.com/wordpress/wp-content/themes/default/i ...
linux命令（30）：tail
linux ---tail命令 linux中tail命令---用于查看文件内容最基本的是cat.more和less. 1. 如果你只想看文件的前5行,可以使用head命令,如: head -5 /e ...
HttpClient 教程 (一)
转自:http://www.cnblogs.com/loveyakamoz/archive/2011/07/21/2112804.html HttpClient 教程 (一) 前言超文本传输协议 ...
工厂模式——（Head first设计模式4）
所谓工厂,肯定是和生产有关.工厂模式主要包括工厂方法模式和抽象工厂模式,有些人把简单工厂也作为一种模式,在本文我分别讨论简单工厂模式,工厂方法模式,抽象工厂模式.这些模式中同样也和生产有关.接下来,我 ...

基于Poco的UTF8、UTF16、GBK、Hex之间的转换

基于Poco的UTF8、UTF16、GBK、Hex之间的转换的更多相关文章

随机推荐

热门专题