字符编码转换，utf16 utf8 ascii unicode

大小: 37KB

文件类型: .zip

金币: 2

下载: 0 次

发布日期: 2021-05-17
语言: 其他
标签: utf8 unicode utf16 ascii 编码转换

高速下载

资源简介

utf16 utf8 ascii unicode 所有代码都已经经过验证。而且里面也有相应的例子。所有的编码格式进行转换，windows平台。

资源截图

小图大图

代码片段和文件信息

#include “utfTools.h“
#include 
#include 
using namespace std;

CUtfTools* CUtfTools::getInstance（）
{
	static CUtfTools gCUtfTools;
	return &gCUtfTools;
}


CUtfTools::CUtfTools（）
{

}

CUtfTools::~CUtfTools（）
{

}

int CUtfTools::Utf16_To_Utf8（MYUTF16* sourceStart MYUTF8* targetStart size_t outLen ConversionFlags flags SourceDataByteOrder byteOrder）
{
	int result = 0;
	MYUTF16* source = sourceStart;
	MYUTF8* target = targetStart;
	MYUTF8* targetEnd = targetStart + outLen;

	if （（NULL == source） || （NULL == targetStart））{
		printf（“ERR Utf16_To_Utf8: source=%p targetStart=%p\n“ source targetStart）;
		return conversionFailed;
	}

	while （*source） {
		//网络上的数据都是大端，权重越大的数据优先传输
		if （byteOrder == BigEndian）
		{
			*source = ntohs（*source）;
		}
		MYUTF32 ch;
		unsigned short bytesToWrite = 0;
		const MYUTF32 byteMask = 0xBF;
		const MYUTF32 byteMark = 0x80;
		MYUTF16* oldSource = source; /* In case we have to back up because of target overflow. */
		ch = *source++;
		/* If we have a surrogate pair convert to UTF32 first. */
		if （ch >= UNI_SUR_HIGH_START && ch <= UNI_SUR_HIGH_END） {
			/* If the 16 bits following the high surrogate are in the source buffer... */
			if （*source）{
				MYUTF32 ch2 = *source;
				/* If it‘s a low surrogate convert to UTF32. */
				if （ch2 >= UNI_SUR_LOW_START && ch2 <= UNI_SUR_LOW_END） {
					ch = （（ch - UNI_SUR_HIGH_START） << halfShift） + （ch2 - UNI_SUR_LOW_START） + halfbase;
					++source;
				}
				else if （flags == strictConversion） { /* it‘s an unpaired high surrogate */
					--source; /* return to the illegal value itself */
					result = sourceIllegal;
					break;
				}
			}
			else { /* We don‘t have the 16 bits following the high surrogate. */
				--source; /* return to the high surrogate */
				result = sourceExhausted;
				break;
			}
		}
		else if （flags == strictConversion） {
			/* UTF-16 surrogate values are illegal in UTF-32 */
			if （ch >= UNI_SUR_LOW_START && ch <= UNI_SUR_LOW_END）{
				--source; /* return to the illegal value itself */
				result = sourceIllegal;
				break;
			}
		}
		/* Figure out how many bytes the result will require */
		if （ch < （MYUTF32）0x80）{
			bytesToWrite = 1;
		}
		else if （ch < （MYUTF32）0x800） {
			bytesToWrite = 2;
		}
		else if （ch < （MYUTF32）0x10000） {
			bytesToWrite = 3;
		}
		else if （ch < （MYUTF32）0x110000）{
			bytesToWrite = 4;
		}
		else {
			bytesToWrite = 3;
			ch = UNI_REPLACEMENT_CHAR;
		}

		target += bytesToWrite;
		if （target > targetEnd） {
			source = oldSource; /* Back up source pointer! */
			target -= bytesToWrite; result = targetExhausted; break;
		}
		switch （bytesToWrite） { /* note: everything falls through. */
		case 4: *--target = （MYUTF8）（（ch | byteMark） & byteMask）; ch >>= 6;
		case 3: *--target = （MYUTF8）（（ch | byteMark） & byteMask）; ch >>= 6;
		case 2: *--target = （MYUTF8）（（ch | byteMark） & byteMask）; ch >>= 6;
		case 1

属性            大小     日期    时间   名称
----------- ---------  ---------- -----  ----
     文件         320  2019-01-25 09:32  readMe.txt
     文件       16729  2019-01-25 09:17  utfTools.cpp
     文件        3762  2019-01-25 09:10  utfTools.h
     文件       33628  2019-01-25 09:33  字符编码.docx

共有条评论

字符编码转换，utf16 utf8 ascii unicode

资源简介

资源截图

代码片段和文件信息

评论

相关资源