欢迎您访问程序员文章站本站旨在为大家提供分享程序员计算机编程知识!
您现在的位置是: 首页  >  数据库

No2:luacom中文内容输出BUG及修正

程序员文章站 2022-06-17 12:41:14
...

使 用cell.Value2输出中文内容时总是乱码。怀疑是utf-8的原因,转换后结果仍然是乱码。自己再写个转换的再测试,依然是乱码,莫非有BUG!? 下个LUACOM的源码,查看函数 tLuaCOMTypeHandler::com2lua 和 tStringBuffer tUtil::bstr2string 。整个过程看起来

使用cell.Value2输出中文内容时总是乱码。怀疑是utf-8的原因,转换后结果仍然是乱码。自己再写个转换的再测试,依然是乱码,莫非有BUG!?

下个LUACOM的源码,查看函数tLuaCOMTypeHandler::com2luatStringBuffer tUtil::bstr2string。整个过程看起来都OK,但再测试发现,结果字符串少了一个bytes。

tLuaCOMTypeHandler::com2lua VT_BSTR分支中返回结果恰好是减去1,将其修改

lua_pushlstring(L, str, str.getSize()-1);修改为lua_pushlstring(L, str, str.getSize());

重新编译LUACOM,再看cell.Value2输出结果,终于正确了。由于没进行全面测试,不知道其此修改会不会引入错误。资源里有个已经编译好的。

--lc是从网上抄来的unicode utf-8 ansi相互转换的函数

package.cpath=[[C:\Program Files\Lua\5.1\clibs\?.dll;d:\loonlib\sample\lc\?.dll]]
require "luacom"
require "lc"

function print_table(t) for k,v in pairs(t) do print(k,v) end end
excel = luacom.CreateObject("Excel.Application")
excel.Visible = true
excel.Workbooks:Add();
--luacom.ViewTypeLib(excel);
sheet=excel.Sheets(1);
local r=sheet:Range("E6");

local s = "严中";
ws, s2=lc.a2w(s); --0x25 0x4e 0x2d 0x4e 0x00 0x00 6
print("unicode : " .. lc.bstr(ws, s2));
us, s2=lc.w2u(ws, s2); --0xe4 0xb8 0xa5 0xe4 0xb8 0xad 0x00 0x00 8
print("utf8 : " .. lc.bstr(us, s2));

r.Value2=us;
ws, s2=lc.u2w(r.Value2, s2);
print("unicode : " .. lc.bstr(ws, s2));
as, s2=lc.w2a(ws, s2);
print("ansi : " .. lc.bstr(as, s2));
print(as);

lc.def

LIBRARY	"lc"

EXPORTS
	luaopen_lc


lc.h

extern "C" {
#include "lua.h"
#include "lualib.h" 
#include "lauxlib.h"
int luaopen_local(lua_State* L);
}

#include 
#include 
#ifdef WIN32
#include 
#include 
#else
#include 
#endif


#define LN_lc "lc"
int lua_a2w(lua_State* L);
int lua_u2w(lua_State* L);
int lua_w2a(lua_State* L);
int lua_w2u(lua_State* L);
int lua_u2a(lua_State* L);
int lua_a2u(lua_State* L);
int lua_bstr(lua_State* L);

int lua_help(lua_State* L);
wchar_t* mb2wc(const char* mbstr, int& s2, int cp);
char* wc2mb(const wchar_t* wcstr, int& s2, int cp);


lc.cpp

#include "lc.h"
//g++ -shared -s -o lc.dll -O3 lc.cpp lc.def -llua5.1 -DWIN32 -I%loon%/lua/src -L%loon%/lib/gcc_dll/debug -Wl,--out-implib,liblc.a 

int lua_bstr(lua_State* L) {
	const char* s = luaL_optstring(L, 1, "");
	int len = luaL_optnumber(L, 2, 0);
	if (strcmp(s, "")==0 || 0==len) {
		lua_pushstring(L, s);
	} else {
		luaL_Buffer b;
		luaL_buffinit(L, &b);
		char* byte = (char*)malloc(64);
		for (int i=0; i0) {
		int s2 = 0;
		wchar_t* wcstr = mb2wc(mbstr, s2, CP_UTF8);
		if (wcstr) {
			lua_pushlstring(L, (const char*)wcstr, s2);
			lua_pushnumber(L, s2);
			delete[] wcstr;
			result = 2;
		}
	}
	return result;
}

int lua_a2w(lua_State* L) {
	int result = 0;
	size_t len = 0;
	const char* mbstr = lua_tolstring(L, 1, &len);
	if (mbstr && len>0) {
		int s2 = 0;
		wchar_t* wcstr = mb2wc(mbstr, s2, CP_ACP);
		if (wcstr) {
			lua_pushlstring(L, (const char*)wcstr, s2);
			lua_pushnumber(L, s2);
			delete[] wcstr;
			result = 2;
		}
	}
	return result;
}

int lua_w2a(lua_State* L) {
	int result = 0;
	size_t len = 0;
	const char* wcstr = lua_tolstring(L, 1, &len);
	if (wcstr && len>0) {
		int s2 = 0;
		char* mbstr = wc2mb((wchar_t*)wcstr, s2, CP_ACP);
		if (mbstr) {
			lua_pushlstring(L, mbstr, s2);
			lua_pushnumber(L, s2);
			delete[] mbstr;
			result = 2;
		}
	}
	return result;
}

int lua_w2u(lua_State* L) {
	int result = 0;
	size_t len = 0;
	const char* wcstr = lua_tolstring(L, 1, &len);
	if (wcstr && len>0) {
		int s2 = 0;
		char* mbstr = wc2mb((wchar_t*)wcstr, s2, CP_UTF8);
		if (mbstr) {
			lua_pushlstring(L, mbstr, s2);
			lua_pushnumber(L, s2);
			delete[] mbstr;
			result = 2;
		}
	}
	return result;
}

int lua_u2a(lua_State* L) {
	int result = 0;
	size_t len = 0;
	const char* mbstr = lua_tolstring(L, 1, &len);
	if (mbstr && len>0) {
		int s2 = 0;
		wchar_t* wcstr = mb2wc(mbstr, s2, CP_UTF8);
		if (wcstr) {
			char* nmbstr = wc2mb(wcstr, s2, CP_ACP);
			if (nmbstr) {
				lua_pushlstring(L, nmbstr, s2);
				lua_pushnumber(L, s2);
				result = 2;
				delete[] nmbstr;
			}
			delete[] wcstr;
		}
	}
	return result;
}

int lua_a2u(lua_State* L) {
	int result = 0;
	size_t len = 0;
	const char* mbstr = lua_tolstring(L, 1, &len);
	if (mbstr && len>0) {
		int s2 = 0;
		wchar_t* wcstr = mb2wc(mbstr, s2, CP_ACP);
		if (wcstr) {
			char* nmbstr = wc2mb(wcstr, s2, CP_UTF8);
			if (nmbstr) {
				lua_pushlstring(L, nmbstr, s2);
				lua_pushnumber(L, s2);
				result = 2;
				delete[] nmbstr;
			}
			delete[] wcstr;
		}
	}
	return result;
}

wchar_t* mb2wc(const char* mbstr, int& s2, int cp) {
	wchar_t* wcstr = NULL;
#ifdef WIN32
	int size = MultiByteToWideChar(cp, 0, mbstr, -1, NULL, 0);
#else
	size_t size = mbstowcs(NULL, mbstr, 0);
#endif
	wcstr = new wchar_t[size];
	if (wcstr) {
		memset(wcstr, 0, size * sizeof(wchar_t));
#ifdef WIN32
		int ret = MultiByteToWideChar(cp, 0, mbstr, -1, wcstr, size);
		if (ret == 0) { // MultiByteToWideChar returns 0 if it does not succeed.
#else
		size_t ret = mbstowcs(wcstr, mbstr, size+1);
		if (ret == -1) {
#endif
			delete[] wcstr;
			wcstr = NULL;
		}
		s2 = 2*size;
	}
	return wcstr;
}

char* wc2mb(const wchar_t* wcstr, int& s2, int cp) {
	char* mbstr = NULL;
#ifdef WIN32
	int size = WideCharToMultiByte(cp, 0, wcstr, -1, NULL, 0, NULL, NULL);
#else
	size_t size = wcstombs(NULL, wcstr, 0);
#endif
	mbstr = new char[size];
	if (mbstr) {
		memset(mbstr, 0, size * sizeof(char));
#ifdef WIN32
		int ret = WideCharToMultiByte(cp, 0, wcstr, -1, mbstr, size, NULL, NULL);
		if (ret == 0) { // MultiByteToWideChar returns 0 if it does not succeed.
#else
		size_t ret = wcstombs(mbstr, wcstr, size+1);
		if (ret == -1) {
#endif
			delete[] mbstr;
			mbstr = NULL;
		}
		s2 = size;
	}
	return mbstr;
}

int lua_help(lua_State* L) {
	const char* s= 
		"Simple Characters Transformation\n"
		"  a2w(ansi to unicode)\n"
		"  u2w(utf8 to unicode)\n"
		"  w2a(unicode to ansi)\n"
		"  w2u(unicode to utf8)\n"
		"  u2a(utf8 to ansi)\n"
		"  a2u(ansi to utf8)\n"
		"  bstr(bytes of str)\n"
		"  help(show this)\n\n"
		"  example :\n"
		"    local s = \"I like lua\"\n"
		"    print(lc.bstr(s, string.len(s)+1))\n"
		"    local ws, s2 = lc.a2w(s)\n"
		"wunoman@qq.com 2012/03/06\n"
		;
	lua_pushstring(L, s);

	return 1;
}

luaL_reg lrg_lc[] = {
	{"a2w", lua_a2w},
	{"u2w", lua_u2w},
	{"w2a", lua_w2a},
	{"w2u", lua_w2u},
	{"u2a", lua_u2a},
	{"a2u", lua_a2u},
	{"bstr", lua_bstr},
	{"help", lua_help},
    {NULL, NULL}
};

extern "C" int luaopen_lc(lua_State* L) {
    luaL_register(L, LN_lc, lrg_lc);
	return 1;
}