字符编码 utf-8 与 gb2312之间的转换
字符编码查询 汉字字符集编码查询
设备之间的收发端使用的gb2312, 比如“早”字编码为(D4E7), 而网络下载的txt文件的编码为utf-8
为了比较这两类文件,需要转化到统一的编码,这里将 utf-8转化为gb2312
C 实现
//代码转换:从一种编码转为另一种编码
static int code_convert(char * from_charset, char * to_charset, char * inbuf, size_t inlen, char * outbuf, size_t outlen)
{
iconv_t cd;
char **pin = &inbuf;
char **pout = &outbuf;
int ret ;
cd = iconv_open(to_charset, from_charset);
if(cd == (iconv_t)-1)
{
perror("open iconv_open failed");
return -1;
}
memset(outbuf,0,outlen);
ret = iconv(cd, (char **)pin, &inlen, (char **)pout, &outlen);
if( ret < 0)
{
perror("iconv failed");
iconv_close(cd); /*by zyy*/
return -1;
}
iconv_close(cd);
return 0;
}
/*UTF-8 码转为GB2312码*/
static int u2g(char *inbuf, size_t inlen, char *outbuf, size_t outlen)
{
int ret;
ret =code_convert("UTF-8","GBK//IGNORE",inbuf,inlen,outbuf,outlen);
return ret;
}