add Big5 charset support to iconv

at this point, it is just the common base charset equivalent to
Windows CP 950, with no further extensions. HKSCS and possibly other
supersets will be added later. other aliases may need to be added too.
This commit is contained in:
Rich Felker 2013-08-07 13:16:14 -04:00
parent 983acebc8a
commit 19b4a0a20e
2 changed files with 1066 additions and 0 deletions

1048
src/locale/big5.h Normal file

File diff suppressed because it is too large Load Diff

View File

@ -20,6 +20,7 @@
#define GB18030 0330
#define GBK 0331
#define GB2312 0332
#define BIG5 0340
#define EUC_KR 0350
/* FIXME: these are not implemented yet
@ -48,6 +49,7 @@ static const unsigned char charmaps[] =
"gb18030\0\0\330"
"gbk\0\0\331"
"gb2312\0\0\332"
"big5\0bigfive\0cp950\0\0\340"
"euckr\0ksc5601\0ksx1001\0cp949\0\0\350"
#include "codepages.h"
;
@ -64,6 +66,10 @@ static const unsigned short gb18030[126][190] = {
#include "gb18030.h"
};
static const unsigned short big5[89][157] = {
#include "big5.h"
};
static const unsigned short ksc[93][94] = {
#include "ksc.h"
};
@ -284,6 +290,18 @@ size_t iconv(iconv_t cd0, char **restrict in, size_t *restrict inb, char **restr
if (d>63) d--;
c = gb18030[c][d];
break;
case BIG5:
l = 2;
if (*inb < 2) goto starved;
d = *((unsigned char *)*in + 1);
if (c-0xa1>=0xfa-0xa1) goto ilseq;
c -= 0xa1;
if (d-0x40>=0xff-0x40 || d-0x7f<0xa1-0x7f) goto ilseq;
d -= 0x40;
if (d > 0x3e) d -= 0x22;
c = big5[c][d];
if (!c) goto ilseq;
break;
case EUC_KR:
l = 2;
if (*inb < 2) goto starved;