/* Mirror of https://github.com/python/cpython -- 181 lines, 5.2 KiB, C */
/*
 * _euc_jisx0213.c: the EUC-JISX0213 codec
 *
 * Written by Hye-Shik Chang <perky@FreeBSD.org>
 * $CJKCodecs: _euc_jisx0213.c,v 1.2 2003/12/31 05:46:55 perky Exp $
 */

/*
 * Must be defined before codeccommon.h is included.
 * NOTE(review): presumably this is what makes find_pairencmap(), used by
 * the encoder below, available -- confirm in codeccommon.h.
 */
#define USING_BINARY_PAIR_SEARCH
#include "codeccommon.h"
/* Supplies the pair tables referenced below (jisx0213_pairencmap,
 * JISX0213_ENCPAIRS, and presumably the jisx0213_pair decode map). */
#include "map_jisx0213_pairs.h"

ENCMAP(jisxcommon)
|
|
DECMAP(jisx0208)
|
|
DECMAP(jisx0212)
|
|
ENCMAP(jisx0213_bmp)
|
|
DECMAP(jisx0213_1_bmp)
|
|
DECMAP(jisx0213_2_bmp)
|
|
ENCMAP(jisx0213_emp)
|
|
DECMAP(jisx0213_1_emp)
|
|
DECMAP(jisx0213_2_emp)
|
|
|
|
#define EMPBASE 0x20000
|
|
|
|
ENCODER(euc_jisx0213)
|
|
{
|
|
while (inleft > 0) {
|
|
ucs4_t c = IN1;
|
|
DBCHAR code;
|
|
int insize;
|
|
|
|
if (c < 0x80) {
|
|
WRITE1(c)
|
|
NEXT(1, 1)
|
|
continue;
|
|
}
|
|
|
|
DECODE_SURROGATE(c)
|
|
insize = GET_INSIZE(c);
|
|
|
|
if (c <= 0xFFFF) {
|
|
/* try 0213 first because it might have MULTIC */
|
|
TRYMAP_ENC(jisx0213_bmp, code, c) {
|
|
if (code == MULTIC) {
|
|
if (inleft < 2) {
|
|
if (flags & MBENC_FLUSH) {
|
|
code = find_pairencmap((ucs2_t)c, 0,
|
|
jisx0213_pairencmap, JISX0213_ENCPAIRS);
|
|
if (code == DBCINV)
|
|
return 1;
|
|
} else
|
|
return MBERR_TOOFEW;
|
|
} else {
|
|
code = find_pairencmap((ucs2_t)c, (*inbuf)[1],
|
|
jisx0213_pairencmap, JISX0213_ENCPAIRS);
|
|
if (code == DBCINV) {
|
|
code = find_pairencmap((ucs2_t)c, 0,
|
|
jisx0213_pairencmap, JISX0213_ENCPAIRS);
|
|
if (code == DBCINV)
|
|
return 1;
|
|
} else
|
|
insize = 2;
|
|
}
|
|
}
|
|
} else TRYMAP_ENC(jisxcommon, code, c);
|
|
else if (c >= 0xff61 && c <= 0xff9f) {
|
|
/* JIS X 0201 half-width katakana */
|
|
WRITE2(0x8e, c - 0xfec0)
|
|
NEXT(1, 2)
|
|
continue;
|
|
} else if (c == 0xff3c)
|
|
/* F/W REVERSE SOLIDUS (see NOTES.euc-jisx0213) */
|
|
code = 0x2140;
|
|
else if (c == 0xff5e)
|
|
/* F/W TILDE (see NOTES.euc-jisx0213) */
|
|
code = 0x2232;
|
|
else
|
|
return 1;
|
|
} else if (c >> 16 == EMPBASE >> 16) {
|
|
TRYMAP_ENC(jisx0213_emp, code, c & 0xffff);
|
|
else return insize;
|
|
} else
|
|
return insize;
|
|
|
|
if (code & 0x8000) {
|
|
/* Codeset 2 */
|
|
WRITE3(0x8f, code >> 8, (code & 0xFF) | 0x80)
|
|
NEXT(insize, 3)
|
|
} else {
|
|
/* Codeset 1 */
|
|
WRITE2((code >> 8) | 0x80, (code & 0xFF) | 0x80)
|
|
NEXT(insize, 2)
|
|
}
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
DECODER(euc_jisx0213)
|
|
{
|
|
while (inleft > 0) {
|
|
unsigned char c = IN1;
|
|
ucs4_t code;
|
|
|
|
RESERVE_OUTBUF(1)
|
|
|
|
if (c < 0x80) {
|
|
OUT1(c)
|
|
NEXT(1, 1)
|
|
continue;
|
|
}
|
|
|
|
if (c == 0x8e) {
|
|
/* JIS X 0201 half-width katakana */
|
|
unsigned char c2;
|
|
|
|
RESERVE_INBUF(2)
|
|
c2 = IN2;
|
|
if (c2 >= 0xa1 && c2 <= 0xdf) {
|
|
OUT1(0xfec0 + c2)
|
|
NEXT(2, 1)
|
|
} else
|
|
return 2;
|
|
} else if (c == 0x8f) {
|
|
unsigned char c2, c3;
|
|
|
|
RESERVE_INBUF(3)
|
|
c2 = IN2 ^ 0x80;
|
|
c3 = IN3 ^ 0x80;
|
|
|
|
/* JIS X 0213 Plane 2 or JIS X 0212 (see NOTES.euc-jisx0213) */
|
|
TRYMAP_DEC(jisx0213_2_bmp, **outbuf, c2, c3) ;
|
|
else TRYMAP_DEC(jisx0213_2_emp, code, c2, c3) {
|
|
PUTUCS4(EMPBASE | code)
|
|
NEXT_IN(3)
|
|
continue;
|
|
} else TRYMAP_DEC(jisx0212, **outbuf, c2, c3) ;
|
|
else return 3;
|
|
NEXT(3, 1)
|
|
} else {
|
|
unsigned char c2;
|
|
|
|
RESERVE_INBUF(2)
|
|
c ^= 0x80;
|
|
c2 = IN2 ^ 0x80;
|
|
|
|
/* JIS X 0213 Plane 1 */
|
|
if (c == 0x21 && c2 == 0x40) **outbuf = 0xff3c;
|
|
else if (c == 0x22 && c2 == 0x32) **outbuf = 0xff5e;
|
|
else TRYMAP_DEC(jisx0208, **outbuf, c, c2);
|
|
else TRYMAP_DEC(jisx0213_1_bmp, **outbuf, c, c2);
|
|
else TRYMAP_DEC(jisx0213_1_emp, code, c, c2) {
|
|
PUTUCS4(EMPBASE | code)
|
|
NEXT_IN(2)
|
|
continue;
|
|
} else TRYMAP_DEC(jisx0213_pair, code, c, c2) {
|
|
WRITE2(code >> 16, code & 0xffff)
|
|
NEXT(2, 2)
|
|
continue;
|
|
} else return 2;
|
|
NEXT(2, 1)
|
|
}
|
|
}
|
|
|
|
return 0;
|
|
}
|
|
|
|
/*
 * Codec registration for euc_jisx0213.  The registry macros come from
 * codecentry.h.  Every map declared with ENCMAP()/DECMAP() near the top of
 * this file has a matching IMPORTMAP_ENC()/IMPORTMAP_DEC() entry here.
 * NOTE(review): MAPOPEN(ja_JP) presumably names the module that provides
 * these maps -- confirm in codecentry.h.
 */
#include "codecentry.h"
BEGIN_CODEC_REGISTRY(euc_jisx0213)
    MAPOPEN(ja_JP)
        IMPORTMAP_ENC(jisxcommon)
        IMPORTMAP_DEC(jisx0208)
        IMPORTMAP_DEC(jisx0212)
        IMPORTMAP_ENC(jisx0213_bmp)
        IMPORTMAP_DEC(jisx0213_1_bmp)
        IMPORTMAP_DEC(jisx0213_2_bmp)
        IMPORTMAP_ENC(jisx0213_emp)
        IMPORTMAP_DEC(jisx0213_1_emp)
        IMPORTMAP_DEC(jisx0213_2_emp)
    MAPCLOSE()
END_CODEC_REGISTRY(euc_jisx0213)