summaryrefslogtreecommitdiffstats
path: root/Modules/cjkcodecs/_euc_jisx0213.c
diff options
context:
space:
mode:
Diffstat (limited to 'Modules/cjkcodecs/_euc_jisx0213.c')
-rw-r--r--Modules/cjkcodecs/_euc_jisx0213.c180
1 files changed, 180 insertions, 0 deletions
diff --git a/Modules/cjkcodecs/_euc_jisx0213.c b/Modules/cjkcodecs/_euc_jisx0213.c
new file mode 100644
index 0000000..3f7fbd7
--- /dev/null
+++ b/Modules/cjkcodecs/_euc_jisx0213.c
@@ -0,0 +1,180 @@
+/*
+ * _euc_jisx0213.c: the EUC-JISX0213 codec
+ *
+ * Written by Hye-Shik Chang <perky@FreeBSD.org>
+ * $CJKCodecs: _euc_jisx0213.c,v 1.2 2003/12/31 05:46:55 perky Exp $
+ */
+
+#define USING_BINARY_PAIR_SEARCH
+#include "codeccommon.h"
+#include "map_jisx0213_pairs.h"
+
+ENCMAP(jisxcommon)
+DECMAP(jisx0208)
+DECMAP(jisx0212)
+ENCMAP(jisx0213_bmp)
+DECMAP(jisx0213_1_bmp)
+DECMAP(jisx0213_2_bmp)
+ENCMAP(jisx0213_emp)
+DECMAP(jisx0213_1_emp)
+DECMAP(jisx0213_2_emp)
+
+#define EMPBASE 0x20000
+
+ENCODER(euc_jisx0213)
+{
+ while (inleft > 0) {
+ ucs4_t c = IN1;
+ DBCHAR code;
+ int insize;
+
+ if (c < 0x80) {
+ WRITE1(c)
+ NEXT(1, 1)
+ continue;
+ }
+
+ DECODE_SURROGATE(c)
+ insize = GET_INSIZE(c);
+
+ if (c <= 0xFFFF) {
+ /* try 0213 first because it might have MULTIC */
+ TRYMAP_ENC(jisx0213_bmp, code, c) {
+ if (code == MULTIC) {
+ if (inleft < 2) {
+ if (flags & MBENC_FLUSH) {
+ code = find_pairencmap(c, 0, jisx0213_pairencmap,
+ JISX0213_ENCPAIRS);
+ if (code == DBCINV)
+ return 1;
+ } else
+ return MBERR_TOOFEW;
+ } else {
+ code = find_pairencmap(c, (*inbuf)[1],
+ jisx0213_pairencmap, JISX0213_ENCPAIRS);
+ if (code == DBCINV) {
+ code = find_pairencmap(c, 0, jisx0213_pairencmap,
+ JISX0213_ENCPAIRS);
+ if (code == DBCINV)
+ return 1;
+ } else
+ insize = 2;
+ }
+ }
+ } else TRYMAP_ENC(jisxcommon, code, c);
+ else if (c >= 0xff61 && c <= 0xff9f) {
+ /* JIS X 0201 half-width katakana */
+ WRITE2(0x8e, c - 0xfec0)
+ NEXT(1, 2)
+ continue;
+ } else if (c == 0xff3c)
+ /* F/W REVERSE SOLIDUS (see NOTES.euc-jisx0213) */
+ code = 0x2140;
+ else if (c == 0xff5e)
+ /* F/W TILDE (see NOTES.euc-jisx0213) */
+ code = 0x2232;
+ else
+ return 1;
+ } else if (c >> 16 == EMPBASE >> 16) {
+ TRYMAP_ENC(jisx0213_emp, code, c & 0xffff);
+ else return insize;
+ } else
+ return insize;
+
+ if (code & 0x8000) {
+ /* Codeset 2 */
+ WRITE3(0x8f, code >> 8, (code & 0xFF) | 0x80)
+ NEXT(insize, 3)
+ } else {
+ /* Codeset 1 */
+ WRITE2((code >> 8) | 0x80, (code & 0xFF) | 0x80)
+ NEXT(insize, 2)
+ }
+ }
+
+ return 0;
+}
+
+DECODER(euc_jisx0213)
+{
+ while (inleft > 0) {
+ unsigned char c = IN1;
+ ucs4_t code;
+
+ RESERVE_OUTBUF(1)
+
+ if (c < 0x80) {
+ OUT1(c)
+ NEXT(1, 1)
+ continue;
+ }
+
+ if (c == 0x8e) {
+ /* JIS X 0201 half-width katakana */
+ unsigned char c2;
+
+ RESERVE_INBUF(2)
+ c2 = IN2;
+ if (c2 >= 0xa1 && c2 <= 0xdf) {
+ OUT1(0xfec0 + c2)
+ NEXT(2, 1)
+ } else
+ return 2;
+ } else if (c == 0x8f) {
+ unsigned char c2, c3;
+
+ RESERVE_INBUF(3)
+ c2 = IN2 ^ 0x80;
+ c3 = IN3 ^ 0x80;
+
+ /* JIS X 0213 Plane 2 or JIS X 0212 (see NOTES.euc-jisx0213) */
+ TRYMAP_DEC(jisx0213_2_bmp, **outbuf, c2, c3) ;
+ else TRYMAP_DEC(jisx0213_2_emp, code, c2, c3) {
+ PUTUCS4(EMPBASE | code)
+ NEXT_IN(3)
+ continue;
+ } else TRYMAP_DEC(jisx0212, **outbuf, c2, c3) ;
+ else return 3;
+ NEXT(3, 1)
+ } else {
+ unsigned char c2;
+
+ RESERVE_INBUF(2)
+ c ^= 0x80;
+ c2 = IN2 ^ 0x80;
+
+ /* JIS X 0213 Plane 1 */
+ if (c == 0x21 && c2 == 0x40) **outbuf = 0xff3c;
+ else if (c == 0x22 && c2 == 0x32) **outbuf = 0xff5e;
+ else TRYMAP_DEC(jisx0208, **outbuf, c, c2);
+ else TRYMAP_DEC(jisx0213_1_bmp, **outbuf, c, c2);
+ else TRYMAP_DEC(jisx0213_1_emp, code, c, c2) {
+ PUTUCS4(EMPBASE | code)
+ NEXT_IN(2)
+ continue;
+ } else TRYMAP_DEC(jisx0213_pair, code, c, c2) {
+ WRITE2(code >> 16, code & 0xffff)
+ NEXT(2, 2)
+ continue;
+ } else return 2;
+ NEXT(2, 1)
+ }
+ }
+
+ return 0;
+}
+
+#include "codecentry.h"
+BEGIN_CODEC_REGISTRY(euc_jisx0213)
+ MAPOPEN(ja_JP)
+ IMPORTMAP_ENC(jisxcommon)
+ IMPORTMAP_DEC(jisx0208)
+ IMPORTMAP_DEC(jisx0212)
+ IMPORTMAP_ENC(jisx0213_bmp)
+ IMPORTMAP_DEC(jisx0213_1_bmp)
+ IMPORTMAP_DEC(jisx0213_2_bmp)
+ IMPORTMAP_ENC(jisx0213_emp)
+ IMPORTMAP_DEC(jisx0213_1_emp)
+ IMPORTMAP_DEC(jisx0213_2_emp)
+ MAPCLOSE()
+END_CODEC_REGISTRY(euc_jisx0213)