8sa1-gcc/libjava/gnu/gcj/convert/natOutput_EUCJIS.cc
Per Bothner 7b824de381 JIS0201.h: New file, generated from Unicode table.
�
	* gnu/gcj/convert/JIS0201.h:  New file, generated from Unicode table.
	* gnu/gcj/convert/Input_JavaSrc.java: New BytesToUnicode class.
	* gnu/gcj/convert/Input_SJIS.java: New BytesToUnicode class.
	* gnu/gcj/convert/Output_EUCJIS.java:  New UnicodeToBytes class.
	* gnu/gcj/convert/Output_SJIS.java:  New UnicodeToBytes class.
	* gnu/gcj/convert/natInput_EUCJIS.cc:  New file.
	* gnu/gcj/convert/natInput_SJIS.cc:  New file.
	* gnu/gcj/convert/natOutput_EUCJIS.cc:  New file.
	* gnu/gcj/convert/natOutput_SJIS.cc:  New file.
	* gnu/gcj/convert/make-trie.c:  New file: functions to make a trie.
	* gnu/gcj/convert/gen-from-JIS.c:  Invoke make-trie for output.
	* gnu/gcj/convert/Unicode_to_JIS.cc:  New generated trie table.

From-SVN: r26501
1999-04-16 10:25:08 -07:00

103 lines
2.4 KiB
C++

/* Copyright (C) 1999 Cygnus Solutions
This file is part of libgcj.
This software is copyrighted work licensed under the terms of the
Libgcj License. Please consult the file "LIBGCJ_LICENSE" for
details. */
#include <config.h>
#include <cni.h>
#include <gnu/gcj/convert/Output_EUCJIS.h>
/* A trie structure to map unicode values to JIS codes.
* code == -1: the character is undefined.
* code >= 0 && code < 128: JIS-Roman - mostly Ascii.
* code >= 128 && code < 256: Half-width Katakana.
* code >= 256 && code < 0x8000: JIS X 0208:1997.
* code >= 0x8000 && code < 0xFFFF: JIX X 0212-1990.
*/
extern unsigned short Unicode_to_JIS[];
int
trie_lookup (unsigned short *trie, unsigned short key)
{
unsigned short branch = trie[(key >> 12) & 0xf];
if (branch == 0)
return -1;
branch = trie[branch + ((key >> 8) & 0xf)];
if (branch == 0)
return -1;
branch = trie[branch + ((key >> 4) & 0xf)];
if (branch == 0)
return -1;
return trie[branch + (key & 0xf)];
}
static jint
convert_TO_EUCJIS (gnu::gcj::convert::Output_EUCJIS *encoder,
jchar *ptr, jint inlength)
{
int orig_inlength = inlength;
jint outbuf_length = encoder->buf->length;
for (;;)
{
if (encoder->count >= outbuf_length)
break;
if (encoder->pending1 >= 0)
{
elements(encoder->buf)[encoder->count++] = encoder->pending1;
encoder->pending1 = encoder->pending2;
encoder->pending2 = -1;
continue;
}
if (inlength == 0)
break;
jchar ch = *ptr++;
inlength--;
unsigned short val = trie_lookup(Unicode_to_JIS, ch);
if (val < 0x80)
{
if (val == 0xffff)
val = '?';
}
else if (val <= 0xFF)
{
encoder->pending1 = val;
encoder->pending2 = -1;
val = 0x8e;
}
else if (val < 0x8000)
{
val |= 0x8080;
encoder->pending1 = val & 0xff;
val = val >> 8;
encoder->pending2 = -1;
}
else
{
val |= 0x8080;
encoder->pending1 = val >> 8;
encoder->pending2 = val & 0xff;
val = 0x8f;
}
elements(encoder->buf)[encoder->count++] = val;
}
return orig_inlength - inlength;
}
jint
gnu::gcj::convert::Output_EUCJIS::write (jcharArray inbuffer,
jint inpos, jint inlength)
{
return convert_TO_EUCJIS(this, &elements(inbuffer)[inpos], inlength);
}
jint
gnu::gcj::convert::Output_EUCJIS::write (jstring str, jint inpos,
jint inlength, jcharArray)
{
return convert_TO_EUCJIS(this, _Jv_GetStringChars(str)+inpos, inlength);
}