|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
*/ |
|
|
|
package sun.nio.cs; |
|
|
|
import java.nio.ByteBuffer; |
|
import java.nio.CharBuffer; |
|
import java.nio.charset.Charset; |
|
import java.nio.charset.CharsetDecoder; |
|
import java.nio.charset.CharsetEncoder; |
|
import java.nio.charset.CoderResult; |
|
import java.util.Arrays; |
|
import sun.nio.cs.DoubleByte; |
|
import sun.nio.cs.Surrogate; |
|
import static sun.nio.cs.CharsetMapping.*; |
|
|
|
public class HKSCS { |
|
|
|
public static class Decoder extends DoubleByte.Decoder { |
|
static int b2Min = 0x40; |
|
static int b2Max = 0xfe; |
|
|
|
private char[][] b2cBmp; |
|
private char[][] b2cSupp; |
|
private DoubleByte.Decoder big5Dec; |
|
|
|
protected Decoder(Charset cs, |
|
DoubleByte.Decoder big5Dec, |
|
char[][] b2cBmp, char[][] b2cSupp) |
|
{ |
|
// super(cs, 0.5f, 1.0f); |
|
// need to extends DoubleByte.Decoder so the |
|
|
|
super(cs, 0.5f, 1.0f, null, null, 0, 0, true); |
|
this.big5Dec = big5Dec; |
|
this.b2cBmp = b2cBmp; |
|
this.b2cSupp = b2cSupp; |
|
} |
|
|
|
public char decodeSingle(int b) { |
|
return big5Dec.decodeSingle(b); |
|
} |
|
|
|
public char decodeBig5(int b1, int b2) { |
|
return big5Dec.decodeDouble(b1, b2); |
|
} |
|
|
|
public char decodeDouble(int b1, int b2) { |
|
return b2cBmp[b1][b2 - b2Min]; |
|
} |
|
|
|
public char decodeDoubleEx(int b1, int b2) { |
|
|
|
|
|
|
|
|
|
*/ |
|
return b2cSupp[b1][b2 - b2Min]; |
|
} |
|
|
|
protected CoderResult decodeArrayLoop(ByteBuffer src, CharBuffer dst) { |
|
byte[] sa = src.array(); |
|
int sp = src.arrayOffset() + src.position(); |
|
int sl = src.arrayOffset() + src.limit(); |
|
|
|
char[] da = dst.array(); |
|
int dp = dst.arrayOffset() + dst.position(); |
|
int dl = dst.arrayOffset() + dst.limit(); |
|
|
|
try { |
|
while (sp < sl) { |
|
int b1 = sa[sp] & 0xff; |
|
char c = decodeSingle(b1); |
|
int inSize = 1, outSize = 1; |
|
char[] cc = null; |
|
if (c == UNMAPPABLE_DECODING) { |
|
if (sl - sp < 2) |
|
return CoderResult.UNDERFLOW; |
|
int b2 = sa[sp + 1] & 0xff; |
|
inSize++; |
|
if (b2 < b2Min || b2 > b2Max) |
|
return CoderResult.unmappableForLength(2); |
|
c = decodeDouble(b1, b2); |
|
if (c == UNMAPPABLE_DECODING) { |
|
c = decodeDoubleEx(b1, b2); |
|
if (c == UNMAPPABLE_DECODING) { |
|
c = decodeBig5(b1, b2); |
|
if (c == UNMAPPABLE_DECODING) |
|
return CoderResult.unmappableForLength(2); |
|
} else { |
|
|
|
outSize = 2; |
|
} |
|
} |
|
} |
|
if (dl - dp < outSize) |
|
return CoderResult.OVERFLOW; |
|
if (outSize == 2) { |
|
|
|
da[dp++] = Surrogate.high(0x20000 + c); |
|
da[dp++] = Surrogate.low(0x20000 + c); |
|
} else { |
|
da[dp++] = c; |
|
} |
|
sp += inSize; |
|
} |
|
return CoderResult.UNDERFLOW; |
|
} finally { |
|
src.position(sp - src.arrayOffset()); |
|
dst.position(dp - dst.arrayOffset()); |
|
} |
|
} |
|
|
|
protected CoderResult decodeBufferLoop(ByteBuffer src, CharBuffer dst) { |
|
int mark = src.position(); |
|
try { |
|
while (src.hasRemaining()) { |
|
char[] cc = null; |
|
int b1 = src.get() & 0xff; |
|
int inSize = 1, outSize = 1; |
|
char c = decodeSingle(b1); |
|
if (c == UNMAPPABLE_DECODING) { |
|
if (src.remaining() < 1) |
|
return CoderResult.UNDERFLOW; |
|
int b2 = src.get() & 0xff; |
|
inSize++; |
|
if (b2 < b2Min || b2 > b2Max) |
|
return CoderResult.unmappableForLength(2); |
|
c = decodeDouble(b1, b2); |
|
if (c == UNMAPPABLE_DECODING) { |
|
c = decodeDoubleEx(b1, b2); |
|
if (c == UNMAPPABLE_DECODING) { |
|
c = decodeBig5(b1, b2); |
|
if (c == UNMAPPABLE_DECODING) |
|
return CoderResult.unmappableForLength(2); |
|
} else { |
|
outSize = 2; |
|
} |
|
} |
|
} |
|
if (dst.remaining() < outSize) |
|
return CoderResult.OVERFLOW; |
|
if (outSize == 2) { |
|
dst.put(Surrogate.high(0x20000 + c)); |
|
dst.put(Surrogate.low(0x20000 + c)); |
|
} else { |
|
dst.put(c); |
|
} |
|
mark += inSize; |
|
} |
|
return CoderResult.UNDERFLOW; |
|
} finally { |
|
src.position(mark); |
|
} |
|
} |
|
|
|
public int decode(byte[] src, int sp, int len, char[] dst) { |
|
int dp = 0; |
|
int sl = sp + len; |
|
char repl = replacement().charAt(0); |
|
while (sp < sl) { |
|
int b1 = src[sp++] & 0xff; |
|
char c = decodeSingle(b1); |
|
if (c == UNMAPPABLE_DECODING) { |
|
if (sl == sp) { |
|
c = repl; |
|
} else { |
|
int b2 = src[sp++] & 0xff; |
|
if (b2 < b2Min || b2 > b2Max) { |
|
c = repl; |
|
} else if ((c = decodeDouble(b1, b2)) == UNMAPPABLE_DECODING) { |
|
c = decodeDoubleEx(b1, b2); |
|
if (c == UNMAPPABLE_DECODING) { |
|
c = decodeBig5(b1, b2); |
|
if (c == UNMAPPABLE_DECODING) |
|
c = repl; |
|
} else { |
|
|
|
dst[dp++] = Surrogate.high(0x20000 + c); |
|
dst[dp++] = Surrogate.low(0x20000 + c); |
|
continue; |
|
} |
|
} |
|
} |
|
} |
|
dst[dp++] = c; |
|
} |
|
return dp; |
|
} |
|
|
|
public CoderResult decodeLoop(ByteBuffer src, CharBuffer dst) { |
|
if (src.hasArray() && dst.hasArray()) |
|
return decodeArrayLoop(src, dst); |
|
else |
|
return decodeBufferLoop(src, dst); |
|
} |
|
|
|
public static void initb2c(char[][]b2c, String[] b2cStr) |
|
{ |
|
for (int i = 0; i < b2cStr.length; i++) { |
|
if (b2cStr[i] == null) |
|
b2c[i] = DoubleByte.B2C_UNMAPPABLE; |
|
else |
|
b2c[i] = b2cStr[i].toCharArray(); |
|
} |
|
} |
|
|
|
} |
|
|
|
public static class Encoder extends DoubleByte.Encoder { |
|
private DoubleByte.Encoder big5Enc; |
|
private char[][] c2bBmp; |
|
private char[][] c2bSupp; |
|
|
|
protected Encoder(Charset cs, |
|
DoubleByte.Encoder big5Enc, |
|
char[][] c2bBmp, |
|
char[][] c2bSupp) |
|
{ |
|
super(cs, null, null, true); |
|
this.big5Enc = big5Enc; |
|
this.c2bBmp = c2bBmp; |
|
this.c2bSupp = c2bSupp; |
|
} |
|
|
|
public int encodeBig5(char ch) { |
|
return big5Enc.encodeChar(ch); |
|
} |
|
|
|
public int encodeChar(char ch) { |
|
int bb = c2bBmp[ch >> 8][ch & 0xff]; |
|
if (bb == UNMAPPABLE_ENCODING) |
|
return encodeBig5(ch); |
|
return bb; |
|
} |
|
|
|
public int encodeSupp(int cp) { |
|
if ((cp & 0xf0000) != 0x20000) |
|
return UNMAPPABLE_ENCODING; |
|
return c2bSupp[(cp >> 8) & 0xff][cp & 0xff]; |
|
} |
|
|
|
public boolean canEncode(char c) { |
|
return encodeChar(c) != UNMAPPABLE_ENCODING; |
|
} |
|
|
|
protected CoderResult encodeArrayLoop(CharBuffer src, ByteBuffer dst) { |
|
char[] sa = src.array(); |
|
int sp = src.arrayOffset() + src.position(); |
|
int sl = src.arrayOffset() + src.limit(); |
|
|
|
byte[] da = dst.array(); |
|
int dp = dst.arrayOffset() + dst.position(); |
|
int dl = dst.arrayOffset() + dst.limit(); |
|
|
|
try { |
|
while (sp < sl) { |
|
char c = sa[sp]; |
|
int inSize = 1; |
|
int bb = encodeChar(c); |
|
if (bb == UNMAPPABLE_ENCODING) { |
|
if (Character.isSurrogate(c)) { |
|
int cp; |
|
if ((cp = sgp().parse(c, sa, sp, sl)) < 0) |
|
return sgp.error(); |
|
bb = encodeSupp(cp); |
|
if (bb == UNMAPPABLE_ENCODING) |
|
return CoderResult.unmappableForLength(2); |
|
inSize = 2; |
|
} else { |
|
return CoderResult.unmappableForLength(1); |
|
} |
|
} |
|
if (bb > MAX_SINGLEBYTE) { |
|
if (dl - dp < 2) |
|
return CoderResult.OVERFLOW; |
|
da[dp++] = (byte)(bb >> 8); |
|
da[dp++] = (byte)bb; |
|
} else { |
|
if (dl - dp < 1) |
|
return CoderResult.OVERFLOW; |
|
da[dp++] = (byte)bb; |
|
} |
|
sp += inSize; |
|
} |
|
return CoderResult.UNDERFLOW; |
|
} finally { |
|
src.position(sp - src.arrayOffset()); |
|
dst.position(dp - dst.arrayOffset()); |
|
} |
|
} |
|
|
|
protected CoderResult encodeBufferLoop(CharBuffer src, ByteBuffer dst) { |
|
int mark = src.position(); |
|
try { |
|
while (src.hasRemaining()) { |
|
int inSize = 1; |
|
char c = src.get(); |
|
int bb = encodeChar(c); |
|
if (bb == UNMAPPABLE_ENCODING) { |
|
if (Character.isSurrogate(c)) { |
|
int cp; |
|
if ((cp = sgp().parse(c, src)) < 0) |
|
return sgp.error(); |
|
bb = encodeSupp(cp); |
|
if (bb == UNMAPPABLE_ENCODING) |
|
return CoderResult.unmappableForLength(2); |
|
inSize = 2; |
|
} else { |
|
return CoderResult.unmappableForLength(1); |
|
} |
|
} |
|
if (bb > MAX_SINGLEBYTE) { |
|
if (dst.remaining() < 2) |
|
return CoderResult.OVERFLOW; |
|
dst.put((byte)(bb >> 8)); |
|
dst.put((byte)(bb)); |
|
} else { |
|
if (dst.remaining() < 1) |
|
return CoderResult.OVERFLOW; |
|
dst.put((byte)bb); |
|
} |
|
mark += inSize; |
|
} |
|
return CoderResult.UNDERFLOW; |
|
} finally { |
|
src.position(mark); |
|
} |
|
} |
|
|
|
protected CoderResult encodeLoop(CharBuffer src, ByteBuffer dst) { |
|
if (src.hasArray() && dst.hasArray()) |
|
return encodeArrayLoop(src, dst); |
|
else |
|
return encodeBufferLoop(src, dst); |
|
} |
|
|
|
private byte[] repl = replacement(); |
|
protected void implReplaceWith(byte[] newReplacement) { |
|
repl = newReplacement; |
|
} |
|
|
|
public int encode(char[] src, int sp, int len, byte[] dst) { |
|
int dp = 0; |
|
int sl = sp + len; |
|
while (sp < sl) { |
|
char c = src[sp++]; |
|
int bb = encodeChar(c); |
|
if (bb == UNMAPPABLE_ENCODING) { |
|
if (!Character.isHighSurrogate(c) || sp == sl || |
|
!Character.isLowSurrogate(src[sp]) || |
|
(bb = encodeSupp(Character.toCodePoint(c, src[sp++]))) |
|
== UNMAPPABLE_ENCODING) { |
|
dst[dp++] = repl[0]; |
|
if (repl.length > 1) |
|
dst[dp++] = repl[1]; |
|
continue; |
|
} |
|
} |
|
if (bb > MAX_SINGLEBYTE) { |
|
dst[dp++] = (byte)(bb >> 8); |
|
dst[dp++] = (byte)bb; |
|
} else { |
|
dst[dp++] = (byte)bb; |
|
} |
|
} |
|
return dp; |
|
} |
|
|
|
public int encodeFromUTF16(byte[] src, int sp, int len, byte[] dst) { |
|
int dp = 0; |
|
int sl = sp + len; |
|
int dl = dst.length; |
|
while (sp < sl) { |
|
char c = StringUTF16.getChar(src, sp++); |
|
int bb = encodeChar(c); |
|
if (bb == UNMAPPABLE_ENCODING) { |
|
if (!Character.isHighSurrogate(c) || sp == sl || |
|
!Character.isLowSurrogate(StringUTF16.getChar(src,sp)) || |
|
(bb = encodeSupp(Character.toCodePoint(c, StringUTF16.getChar(src, sp++)))) |
|
== UNMAPPABLE_ENCODING) { |
|
dst[dp++] = repl[0]; |
|
if (repl.length > 1) |
|
dst[dp++] = repl[1]; |
|
continue; |
|
} |
|
} |
|
if (bb > MAX_SINGLEBYTE) { |
|
dst[dp++] = (byte)(bb >> 8); |
|
dst[dp++] = (byte)bb; |
|
} else { |
|
dst[dp++] = (byte)bb; |
|
} |
|
} |
|
return dp; |
|
} |
|
|
|
static char[] C2B_UNMAPPABLE = new char[0x100]; |
|
static { |
|
Arrays.fill(C2B_UNMAPPABLE, (char)UNMAPPABLE_ENCODING); |
|
} |
|
|
|
public static void initc2b(char[][] c2b, String[] b2cStr, String pua) { |
|
|
|
int b2Min = 0x40; |
|
Arrays.fill(c2b, C2B_UNMAPPABLE); |
|
for (int b1 = 0; b1 < 0x100; b1++) { |
|
String s = b2cStr[b1]; |
|
if (s == null) |
|
continue; |
|
for (int i = 0; i < s.length(); i++) { |
|
char c = s.charAt(i); |
|
if (c == UNMAPPABLE_DECODING) |
|
continue; |
|
int hi = c >> 8; |
|
if (c2b[hi] == C2B_UNMAPPABLE) { |
|
c2b[hi] = new char[0x100]; |
|
Arrays.fill(c2b[hi], (char)UNMAPPABLE_ENCODING); |
|
} |
|
c2b[hi][c & 0xff] = (char)((b1 << 8) | (i + b2Min)); |
|
} |
|
} |
|
if (pua != null) { // add the compatibility pua entries |
|
char c = '\ue000'; |
|
for (int i = 0; i < pua.length(); i++) { |
|
char bb = pua.charAt(i); |
|
if (bb != UNMAPPABLE_DECODING) { |
|
int hi = c >> 8; |
|
if (c2b[hi] == C2B_UNMAPPABLE) { |
|
c2b[hi] = new char[0x100]; |
|
Arrays.fill(c2b[hi], (char)UNMAPPABLE_ENCODING); |
|
} |
|
c2b[hi][c & 0xff] = bb; |
|
} |
|
c++; |
|
} |
|
} |
|
} |
|
} |
|
} |