| /* |
| * Copyright (c) 2010, 2013, Oracle and/or its affiliates. All rights reserved. |
| * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. |
| * |
| * This code is free software; you can redistribute it and/or modify it |
| * under the terms of the GNU General Public License version 2 only, as |
| * published by the Free Software Foundation. Oracle designates this |
| * particular file as subject to the "Classpath" exception as provided |
| * by Oracle in the LICENSE file that accompanied this code. |
| * |
| * This code is distributed in the hope that it will be useful, but WITHOUT |
| * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or |
| * FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License |
| * version 2 for more details (a copy is included in the LICENSE file that |
| * accompanied this code). |
| * |
| * You should have received a copy of the GNU General Public License version |
| * 2 along with this work; if not, write to the Free Software Foundation, |
| * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA. |
| * |
| * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA |
| * or visit www.oracle.com if you need additional information or have any |
| * questions. |
| */ |
| |
| package sun.nio.cs; |
| |
| import java.nio.ByteBuffer; |
| import java.nio.CharBuffer; |
| import java.nio.charset.Charset; |
| import java.nio.charset.CharsetDecoder; |
| import java.nio.charset.CharsetEncoder; |
| import java.nio.charset.CoderResult; |
| import java.util.Arrays; |
| import sun.nio.cs.DoubleByte; |
| import sun.nio.cs.Surrogate; |
| import static sun.nio.cs.CharsetMapping.*; |
| |
| public class HKSCS { |
| |
| public static class Decoder extends DoubleByte.Decoder { |
| static int b2Min = 0x40; |
| static int b2Max = 0xfe; |
| |
| private char[][] b2cBmp; |
| private char[][] b2cSupp; |
| private DoubleByte.Decoder big5Dec; |
| |
| protected Decoder(Charset cs, |
| DoubleByte.Decoder big5Dec, |
| char[][] b2cBmp, char[][] b2cSupp) |
| { |
| // super(cs, 0.5f, 1.0f); |
| // need to extends DoubleByte.Decoder so the |
| // sun.io can use it. this implementation |
| super(cs, 0.5f, 1.0f, null, null, 0, 0, true); |
| this.big5Dec = big5Dec; |
| this.b2cBmp = b2cBmp; |
| this.b2cSupp = b2cSupp; |
| } |
| |
| public char decodeSingle(int b) { |
| return big5Dec.decodeSingle(b); |
| } |
| |
| public char decodeBig5(int b1, int b2) { |
| return big5Dec.decodeDouble(b1, b2); |
| } |
| |
| public char decodeDouble(int b1, int b2) { |
| return b2cBmp[b1][b2 - b2Min]; |
| } |
| |
| public char decodeDoubleEx(int b1, int b2) { |
| /* if the b2cSupp is null, the subclass need |
| to override the methold |
| if (b2cSupp == null) |
| return UNMAPPABLE_DECODING; |
| */ |
| return b2cSupp[b1][b2 - b2Min]; |
| } |
| |
| protected CoderResult decodeArrayLoop(ByteBuffer src, CharBuffer dst) { |
| byte[] sa = src.array(); |
| int sp = src.arrayOffset() + src.position(); |
| int sl = src.arrayOffset() + src.limit(); |
| |
| char[] da = dst.array(); |
| int dp = dst.arrayOffset() + dst.position(); |
| int dl = dst.arrayOffset() + dst.limit(); |
| |
| try { |
| while (sp < sl) { |
| int b1 = sa[sp] & 0xff; |
| char c = decodeSingle(b1); |
| int inSize = 1, outSize = 1; |
| char[] cc = null; |
| if (c == UNMAPPABLE_DECODING) { |
| if (sl - sp < 2) |
| return CoderResult.UNDERFLOW; |
| int b2 = sa[sp + 1] & 0xff; |
| inSize++; |
| if (b2 < b2Min || b2 > b2Max) |
| return CoderResult.unmappableForLength(2); |
| c = decodeDouble(b1, b2); //bmp |
| if (c == UNMAPPABLE_DECODING) { |
| c = decodeDoubleEx(b1, b2); //supp |
| if (c == UNMAPPABLE_DECODING) { |
| c = decodeBig5(b1, b2); //big5 |
| if (c == UNMAPPABLE_DECODING) |
| return CoderResult.unmappableForLength(2); |
| } else { |
| // supplementary character in u+2xxxx area |
| outSize = 2; |
| } |
| } |
| } |
| if (dl - dp < outSize) |
| return CoderResult.OVERFLOW; |
| if (outSize == 2) { |
| // supplementary characters |
| da[dp++] = Surrogate.high(0x20000 + c); |
| da[dp++] = Surrogate.low(0x20000 + c); |
| } else { |
| da[dp++] = c; |
| } |
| sp += inSize; |
| } |
| return CoderResult.UNDERFLOW; |
| } finally { |
| src.position(sp - src.arrayOffset()); |
| dst.position(dp - dst.arrayOffset()); |
| } |
| } |
| |
| protected CoderResult decodeBufferLoop(ByteBuffer src, CharBuffer dst) { |
| int mark = src.position(); |
| try { |
| while (src.hasRemaining()) { |
| char[] cc = null; |
| int b1 = src.get() & 0xff; |
| int inSize = 1, outSize = 1; |
| char c = decodeSingle(b1); |
| if (c == UNMAPPABLE_DECODING) { |
| if (src.remaining() < 1) |
| return CoderResult.UNDERFLOW; |
| int b2 = src.get() & 0xff; |
| inSize++; |
| if (b2 < b2Min || b2 > b2Max) |
| return CoderResult.unmappableForLength(2); |
| c = decodeDouble(b1, b2); //bmp |
| if (c == UNMAPPABLE_DECODING) { |
| c = decodeDoubleEx(b1, b2); //supp |
| if (c == UNMAPPABLE_DECODING) { |
| c = decodeBig5(b1, b2); //big5 |
| if (c == UNMAPPABLE_DECODING) |
| return CoderResult.unmappableForLength(2); |
| } else { |
| outSize = 2; |
| } |
| } |
| } |
| if (dst.remaining() < outSize) |
| return CoderResult.OVERFLOW; |
| if (outSize == 2) { |
| dst.put(Surrogate.high(0x20000 + c)); |
| dst.put(Surrogate.low(0x20000 + c)); |
| } else { |
| dst.put(c); |
| } |
| mark += inSize; |
| } |
| return CoderResult.UNDERFLOW; |
| } finally { |
| src.position(mark); |
| } |
| } |
| |
| public int decode(byte[] src, int sp, int len, char[] dst) { |
| int dp = 0; |
| int sl = sp + len; |
| char repl = replacement().charAt(0); |
| while (sp < sl) { |
| int b1 = src[sp++] & 0xff; |
| char c = decodeSingle(b1); |
| if (c == UNMAPPABLE_DECODING) { |
| if (sl == sp) { |
| c = repl; |
| } else { |
| int b2 = src[sp++] & 0xff; |
| if (b2 < b2Min || b2 > b2Max) { |
| c = repl; |
| } else if ((c = decodeDouble(b1, b2)) == UNMAPPABLE_DECODING) { |
| c = decodeDoubleEx(b1, b2); //supp |
| if (c == UNMAPPABLE_DECODING) { |
| c = decodeBig5(b1, b2); //big5 |
| if (c == UNMAPPABLE_DECODING) |
| c = repl; |
| } else { |
| // supplementary character in u+2xxxx area |
| dst[dp++] = Surrogate.high(0x20000 + c); |
| dst[dp++] = Surrogate.low(0x20000 + c); |
| continue; |
| } |
| } |
| } |
| } |
| dst[dp++] = c; |
| } |
| return dp; |
| } |
| |
| public CoderResult decodeLoop(ByteBuffer src, CharBuffer dst) { |
| if (src.hasArray() && dst.hasArray()) |
| return decodeArrayLoop(src, dst); |
| else |
| return decodeBufferLoop(src, dst); |
| } |
| |
| public static void initb2c(char[][]b2c, String[] b2cStr) |
| { |
| for (int i = 0; i < b2cStr.length; i++) { |
| if (b2cStr[i] == null) |
| b2c[i] = DoubleByte.B2C_UNMAPPABLE; |
| else |
| b2c[i] = b2cStr[i].toCharArray(); |
| } |
| } |
| |
| } |
| |
| public static class Encoder extends DoubleByte.Encoder { |
| private DoubleByte.Encoder big5Enc; |
| private char[][] c2bBmp; |
| private char[][] c2bSupp; |
| |
| protected Encoder(Charset cs, |
| DoubleByte.Encoder big5Enc, |
| char[][] c2bBmp, |
| char[][] c2bSupp) |
| { |
| super(cs, null, null, true); |
| this.big5Enc = big5Enc; |
| this.c2bBmp = c2bBmp; |
| this.c2bSupp = c2bSupp; |
| } |
| |
| public int encodeBig5(char ch) { |
| return big5Enc.encodeChar(ch); |
| } |
| |
| public int encodeChar(char ch) { |
| int bb = c2bBmp[ch >> 8][ch & 0xff]; |
| if (bb == UNMAPPABLE_ENCODING) |
| return encodeBig5(ch); |
| return bb; |
| } |
| |
| public int encodeSupp(int cp) { |
| if ((cp & 0xf0000) != 0x20000) |
| return UNMAPPABLE_ENCODING; |
| return c2bSupp[(cp >> 8) & 0xff][cp & 0xff]; |
| } |
| |
| public boolean canEncode(char c) { |
| return encodeChar(c) != UNMAPPABLE_ENCODING; |
| } |
| |
| protected CoderResult encodeArrayLoop(CharBuffer src, ByteBuffer dst) { |
| char[] sa = src.array(); |
| int sp = src.arrayOffset() + src.position(); |
| int sl = src.arrayOffset() + src.limit(); |
| |
| byte[] da = dst.array(); |
| int dp = dst.arrayOffset() + dst.position(); |
| int dl = dst.arrayOffset() + dst.limit(); |
| |
| try { |
| while (sp < sl) { |
| char c = sa[sp]; |
| int inSize = 1; |
| int bb = encodeChar(c); |
| if (bb == UNMAPPABLE_ENCODING) { |
| if (Character.isSurrogate(c)) { |
| int cp; |
| if ((cp = sgp().parse(c, sa, sp, sl)) < 0) |
| return sgp.error(); |
| bb = encodeSupp(cp); |
| if (bb == UNMAPPABLE_ENCODING) |
| return CoderResult.unmappableForLength(2); |
| inSize = 2; |
| } else { |
| return CoderResult.unmappableForLength(1); |
| } |
| } |
| if (bb > MAX_SINGLEBYTE) { // DoubleByte |
| if (dl - dp < 2) |
| return CoderResult.OVERFLOW; |
| da[dp++] = (byte)(bb >> 8); |
| da[dp++] = (byte)bb; |
| } else { // SingleByte |
| if (dl - dp < 1) |
| return CoderResult.OVERFLOW; |
| da[dp++] = (byte)bb; |
| } |
| sp += inSize; |
| } |
| return CoderResult.UNDERFLOW; |
| } finally { |
| src.position(sp - src.arrayOffset()); |
| dst.position(dp - dst.arrayOffset()); |
| } |
| } |
| |
| protected CoderResult encodeBufferLoop(CharBuffer src, ByteBuffer dst) { |
| int mark = src.position(); |
| try { |
| while (src.hasRemaining()) { |
| int inSize = 1; |
| char c = src.get(); |
| int bb = encodeChar(c); |
| if (bb == UNMAPPABLE_ENCODING) { |
| if (Character.isSurrogate(c)) { |
| int cp; |
| if ((cp = sgp().parse(c, src)) < 0) |
| return sgp.error(); |
| bb = encodeSupp(cp); |
| if (bb == UNMAPPABLE_ENCODING) |
| return CoderResult.unmappableForLength(2); |
| inSize = 2; |
| } else { |
| return CoderResult.unmappableForLength(1); |
| } |
| } |
| if (bb > MAX_SINGLEBYTE) { // DoubleByte |
| if (dst.remaining() < 2) |
| return CoderResult.OVERFLOW; |
| dst.put((byte)(bb >> 8)); |
| dst.put((byte)(bb)); |
| } else { |
| if (dst.remaining() < 1) |
| return CoderResult.OVERFLOW; |
| dst.put((byte)bb); |
| } |
| mark += inSize; |
| } |
| return CoderResult.UNDERFLOW; |
| } finally { |
| src.position(mark); |
| } |
| } |
| |
| protected CoderResult encodeLoop(CharBuffer src, ByteBuffer dst) { |
| if (src.hasArray() && dst.hasArray()) |
| return encodeArrayLoop(src, dst); |
| else |
| return encodeBufferLoop(src, dst); |
| } |
| |
| private byte[] repl = replacement(); |
| protected void implReplaceWith(byte[] newReplacement) { |
| repl = newReplacement; |
| } |
| |
| public int encode(char[] src, int sp, int len, byte[] dst) { |
| int dp = 0; |
| int sl = sp + len; |
| while (sp < sl) { |
| char c = src[sp++]; |
| int bb = encodeChar(c); |
| if (bb == UNMAPPABLE_ENCODING) { |
| if (!Character.isHighSurrogate(c) || sp == sl || |
| !Character.isLowSurrogate(src[sp]) || |
| (bb = encodeSupp(Character.toCodePoint(c, src[sp++]))) |
| == UNMAPPABLE_ENCODING) { |
| dst[dp++] = repl[0]; |
| if (repl.length > 1) |
| dst[dp++] = repl[1]; |
| continue; |
| } |
| } |
| if (bb > MAX_SINGLEBYTE) { // DoubleByte |
| dst[dp++] = (byte)(bb >> 8); |
| dst[dp++] = (byte)bb; |
| } else { // SingleByte |
| dst[dp++] = (byte)bb; |
| } |
| } |
| return dp; |
| } |
| |
| public int encodeFromUTF16(byte[] src, int sp, int len, byte[] dst) { |
| int dp = 0; |
| int sl = sp + len; |
| int dl = dst.length; |
| while (sp < sl) { |
| char c = StringUTF16.getChar(src, sp++); |
| int bb = encodeChar(c); |
| if (bb == UNMAPPABLE_ENCODING) { |
| if (!Character.isHighSurrogate(c) || sp == sl || |
| !Character.isLowSurrogate(StringUTF16.getChar(src,sp)) || |
| (bb = encodeSupp(Character.toCodePoint(c, StringUTF16.getChar(src, sp++)))) |
| == UNMAPPABLE_ENCODING) { |
| dst[dp++] = repl[0]; |
| if (repl.length > 1) |
| dst[dp++] = repl[1]; |
| continue; |
| } |
| } |
| if (bb > MAX_SINGLEBYTE) { // DoubleByte |
| dst[dp++] = (byte)(bb >> 8); |
| dst[dp++] = (byte)bb; |
| } else { // SingleByte |
| dst[dp++] = (byte)bb; |
| } |
| } |
| return dp; |
| } |
| |
| static char[] C2B_UNMAPPABLE = new char[0x100]; |
| static { |
| Arrays.fill(C2B_UNMAPPABLE, (char)UNMAPPABLE_ENCODING); |
| } |
| |
| public static void initc2b(char[][] c2b, String[] b2cStr, String pua) { |
| // init c2b/c2bSupp from b2cStr and supp |
| int b2Min = 0x40; |
| Arrays.fill(c2b, C2B_UNMAPPABLE); |
| for (int b1 = 0; b1 < 0x100; b1++) { |
| String s = b2cStr[b1]; |
| if (s == null) |
| continue; |
| for (int i = 0; i < s.length(); i++) { |
| char c = s.charAt(i); |
| if (c == UNMAPPABLE_DECODING) |
| continue; |
| int hi = c >> 8; |
| if (c2b[hi] == C2B_UNMAPPABLE) { |
| c2b[hi] = new char[0x100]; |
| Arrays.fill(c2b[hi], (char)UNMAPPABLE_ENCODING); |
| } |
| c2b[hi][c & 0xff] = (char)((b1 << 8) | (i + b2Min)); |
| } |
| } |
| if (pua != null) { // add the compatibility pua entries |
| char c = '\ue000'; //first pua character |
| for (int i = 0; i < pua.length(); i++) { |
| char bb = pua.charAt(i); |
| if (bb != UNMAPPABLE_DECODING) { |
| int hi = c >> 8; |
| if (c2b[hi] == C2B_UNMAPPABLE) { |
| c2b[hi] = new char[0x100]; |
| Arrays.fill(c2b[hi], (char)UNMAPPABLE_ENCODING); |
| } |
| c2b[hi][c & 0xff] = bb; |
| } |
| c++; |
| } |
| } |
| } |
| } |
| } |