blob: 59dddef373ad24b036f717593ac888f9f8eaf04e [file] [log] [blame]
/*
* Copyright 1997-1999 Sun Microsystems, Inc. All Rights Reserved.
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
*
* This code is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License version 2 only, as
* published by the Free Software Foundation. Sun designates this
* particular file as subject to the "Classpath" exception as provided
* by Sun in the LICENSE file that accompanied this code.
*
* This code is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
* version 2 for more details (a copy is included in the LICENSE file that
* accompanied this code).
*
* You should have received a copy of the GNU General Public License version
* 2 along with this work; if not, write to the Free Software Foundation,
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
*
* Please contact Sun Microsystems, Inc., 4150 Network Circle, Santa Clara,
* CA 95054 USA or visit www.sun.com if you need additional information or
* have any questions.
*/
package sun.io;
public abstract class CharToByteDBCS_EBCDIC extends CharToByteConverter
{
private static final int SBCS = 0;
private static final int DBCS = 1;
private static final byte SO = 0x0e;
private static final byte SI = 0x0f;
private int currentState;
private char highHalfZoneCode;
private byte[] outputByte = new byte[2];
protected short index1[];
protected String index2;
protected String index2a;
protected int mask1;
protected int mask2;
protected int shift;
public CharToByteDBCS_EBCDIC() {
super();
highHalfZoneCode = 0;
currentState = SBCS;
}
/**
* flush out any residual data and reset the buffer state
*/
public int flush(byte [] output, int outStart, int outEnd)
throws MalformedInputException, ConversionBufferFullException
{
int bytesOut = 0;
if (highHalfZoneCode != 0) {
reset();
badInputLength = 0;
throw new MalformedInputException();
}
if (currentState == DBCS) {
if (outStart >= outEnd)
throw new ConversionBufferFullException();
output[outStart] = SI;
bytesOut++;
}
reset();
return bytesOut;
}
/**
* Character conversion
*/
public int convert(char[] input, int inOff, int inEnd,
byte[] output, int outOff, int outEnd)
throws UnknownCharacterException, MalformedInputException,
ConversionBufferFullException
{
char inputChar;
int inputSize;
byteOff = outOff;
charOff = inOff;
while(charOff < inEnd) {
int index;
int theBytes;
int spaceNeeded;
if (highHalfZoneCode == 0) {
inputChar = input[charOff];
inputSize = 1;
} else {
inputChar = highHalfZoneCode;
inputSize = 0;
highHalfZoneCode = 0;
}
// Is this a high surrogate?
if(inputChar >= '\ud800' && inputChar <= '\udbff') {
// Is this the last character of the input?
if (charOff + inputSize >= inEnd) {
highHalfZoneCode = inputChar;
charOff += inputSize;
break;
}
// Is there a low surrogate following?
inputChar = input[charOff + inputSize];
if (inputChar >= '\udc00' && inputChar <= '\udfff') {
// We have a valid surrogate pair. Too bad we don't do
// surrogates. Is substitution enabled?
if (subMode) {
if (subBytes.length == 1) {
outputByte[0] = 0x00;
outputByte[1] = subBytes[0];
}
else {
outputByte[0] = subBytes[0];
outputByte[1] = subBytes[1];
}
inputSize++;
} else {
badInputLength = 2;
throw new UnknownCharacterException();
}
} else {
// We have a malformed surrogate pair
badInputLength = 1;
throw new MalformedInputException();
}
}
// Is this an unaccompanied low surrogate?
else
if (inputChar >= '\uDC00' && inputChar <= '\uDFFF') {
badInputLength = 1;
throw new MalformedInputException();
} else {
// We have a valid character, get the bytes for it
index = index1[((inputChar & mask1) >> shift)] + (inputChar & mask2);
//System.out.println("Index for U+" + Integer.toHexString(inputChar) + " = " + index); // for debugging purposes
if (index < 15000)
theBytes = (int)(index2.charAt(index));
else
theBytes = (int)(index2a.charAt(index-15000));
outputByte[0] = (byte)((theBytes & 0x0000ff00)>>8);
outputByte[1] = (byte)(theBytes & 0x000000ff);
}
// if there was no mapping - look for substitution characters
if (outputByte[0] == 0x00 && outputByte[1] == 0x00
&& inputChar != '\u0000')
{
if (subMode) {
if (subBytes.length == 1) {
outputByte[0] = 0x00;
outputByte[1] = subBytes[0];
} else {
outputByte[0] = subBytes[0];
outputByte[1] = subBytes[1];
}
} else {
badInputLength = 1;
throw new UnknownCharacterException();
}
}
//Set the output buffer into the correct state
if (currentState == DBCS && outputByte[0] == 0x00) {
if (byteOff >= outEnd)
throw new ConversionBufferFullException();
currentState = SBCS;
output[byteOff++] = SI;
} else
if (currentState == SBCS && outputByte[0] != 0x00) {
if (byteOff >= outEnd) {
throw new ConversionBufferFullException();
}
currentState = DBCS;
output[byteOff++] = SO;
}
if (currentState == DBCS)
spaceNeeded = 2;
else
spaceNeeded = 1;
if (byteOff + spaceNeeded > outEnd) {
throw new ConversionBufferFullException();
}
if (currentState == SBCS)
output[byteOff++] = outputByte[1];
else {
output[byteOff++] = outputByte[0];
output[byteOff++] = outputByte[1];
}
charOff += inputSize;
}
return byteOff - outOff;
}
/**
* Resets converter to its initial state.
*/
public void reset() {
charOff = byteOff = 0;
highHalfZoneCode = 0;
currentState = SBCS;
}
/**
* Returns the maximum number of bytes needed to convert a char.
*/
public int getMaxBytesPerChar() {
return 4; //Fixed with bug 4199599 so tests would pass.
}
/**
* Sets the substitution bytes to use when the converter is in
* substitution mode. The given bytes should represent a valid
* character in the target character encoding.
*/
public void setSubstitutionBytes( byte[] newSubBytes )
throws IllegalArgumentException
{
if( newSubBytes.length > 2 || newSubBytes.length == 0) {
throw new IllegalArgumentException();
}
subBytes = new byte[ newSubBytes.length ];
System.arraycopy( newSubBytes, 0, subBytes, 0, newSubBytes.length );
}
/**
* Returns true if the given character can be converted to the
* target character encoding.
*/
public boolean canConvert(char ch) {
int index;
int theBytes;
index = index1[((ch & mask1) >> shift)] + (ch & mask2);
if (index < 15000)
theBytes = (int)(index2.charAt(index));
else
theBytes = (int)(index2a.charAt(index-15000));
if (theBytes != 0)
return (true);
// only return true if input char was unicode null - all others are
// undefined
return( ch == '\u0000');
}
}