blob: c3509d7c2f3a5caa392c7fc62ddd0b37f8e4b318 [file] [log] [blame]
/*
* Copyright (c) 2000, 2006, Oracle and/or its affiliates. All rights reserved.
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
*
* This code is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License version 2 only, as
* published by the Free Software Foundation. Oracle designates this
* particular file as subject to the "Classpath" exception as provided
* by Oracle in the LICENSE file that accompanied this code.
*
* This code is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
* version 2 for more details (a copy is included in the LICENSE file that
* accompanied this code).
*
* You should have received a copy of the GNU General Public License version
* 2 along with this work; if not, write to the Free Software Foundation,
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
*
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
* or visit www.oracle.com if you need additional information or have any
* questions.
*/
package sun.nio.cs;
import java.nio.ByteBuffer;
import java.nio.CharBuffer;
import java.nio.charset.Charset;
import java.nio.charset.CharsetDecoder;
import java.nio.charset.CoderResult;
import java.nio.charset.CharacterCodingException;
import java.nio.charset.MalformedInputException;
/**
 * Base decoder that turns pairs of bytes into 16-bit {@code char} code units,
 * optionally sniffing a byte order mark at the start of the input to pick
 * the byte order.
 *
 * <p>The decoder is configured with an initial byte order ({@link #BIG},
 * {@link #LITTLE} or {@link #NONE}). When it is {@link #NONE}, the first
 * two bytes seen are inspected: a byte order mark (in either orientation)
 * selects the byte order and is consumed without producing output; anything
 * else selects the configured default byte order and is decoded normally.
 */
abstract class UnicodeDecoder extends CharsetDecoder {

    /** Byte order mark as it reads when the bytes are in the expected order. */
    protected static final char BYTE_ORDER_MARK = (char) 0xfeff;

    /** Byte order mark as it reads when the bytes are swapped. */
    protected static final char REVERSED_MARK = (char) 0xfffe;

    /** Byte order not yet known; it is determined from the first two bytes. */
    protected static final int NONE = 0;

    /** Most significant byte first. */
    protected static final int BIG = 1;

    /** Least significant byte first. */
    protected static final int LITTLE = 2;

    /** Byte order supplied at construction; restored by {@link #implReset()}. */
    private final int expectedByteOrder;

    /** Byte order adopted when the input does not start with a byte order mark. */
    private final int defaultByteOrder;

    /** Byte order currently used to assemble code units. */
    private int currentByteOrder;

    /**
     * Creates a decoder whose fallback byte order (used when no byte order
     * mark is present) is {@link #BIG}.
     *
     * @param cs the charset this decoder belongs to
     * @param bo the initial byte order: {@link #NONE}, {@link #BIG} or
     *           {@link #LITTLE}
     */
    public UnicodeDecoder(Charset cs, int bo) {
        this(cs, bo, BIG);
    }

    /**
     * Creates a decoder with an explicit fallback byte order.
     *
     * @param cs        the charset this decoder belongs to
     * @param bo        the initial byte order: {@link #NONE}, {@link #BIG}
     *                  or {@link #LITTLE}
     * @param defaultBO the byte order to adopt when {@code bo} is
     *                  {@link #NONE} and the input does not start with a
     *                  byte order mark
     */
    public UnicodeDecoder(Charset cs, int bo, int defaultBO) {
        // Two input bytes yield one char: 0.5 chars per byte on average,
        // and never more than 1.0.
        super(cs, 0.5f, 1.0f);
        this.expectedByteOrder = bo;
        this.currentByteOrder = bo;
        this.defaultByteOrder = defaultBO;
    }

    /**
     * Combines two unsigned byte values into one code unit using the
     * current byte order. Any byte order other than {@link #BIG} is
     * treated as least-significant-byte-first.
     */
    private char decode(int b1, int b2) {
        boolean bigEndian = (currentByteOrder == BIG);
        int high = bigEndian ? b1 : b2;
        int low = bigEndian ? b2 : b1;
        return (char) ((high << 8) | low);
    }

    /**
     * Decodes as many complete code units as possible from {@code src}
     * into {@code dst}.
     *
     * <p>On every exit path the position of {@code src} is set to just
     * past the last unit that was fully handled, so bytes belonging to an
     * incomplete, malformed or not-yet-written unit remain unread.
     *
     * @param src the input bytes
     * @param dst the output characters
     * @return {@link CoderResult#UNDERFLOW} when fewer than two bytes
     *         remain or a high surrogate lacks its two trailing bytes;
     *         {@link CoderResult#OVERFLOW} when {@code dst} cannot hold the
     *         next character (or surrogate pair); a malformed-input result
     *         of length 2 for a reversed byte order mark or an unpaired low
     *         surrogate, or of length 4 for a high surrogate that is not
     *         followed by a low surrogate
     */
    @Override
    protected CoderResult decodeLoop(ByteBuffer src, CharBuffer dst) {
        int consumedUpTo = src.position();
        try {
            while (src.remaining() >= 2) {
                int first = src.get() & 0xff;
                int second = src.get() & 0xff;

                // Byte order still undecided: look for a byte order mark.
                if (currentByteOrder == NONE) {
                    int probe = (first << 8) | second;
                    if (probe == BYTE_ORDER_MARK || probe == REVERSED_MARK) {
                        currentByteOrder = (probe == BYTE_ORDER_MARK) ? BIG : LITTLE;
                        consumedUpTo += 2;   // the mark itself produces no output
                        continue;
                    }
                    // No mark: adopt the default and decode these two bytes normally.
                    currentByteOrder = defaultByteOrder;
                }

                char unit = decode(first, second);

                // A reversed byte order mark is rejected once the byte order is known.
                if (unit == REVERSED_MARK) {
                    return CoderResult.malformedForLength(2);
                }

                // A low surrogate that does not follow a high surrogate is unpaired.
                if (Character.isLowSurrogate(unit)) {
                    return CoderResult.malformedForLength(2);
                }

                if (Character.isHighSurrogate(unit)) {
                    if (src.remaining() < 2) {
                        // Trailing half has not arrived yet; leave the lead unread.
                        return CoderResult.UNDERFLOW;
                    }
                    int third = src.get() & 0xff;
                    int fourth = src.get() & 0xff;
                    char trail = decode(third, fourth);
                    if (!Character.isLowSurrogate(trail)) {
                        return CoderResult.malformedForLength(4);
                    }
                    if (dst.remaining() < 2) {
                        return CoderResult.OVERFLOW;
                    }
                    consumedUpTo += 4;
                    dst.put(unit);
                    dst.put(trail);
                    continue;
                }

                // Ordinary (non-surrogate) code unit.
                if (!dst.hasRemaining()) {
                    return CoderResult.OVERFLOW;
                }
                consumedUpTo += 2;
                dst.put(unit);
            }
            return CoderResult.UNDERFLOW;
        } finally {
            // Rewind over anything that was read but not fully processed.
            src.position(consumedUpTo);
        }
    }

    /**
     * Restores the byte order supplied at construction, discarding any
     * byte order chosen while decoding earlier input.
     */
    @Override
    protected void implReset() {
        currentByteOrder = expectedByteOrder;
    }
}