blob: 84d76538949421c388c159cc204ed583e4fffd73 [file] [log] [blame]
/*
* Copyright (c) 2008, Oracle and/or its affiliates. All rights reserved.
* DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
*
* This code is free software; you can redistribute it and/or modify it
* under the terms of the GNU General Public License version 2 only, as
* published by the Free Software Foundation.
*
* This code is distributed in the hope that it will be useful, but WITHOUT
* ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
* FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License
* version 2 for more details (a copy is included in the LICENSE file that
* accompanied this code).
*
* You should have received a copy of the GNU General Public License version
* 2 along with this work; if not, write to the Free Software Foundation,
* Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
*
* Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
* or visit www.oracle.com if you need additional information or have any
* questions.
*/
/* @test
@bug 4508058 6378911
@summary Check if UTF8 decoder handles BOM correctly
*/
import java.io.IOException;
import java.nio.BufferOverflowException;
import java.nio.*;
import java.nio.charset.*;
/* The fix for 6378911 is to backout the change we made for 4508058,
so this regtest is modified accordingly to leave the beginning
BOM untouched during decoding.
*/
public class TestUTF8BOM {
private static ByteBuffer bf = ByteBuffer.allocateDirect(1000);
private static void testDecode(String expected, byte[] input)
throws Exception
{
String out = new String(input, "utf8");
if (!out.equals(expected)) {
failureReport (out, expected);
throw new Exception("UTF_8 Decoding test failed");
}
//try directBuffer.
bf.clear();
bf.put(input).flip();
out = Charset.forName("UTF-8")
.decode(bf)
.toString();
if (!out.equals(expected)) {
failureReport (out, expected);
throw new Exception("UTF_8 Decoding test failed(directbuffer)");
}
}
private static void failureReport(String testStr,
String expected) {
System.err.println ("Expected Characters:");
for (int i = 0; i < expected.length() ; i++) {
System.out.println("expected char[" + i + "] : " +
Integer.toHexString((int)expected.charAt(i)) +
" obtained char[" + i + "] : " +
Integer.toHexString((int)testStr.charAt(i)));
}
}
public static void main (String[] args) throws Exception {
// Test 1: with BOM at beginning
testDecode("\ufeff\u0092\u0093",
new byte[] { (byte) 0xef, (byte) 0xbb, (byte) 0xbf,
(byte) 0xc2, (byte) 0x92,
(byte) 0xc2, (byte) 0x93 });
// Test 2: with BOM at middle
testDecode("\u9200\ufeff\u9300",
new byte[] { (byte) 0xe9, (byte) 0x88, (byte) 0x80,
(byte) 0xef, (byte) 0xbb, (byte) 0xbf,
(byte) 0xe9, (byte) 0x8c, (byte) 0x80 });
// Test 3: with BOM at end
testDecode("\u9200\u9300\ufeff",
new byte[] { (byte) 0xe9, (byte) 0x88, (byte) 0x80,
(byte) 0xe9, (byte) 0x8c, (byte) 0x80,
(byte) 0xef, (byte) 0xbb, (byte) 0xbf });
System.err.println ("\nPASSED UTF-8 decode BOM test");
}
}