/*
 * Copyright (c) 2002, 2013, Oracle and/or its affiliates. All rights reserved.
 * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
 *
 * This code is free software; you can redistribute it and/or modify it
 * under the terms of the GNU General Public License version 2 only, as
 * published by the Free Software Foundation.
 *
 * This code is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU General Public License
 * version 2 for more details (a copy is included in the LICENSE file that
 * accompanied this code).
 *
 * You should have received a copy of the GNU General Public License version
 * 2 along with this work; if not, write to the Free Software Foundation,
 * Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 *
 * Please contact Oracle, 500 Oracle Parkway, Redwood Shores, CA 94065 USA
 * or visit www.oracle.com if you need additional information or have any
 * questions.
 */
/* @test
 * @bug 4153987
 * @summary Malformed surrogates should be handled by the converter in
 *          substitution mode.
 */
import java.io.*;
import java.nio.charset.Charset;
import java.nio.charset.CharsetDecoder;
import java.nio.charset.CharsetEncoder;
import java.nio.CharBuffer;
import java.nio.ByteBuffer;
import java.nio.charset.CodingErrorAction;
import java.nio.charset.MalformedInputException;
import java.nio.charset.UnmappableCharacterException;
import java.util.SortedMap;
/**
 * Checks how charset encoders treat well-formed and broken UTF-16 surrogate
 * sequences.
 *
 * <p>{@link #main} walks every charset returned by
 * {@link Charset#availableCharsets()} that supports encoding (skipping
 * {@code x-COMPOUND_TEXT}) and, for each one, verifies that
 * <ul>
 *   <li>a well-formed surrogate pair either encodes or is reported as
 *       unmappable,</li>
 *   <li>broken surrogate sequences are rejected when the encoder is left in
 *       its default error mode, and</li>
 *   <li>with {@link CodingErrorAction#REPLACE} configured, an encode/decode
 *       round trip yields the input with the broken code units replaced by
 *       the encoder's replacement string.</li>
 * </ul>
 * Every check is performed twice: once through the {@code CharsetEncoder} /
 * {@code CharsetDecoder} API directly and once through
 * {@code OutputStreamWriter} / {@code InputStreamReader}.
 * A failed check is signalled by a {@link RuntimeException}.
 */
public class MalformedSurrogates {

    private static final String PREFIX = "abc";
    private static final String SUFFIX = "efgh";

    /** U+D800 followed by U+DB00: two high surrogates, no low surrogate. */
    private static final String MALFORMED_SURROGATE = PREFIX + "\uD800\uDB00" + SUFFIX;
    /** U+D800 followed by U+DC00: a well-formed high/low pair. */
    private static final String NORMAL_SURROGATE = PREFIX + "\uD800\uDC00" + SUFFIX;
    /** U+DC00 followed by U+D800: low surrogate first, then high. */
    private static final String REVERSED_SURROGATE = PREFIX + "\uDC00\uD800" + SUFFIX;
    /** A single high surrogate with no partner. */
    private static final String SOLITARY_HIGH_SURROGATE = PREFIX + "\uD800" + SUFFIX;
    /** A single low surrogate with no partner. */
    private static final String SOLITARY_LOW_SURROGATE = PREFIX + "\uDC00" + SUFFIX;

    /**
     * Runs all surrogate checks against every encodable charset.
     *
     * @param args ignored
     * @throws IOException if a stream-based check fails with an I/O error other
     *         than the coding exceptions the individual checks expect
     */
    public static void main(String[] args) throws IOException {
        // values() of the sorted map iterates in the same (name) order as its key set.
        for (Charset charset : Charset.availableCharsets().values()) {
            // x-COMPOUND_TEXT is skipped by name; the reason is not recorded in this file.
            if (!charset.canEncode() || charset.name().equals("x-COMPOUND_TEXT")) {
                continue;
            }
            testNormalSurrogate(charset, NORMAL_SURROGATE);
            testMalformedSurrogate(charset, MALFORMED_SURROGATE);
            testMalformedSurrogate(charset, REVERSED_SURROGATE);
            testMalformedSurrogate(charset, SOLITARY_HIGH_SURROGATE);
            testMalformedSurrogate(charset, SOLITARY_LOW_SURROGATE);
            testSurrogateWithReplacement(charset, NORMAL_SURROGATE);
            testSurrogateWithReplacement(charset, MALFORMED_SURROGATE);
            testSurrogateWithReplacement(charset, REVERSED_SURROGATE);
            testSurrogateWithReplacement(charset, SOLITARY_HIGH_SURROGATE);
            testSurrogateWithReplacement(charset, SOLITARY_LOW_SURROGATE);
        }
    }

    /**
     * Verifies that an encoder in its default error mode refuses the given text.
     *
     * @param cs        charset whose encoder is exercised
     * @param surrogate text expected to be rejected by the encoder
     * @throws RuntimeException if {@code canEncode} accepts the text, or if
     *         encoding (directly or through an {@code OutputStreamWriter})
     *         completes without a {@code MalformedInputException} or
     *         {@code UnmappableCharacterException}
     * @throws IOException on any other I/O failure
     */
    public static void testMalformedSurrogate(Charset cs, String surrogate) throws IOException {
        CharsetEncoder en = cs.newEncoder();
        if (en.canEncode(surrogate)) {
            throw new RuntimeException("testMalformedSurrogate failed with charset " + cs.name());
        }

        // Direct encoder API.
        try {
            en.encode(CharBuffer.wrap(surrogate));
            throw new RuntimeException("Should throw MalformedInputException or UnmappableCharacterException");
        } catch (MalformedInputException | UnmappableCharacterException ex) {
            // This is the outcome the test is looking for.
        } finally {
            // The same encoder instance is reused for the stream check below.
            en.reset();
        }

        // Same check through the writer layer.
        try (OutputStreamWriter osw = new OutputStreamWriter(new ByteArrayOutputStream(), en)) {
            osw.write(surrogate);
            throw new RuntimeException("Should throw MalformedInputException or UnmappableCharacterException");
        } catch (MalformedInputException | UnmappableCharacterException ex) {
            // This is the outcome the test is looking for.
        }
    }

    /**
     * Encodes text containing a well-formed surrogate pair. Either outcome is
     * accepted: successful encoding, or an {@code UnmappableCharacterException}
     * when the charset cannot represent the character.
     *
     * @param cs        charset whose encoder is exercised
     * @param surrogate text containing a well-formed surrogate pair
     * @throws IOException if encoding fails with anything other than
     *         {@code UnmappableCharacterException}
     */
    public static void testNormalSurrogate(Charset cs, String surrogate) throws IOException {
        CharsetEncoder en = cs.newEncoder();

        // Direct encoder API.
        try {
            en.encode(CharBuffer.wrap(surrogate));
        } catch (UnmappableCharacterException ex) {
            // Acceptable: the charset simply has no mapping for the character.
        } finally {
            // The same encoder instance is reused for the stream check below.
            en.reset();
        }

        // Same check through the writer layer.
        try (OutputStreamWriter osw = new OutputStreamWriter(new ByteArrayOutputStream(), en)) {
            osw.write(surrogate);
        } catch (UnmappableCharacterException ex) {
            // Acceptable: the charset simply has no mapping for the character.
        }
    }

    /**
     * Round-trips text through the charset with the encoder set to
     * {@link CodingErrorAction#REPLACE} and checks the decoded result.
     *
     * <p>Charsets whose encoder cannot encode the well-formed surrogate sample
     * are skipped. The expected result is the prefix and suffix with, in
     * between, two replacement strings for the two-code-unit broken inputs, one
     * replacement string for the solitary-surrogate inputs, and the well-formed
     * sample itself for any other input.
     *
     * @param cs        charset whose encoder and decoder are exercised
     * @param surrogate text to round-trip
     * @throws RuntimeException if the decoded text differs from the expectation
     * @throws IOException on encoding, decoding or stream failure
     */
    public static void testSurrogateWithReplacement(Charset cs, String surrogate) throws IOException {
        CharsetEncoder en = cs.newEncoder();
        CharsetDecoder de = cs.newDecoder();
        if (!en.canEncode(NORMAL_SURROGATE)) {
            return;
        }

        // The encoder's replacement bytes, as they look after decoding.
        String replace = new String(en.replacement(), cs);
        String expected;
        switch (surrogate) {
            case MALFORMED_SURROGATE:
            case REVERSED_SURROGATE:
                expected = PREFIX + replace + replace + SUFFIX;
                break;
            case SOLITARY_HIGH_SURROGATE:
            case SOLITARY_LOW_SURROGATE:
                expected = PREFIX + replace + SUFFIX;
                break;
            default:
                expected = NORMAL_SURROGATE;
        }

        // Direct encoder/decoder API.
        try {
            en.onMalformedInput(CodingErrorAction.REPLACE);
            en.onUnmappableCharacter(CodingErrorAction.REPLACE);
            ByteBuffer bbuf = en.encode(CharBuffer.wrap(surrogate));
            checkRoundTrip(cs, surrogate, de.decode(bbuf).toString(), expected);
        } finally {
            // Both coders are reused for the stream check below.
            en.reset();
            de.reset();
        }

        // Same round trip through the writer/reader layer.
        try (ByteArrayOutputStream bos = new ByteArrayOutputStream();
             OutputStreamWriter osw = new OutputStreamWriter(bos, en)) {
            osw.write(surrogate);
            osw.flush();
            try (InputStreamReader isr = new InputStreamReader(
                    new ByteArrayInputStream(bos.toByteArray()), de)) {
                // Read to end of stream: a single read() need not return everything,
                // and a buffer sized to the expectation would hide surplus output.
                checkRoundTrip(cs, surrogate, readFully(isr), expected);
            }
        }
    }

    /** Returns every character the reader delivers until end of stream. */
    private static String readFully(Reader reader) throws IOException {
        StringBuilder decoded = new StringBuilder();
        char[] chunk = new char[64];
        int count;
        while ((count = reader.read(chunk)) != -1) {
            decoded.append(chunk, 0, count);
        }
        return decoded.toString();
    }

    /** Throws a {@code RuntimeException} describing the mismatch unless {@code actual} equals {@code expected}. */
    private static void checkRoundTrip(Charset cs, String surrogate, String actual, String expected) {
        if (!actual.equals(expected)) {
            throw new RuntimeException("charset " + cs.name() + " (en)decoded the surrogate " + surrogate + " to " + actual + " which is not same as the expected " + expected);
        }
    }
}
/*
 * Measurement V0.5 in percent C=100 H=100 G=100
 * Processing time: 0.11 seconds (preprocessed on 2026-06-10)
 * © Formatika GbR, Germany
 */