blob: 1b379e68120a7fde3b003b20aa6ac1d67945273a [file] [log] [blame]
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.xml.security.test.dom.c14n.implementations;
import java.io.ByteArrayOutputStream;
import java.nio.charset.StandardCharsets;
import org.apache.xml.security.c14n.implementations.UtfHelpper;
import static org.junit.Assert.assertArrayEquals;
public class UtfHelperTest {
@org.junit.Test
public void testBug40156() {
String s = "\u00e4\u00f6\u00fc";
byte[] a = UtfHelpper.getStringInUtf8(s);
byte[] correct = s.getBytes(StandardCharsets.UTF_8);
assertArrayEquals(correct, a);
}
@org.junit.Test
public void testUtf() throws Exception {
//
// This test fails with the IBM JDK
//
if ("IBM Corporation".equals(System.getProperty("java.vendor"))) {
return;
}
// if system property org.apache.xml.security.c14n.oldUtf8=true, can only validate
// 16bit chars against String.getBytes(StandardCharsets.UTF_8);
int chunk = Boolean.getBoolean("org.apache.xml.security.c14n.oldUtf8") ? 1 << 16
: Character.MAX_CODE_POINT + 1;
int j = 0;
ByteArrayOutputStream charByCharOs = new ByteArrayOutputStream();
ByteArrayOutputStream strOs = new ByteArrayOutputStream();
char[] chs = new char[chunk * 2];
int pos = 0;
for (int i = 0; i < chunk; i++) {
int ch = chunk * j + i;
int offset = Character.toChars(ch, chs, pos);
pos += offset;
if (ch == 0xDBFF) {
// since 0xDBFF with next character 0xDC00 will form a surrogate pair, so insert a space character in between
offset = Character.toChars(Character.SPACE_SEPARATOR, chs, pos);
pos += offset;
}
}
char[] newResult = new char[pos];
System.arraycopy(chs, 0, newResult, 0, pos);
for (int i = 0; i < pos; ) {
int ch = Character.codePointAt(newResult, i);
i += Character.charCount(ch);
UtfHelpper.writeCodePointToUtf8(ch, charByCharOs);
}
String str = new String(newResult);
byte[] a = UtfHelpper.getStringInUtf8(str);
// System.out.println("chunk:"+j);
byte[] correct = str.getBytes(StandardCharsets.UTF_8);
assertArrayEquals("UtfHelper.getStringInUtf8 false", correct, a);
assertArrayEquals(
"UtfHelper.getStringInUtf8 false",
correct, charByCharOs.toByteArray()
);
UtfHelpper.writeStringToUtf8(str, strOs);
assertArrayEquals(
"UtfHelper.writeStringToUtf8 false",
correct, strOs.toByteArray()
);
}
}