blob: 19eb4c87f94cebcf6341e07d4c45cd6d7c79f046 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.jena.atlas.io;
import static org.junit.Assert.assertArrayEquals;
import static org.junit.Assert.assertEquals;
import java.io.ByteArrayInputStream ;
import java.io.ByteArrayOutputStream ;
import java.io.IOException ;
import java.io.OutputStreamWriter ;
import java.io.Writer ;
import java.nio.charset.Charset ;
import java.nio.charset.CharsetDecoder ;
import java.nio.charset.CharsetEncoder ;
import org.apache.jena.atlas.lib.Chars ;
import org.junit.Test ;
/**
 * Round-trip tests for the UTF-8 stream classes {@code InStreamUTF8} (bytes to
 * characters) and {@code OutStreamUTF8} (characters to bytes).
 * <p>
 * Each test compares the class under test against the JDK's own UTF-8 encoder
 * (via {@link OutputStreamWriter}), using sample strings whose characters need
 * one, two or three bytes in UTF-8.
 */
public class TestStreamUTF8
{
    static Charset utf8 = Chars.charsetUTF8 ;
    static CharsetDecoder dec = utf8.newDecoder() ;
    static CharsetEncoder enc = utf8.newEncoder() ;

    // UTF-8 encoding.
    // character '¢' = code point U+00A2 -> C2 A2
    // character '€' = code point U+20AC -> E2 82 AC

    static private final String asciiBase       = "abc" ;
    static private final String latinBase       = "Àéíÿ" ;
    // U+FB01 = fi-ligature, U+FB02 = fl-ligature. Written as escapes so the
    // ligatures are not folded to plain "fi"/"fl" by Unicode normalization
    // of the source file.
    static private final String latinExtraBase  = "ỹ\uFB01\uFB02" ;
    static private final String greekBase       = "αβγ" ;
    static private final String hebrewBase      = "אבג" ;
    static private final String arabicBase      = "ءآأ" ;
    static private final String symbolsBase     = "☺☻♪♫" ;
    static private final String chineseBase     = "孫子兵法" ;     // The Art of War
    static private final String japaneseBase    = "日本" ;         // Japanese

    // ---- Decoding: bytes -> chars

    @Test public void test_in_00() { testIn("") ; }
    @Test public void test_in_01() { testIn(asciiBase) ; }
    @Test public void test_in_02() { testIn(latinBase) ; }
    @Test public void test_in_03() { testIn(latinExtraBase) ; }
    @Test public void test_in_04() { testIn(greekBase) ; }
    @Test public void test_in_05() { testIn(hebrewBase) ; }
    @Test public void test_in_06() { testIn(arabicBase) ; }
    @Test public void test_in_07() { testIn(symbolsBase) ; }
    @Test public void test_in_08() { testIn(chineseBase) ; }
    @Test public void test_in_09() { testIn(japaneseBase) ; }

    // ---- Encoding: chars -> bytes

    @Test public void test_out_00() { testOut("") ; }
    @Test public void test_out_01() { testOut(asciiBase) ; }
    @Test public void test_out_02() { testOut(latinBase) ; }
    @Test public void test_out_03() { testOut(latinExtraBase) ; }
    @Test public void test_out_04() { testOut(greekBase) ; }
    @Test public void test_out_05() { testOut(hebrewBase) ; }
    @Test public void test_out_06() { testOut(arabicBase) ; }
    @Test public void test_out_07() { testOut(symbolsBase) ; }
    @Test public void test_out_08() { testOut(chineseBase) ; }
    @Test public void test_out_09() { testOut(japaneseBase) ; }

    /**
     * Encode {@code x} to UTF-8 bytes with the JDK, decode those bytes with
     * {@code InStreamUTF8}, and assert the decoded text equals {@code x}.
     *
     * @param x the string to round-trip
     */
    static void testIn(String x)
    {
        try {
            byte[] bytes = stringAsBytes(x) ;
            ByteArrayInputStream bin = new ByteArrayInputStream(bytes) ;
            // Create string from bytes
            try(InStreamUTF8 r = new InStreamUTF8(bin)) {
                char[] cbuff = new char[x.length()*10] ;    // Way too big
                int len = r.read(cbuff) ;
                // A reader may report end-of-stream as -1; treat that as
                // "no characters" so a mismatch fails the assertion below
                // instead of throwing StringIndexOutOfBoundsException.
                if ( len < 0 )
                    len = 0 ;
                String str = new String(cbuff, 0, len) ;
                assertEquals(x, str) ;
            }
        } catch (IOException ex) { throw new RuntimeException(ex) ; }
    }

    /**
     * Encode {@code x} with {@code OutStreamUTF8} and assert the bytes produced
     * are identical to those produced by the JDK's UTF-8 encoder.
     *
     * @param x the string to encode
     */
    static void testOut(String x)
    {
        try {
            byte[] bytes = stringAsBytes(x) ;
            ByteArrayOutputStream bout = new ByteArrayOutputStream() ;
            // Closing the writer flushes everything through to bout.
            try(Writer out = new OutStreamUTF8(bout)) {
                out.write(x) ;
            }
            byte[] bytes2 = bout.toByteArray() ;
            assertArrayEquals(bytes, bytes2) ;
        } catch (IOException ex) { throw new RuntimeException(ex) ; }
    }

    /**
     * Produce the reference UTF-8 encoding of {@code x} using the JDK's
     * {@link OutputStreamWriter}.
     *
     * @param x the string to encode
     * @return the UTF-8 bytes of {@code x}
     */
    static byte[] stringAsBytes(String x)
    {
        try {
            ByteArrayOutputStream bout = new ByteArrayOutputStream() ;
            // Closing the writer flushes the encoder into bout.
            try(Writer out = new OutputStreamWriter(bout, utf8)) {
                out.write(x) ;
            }
            byte[] bytes = bout.toByteArray() ;
            return bytes ;
        } catch (IOException ex) { throw new RuntimeException(ex) ; }
    }
}