1de76a5adSDamjan Jovanovic /************************************************************** 2de76a5adSDamjan Jovanovic * 3de76a5adSDamjan Jovanovic * Licensed to the Apache Software Foundation (ASF) under one 4de76a5adSDamjan Jovanovic * or more contributor license agreements. See the NOTICE file 5de76a5adSDamjan Jovanovic * distributed with this work for additional information 6de76a5adSDamjan Jovanovic * regarding copyright ownership. The ASF licenses this file 7de76a5adSDamjan Jovanovic * to you under the Apache License, Version 2.0 (the 8de76a5adSDamjan Jovanovic * "License"); you may not use this file except in compliance 9de76a5adSDamjan Jovanovic * with the License. You may obtain a copy of the License at 10de76a5adSDamjan Jovanovic * 11de76a5adSDamjan Jovanovic * http://www.apache.org/licenses/LICENSE-2.0 12de76a5adSDamjan Jovanovic * 13de76a5adSDamjan Jovanovic * Unless required by applicable law or agreed to in writing, 14de76a5adSDamjan Jovanovic * software distributed under the License is distributed on an 15de76a5adSDamjan Jovanovic * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY 16de76a5adSDamjan Jovanovic * KIND, either express or implied. See the License for the 17de76a5adSDamjan Jovanovic * specific language governing permissions and limitations 18de76a5adSDamjan Jovanovic * under the License. 19de76a5adSDamjan Jovanovic * 20de76a5adSDamjan Jovanovic *************************************************************/ 21de76a5adSDamjan Jovanovic 22de76a5adSDamjan Jovanovic 23de76a5adSDamjan Jovanovic 242f709283SDamjan Jovanovic package api.i18n; 25de76a5adSDamjan Jovanovic 26de76a5adSDamjan Jovanovic import com.sun.star.i18n.KParseTokens; 27de76a5adSDamjan Jovanovic import com.sun.star.i18n.KParseType; 28de76a5adSDamjan Jovanovic import com.sun.star.i18n.ParseResult; 29de76a5adSDamjan Jovanovic import com.sun.star.i18n.XCharacterClassification; 30de76a5adSDamjan Jovanovic import com.sun.star.lang.Locale; 312f709283SDamjan Jovanovic import com.sun.star.uno.UnoRuntime; 322f709283SDamjan Jovanovic import com.sun.star.uno.XComponentContext; 332f709283SDamjan Jovanovic import org.junit.After; 342f709283SDamjan Jovanovic import org.junit.AfterClass; 352f709283SDamjan Jovanovic import org.junit.Before; 362f709283SDamjan Jovanovic import org.junit.BeforeClass; 372f709283SDamjan Jovanovic import org.junit.Assert; 38*daf711bfSDamjan Jovanovic import org.junit.Ignore; 392f709283SDamjan Jovanovic import org.junit.Test; 402f709283SDamjan Jovanovic import org.openoffice.test.uno.UnoApp; 41de76a5adSDamjan Jovanovic 42de76a5adSDamjan Jovanovic /** 43de76a5adSDamjan Jovanovic * Testing <code>com.sun.star.i18n.XCharacterClassification</code> 44de76a5adSDamjan Jovanovic * interface methods: 45de76a5adSDamjan Jovanovic * <ul> 46de76a5adSDamjan Jovanovic * <li><code> toUpper() </code></li> 47de76a5adSDamjan Jovanovic * <li><code> toLower() </code></li> 48de76a5adSDamjan Jovanovic * <li><code> toTitle() </code></li> 49de76a5adSDamjan Jovanovic * <li><code> getType() </code></li> 50de76a5adSDamjan Jovanovic * <li><code> getCharacterType() </code></li> 51de76a5adSDamjan Jovanovic * <li><code> getStringType() </code></li> 52de76a5adSDamjan Jovanovic * <li><code> getCharacterDirection() </code></li> 53de76a5adSDamjan Jovanovic * <li><code> getScript() </code></li> 54de76a5adSDamjan Jovanovic * <li><code> parseAnyToken() </code></li> 55de76a5adSDamjan Jovanovic * <li><code> parsePredefinedToken() </code></li> 56de76a5adSDamjan Jovanovic * </ul><p> 57de76a5adSDamjan Jovanovic * Test is <b> NOT </b> multithread compliant. <p> 58de76a5adSDamjan Jovanovic * @see com.sun.star.i18n.XCharacterClassification 59de76a5adSDamjan Jovanovic */ 602f709283SDamjan Jovanovic public class XCharacterClassificationTest { 612f709283SDamjan Jovanovic private static final UnoApp app = new UnoApp(); 622f709283SDamjan Jovanovic 632f709283SDamjan Jovanovic private XComponentContext xContext = null; 64de76a5adSDamjan Jovanovic public XCharacterClassification oObj = null; 65de76a5adSDamjan Jovanovic public String[] languages = new String[]{"de","en","es","fr","ja","ko","zh"}; 66de76a5adSDamjan Jovanovic public String[] countries = new String[]{"DE","US","ES","FR","JP","KR","CN"}; 67de76a5adSDamjan Jovanovic 68de76a5adSDamjan Jovanovic public String[] charstyles_java = new String[] {"UNASSIGNED","UPPERCASE_LETTER", 69de76a5adSDamjan Jovanovic "LOWERCASE_LETTER","TITLECASE_LETTER","MODIFIER_LETTER","OTHER_LETTER", 70de76a5adSDamjan Jovanovic "NON_SPACING_MARK","ENCLOSING_MARK","COMBINING_SPACING_MARK", 71de76a5adSDamjan Jovanovic "DECIMAL_DIGIT_NUMBER","LETTER_NUMBER","OTHER_NUMBER","SPACE_SEPARATOR", 72de76a5adSDamjan Jovanovic "LINE_SEPARATOR","PARAGRAPH_SEPARATOR","CONTROL","FORMAT","none17", 73de76a5adSDamjan Jovanovic "PRIVATE_USE","none19","DASH_PUNCTUATION","START_PUNCTUATION","END_PUNCTUATION", 74de76a5adSDamjan Jovanovic "CONNECTOR_PUNCTUATION","OTHER_PUNCTUATION","MATH_SYMBOL","CURRENCY_SYMBOL", 75de76a5adSDamjan Jovanovic "MODIFIER_SYMBOL","OTHER_SYMBOL"}; 76de76a5adSDamjan Jovanovic 77de76a5adSDamjan Jovanovic public String[] charstyles_office = new String[] {"UNASSIGNED","UPPERCASE_LETTER", 78de76a5adSDamjan Jovanovic "LOWERCASE_LETTER","TITLECASE_LETTER","MODIFIER_LETTER","OTHER_LETTER", 79de76a5adSDamjan Jovanovic "NON_SPACING_MARK","ENCLOSING_MARK","COMBINING_SPACING_MARK", 80de76a5adSDamjan Jovanovic "DECIMAL_DIGIT_NUMBER","LETTER_NUMBER","OTHER_NUMBER","SPACE_SEPARATOR", 81de76a5adSDamjan Jovanovic "LINE_SEPARATOR","PARAGRAPH_SEPARATOR","CONTROL","FORMAT","PRIVATE_USE", 82de76a5adSDamjan Jovanovic "OTHER_PUNCTUATION","DASH_PUNCTUATION","START_PUNCTUATION","END_PUNCTUATION", 83de76a5adSDamjan Jovanovic "CONNECTOR_PUNCTUATION", 84de76a5adSDamjan Jovanovic "OTHER_PUNCTUATION","MATH_SYMBOL","CURRENCY_SYMBOL","MODIFIER_SYMBOL", 85de76a5adSDamjan Jovanovic "OTHER_SYMBOL","INITIAL_PUNCTUATION","FINAL_PUNCTUATION","GENERAL_TYPES_COUNT"}; 86de76a5adSDamjan Jovanovic 87de76a5adSDamjan Jovanovic public String[] unicode_script = new String[] {"U_BASIC_LATIN","U_LATIN_1_SUPPLEMENT", 88de76a5adSDamjan Jovanovic "U_LATIN_EXTENDED_A","U_LATIN_EXTENDED_B","U_IPA_EXTENSIONS","U_SPACING_MODIFIER_LETTERS", 89de76a5adSDamjan Jovanovic "U_COMBINING_DIACRITICAL_MARKS","U_GREEK","U_CYRILLIC","U_ARMENIAN","U_HEBREW", 90de76a5adSDamjan Jovanovic "U_ARABIC","U_SYRIAC","U_THAANA","U_DEVANAGARI","U_BENGALI","U_GURMUKHI", 91de76a5adSDamjan Jovanovic "U_GUJARATI","U_ORIYA","U_TAMIL","U_TELUGU","U_KANNADA","U_MALAYALAM", 92de76a5adSDamjan Jovanovic "U_SINHALA","U_THAI","U_LAO","U_TIBETAN","U_MYANMAR","U_GEORGIAN", 93de76a5adSDamjan Jovanovic "U_HANGUL_JAMO","U_ETHIOPIC","U_CHEROKEE","U_UNIFIED_CANADIAN_ABORIGINAL_SYLLABICS", 94de76a5adSDamjan Jovanovic "U_OGHAM","U_RUNIC","U_KHMER","U_MONGOLIAN","U_LATIN_EXTENDED_ADDITIONAL", 95de76a5adSDamjan Jovanovic "U_GREEK_EXTENDED","U_GENERAL_PUNCTUATION","U_SUPERSCRIPTS_AND_SUBSCRIPTS", 96de76a5adSDamjan Jovanovic "U_CURRENCY_SYMBOLS","U_COMBINING_MARKS_FOR_SYMBOLS","U_LETTERLIKE_SYMBOLS", 97de76a5adSDamjan Jovanovic "U_NUMBER_FORMS","U_ARROWS","U_MATHEMATICAL_OPERATORS","U_MISCELLANEOUS_TECHNICAL", 98de76a5adSDamjan Jovanovic "U_CONTROL_PICTURES","U_OPTICAL_CHARACTER_RECOGNITION","U_ENCLOSED_ALPHANUMERICS", 99de76a5adSDamjan Jovanovic "U_BOX_DRAWING","U_BLOCK_ELEMENTS","U_GEOMETRIC_SHAPES","U_MISCELLANEOUS_SYMBOLS", 100de76a5adSDamjan Jovanovic "U_DINGBATS","U_BRAILLE_PATTERNS","U_CJK_RADICALS_SUPPLEMENT","U_KANGXI_RADICALS", 101de76a5adSDamjan Jovanovic "U_IDEOGRAPHIC_DESCRIPTION_CHARACTERS","U_CJK_SYMBOLS_AND_PUNCTUATION", 102de76a5adSDamjan Jovanovic "U_HIRAGANA","U_KATAKANA","U_BOPOMOFO","U_HANGUL_COMPATIBILITY_JAMO","U_KANBUN", 103de76a5adSDamjan Jovanovic "U_BOPOMOFO_EXTENDED","U_ENCLOSED_CJK_LETTERS_AND_MONTHS","U_CJK_COMPATIBILITY", 104de76a5adSDamjan Jovanovic "U_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_A","U_CJK_UNIFIED_IDEOGRAPHS","U_YI_SYLLABLES", 105de76a5adSDamjan Jovanovic "U_YI_RADICALS","U_HANGUL_SYLLABLES","U_HIGH_SURROGATES","U_HIGH_PRIVATE_USE_SURROGATES", 106de76a5adSDamjan Jovanovic "U_LOW_SURROGATES","U_PRIVATE_USE_AREA","U_CJK_COMPATIBILITY_IDEOGRAPHS", 107de76a5adSDamjan Jovanovic "U_ALPHABETIC_PRESENTATION_FORMS","U_ARABIC_PRESENTATION_FORMS_A","U_COMBINING_HALF_MARKS", 108de76a5adSDamjan Jovanovic "U_CJK_COMPATIBILITY_FORMS","U_SMALL_FORM_VARIANTS","U_ARABIC_PRESENTATION_FORMS_B", 109de76a5adSDamjan Jovanovic "U_SPECIALS","U_HALFWIDTH_AND_FULLWIDTH_FORMS","U_CHAR_SCRIPT_COUNT","U_NO_SCRIPT"}; 110de76a5adSDamjan Jovanovic 1112f709283SDamjan Jovanovic // setup and close connections 1122f709283SDamjan Jovanovic @BeforeClass setUpConnection()1132f709283SDamjan Jovanovic public static void setUpConnection() throws Exception 1142f709283SDamjan Jovanovic { 1152f709283SDamjan Jovanovic app.start(); 1162f709283SDamjan Jovanovic } 1172f709283SDamjan Jovanovic 1182f709283SDamjan Jovanovic @AfterClass tearDownConnection()1192f709283SDamjan Jovanovic public static void tearDownConnection() throws InterruptedException, com.sun.star.uno.Exception 1202f709283SDamjan Jovanovic { 1212f709283SDamjan Jovanovic app.close(); 1222f709283SDamjan Jovanovic } 1232f709283SDamjan Jovanovic 1242f709283SDamjan Jovanovic @Before before()1252f709283SDamjan Jovanovic public void before() throws Exception { 1262f709283SDamjan Jovanovic xContext = app.getComponentContext(); 1272f709283SDamjan Jovanovic oObj = UnoRuntime.queryInterface( 1282f709283SDamjan Jovanovic XCharacterClassification.class, 1292f709283SDamjan Jovanovic xContext.getServiceManager().createInstanceWithContext("com.sun.star.i18n.CharacterClassification", xContext) 1302f709283SDamjan Jovanovic ); 1312f709283SDamjan Jovanovic } 1322f709283SDamjan Jovanovic 133de76a5adSDamjan Jovanovic /** 134de76a5adSDamjan Jovanovic * Test calls the method for different locales. Then each result is compared 135de76a5adSDamjan Jovanovic * with a string, converted to a upper case using 136de76a5adSDamjan Jovanovic * <code>java.lang.String</code> method <code>toUpperCase()</code>.<p> 137de76a5adSDamjan Jovanovic * Has <b> OK </b> status if string, returned by the method is equal to 138de76a5adSDamjan Jovanovic * a string that is returned by String.toUpperCase() for all locales. 139de76a5adSDamjan Jovanovic */ 1402f709283SDamjan Jovanovic @Test _toUpper()141de76a5adSDamjan Jovanovic public void _toUpper() { 142de76a5adSDamjan Jovanovic boolean res = true; 143de76a5adSDamjan Jovanovic char[] characters = new char[]{586,65,97,498,721,4588,772,8413,3404}; 144de76a5adSDamjan Jovanovic String toCheck = new String(characters); 145de76a5adSDamjan Jovanovic String get = ""; 146de76a5adSDamjan Jovanovic String exp = ""; 147de76a5adSDamjan Jovanovic 148de76a5adSDamjan Jovanovic for (int i=0;i<7;i++) { 149de76a5adSDamjan Jovanovic get = oObj.toUpper(toCheck, 0, toCheck.length(), getLocale(i)); 150de76a5adSDamjan Jovanovic exp = toCheck.toUpperCase( 151de76a5adSDamjan Jovanovic new java.util.Locale(languages[i], countries[i])); 152de76a5adSDamjan Jovanovic res &= get.equals(exp); 153de76a5adSDamjan Jovanovic if (!res) { 1542f709283SDamjan Jovanovic System.out.println("FAILED for: language=" + languages[i] + 155de76a5adSDamjan Jovanovic " ; country=" + countries[i]); 1562f709283SDamjan Jovanovic System.out.println("Expected: " + exp); 1572f709283SDamjan Jovanovic System.out.println("Gained : " + get); 158de76a5adSDamjan Jovanovic } 159de76a5adSDamjan Jovanovic } 1602f709283SDamjan Jovanovic Assert.assertTrue("toUpper()", res); 161de76a5adSDamjan Jovanovic } 162de76a5adSDamjan Jovanovic 163de76a5adSDamjan Jovanovic /** 164de76a5adSDamjan Jovanovic * Test calls the method for different locales. Then each result is compared 165de76a5adSDamjan Jovanovic * with a string, converted to a lower case using 166de76a5adSDamjan Jovanovic * <code>java.lang.String</code> method <code>toLowerCase()</code>.<p> 167de76a5adSDamjan Jovanovic * Has <b> OK </b> status if string, returned by the method is equal to 168de76a5adSDamjan Jovanovic * a string that is returned by String.toLowerCase() for all locales. 169de76a5adSDamjan Jovanovic */ 1702f709283SDamjan Jovanovic @Test 171*daf711bfSDamjan Jovanovic @Ignore("Bug #87590 Incorrect casing for U+026A, U+0268, U+0197...") _toLower()172de76a5adSDamjan Jovanovic public void _toLower() { 173de76a5adSDamjan Jovanovic boolean res = true; 174de76a5adSDamjan Jovanovic char[] characters = new char[]{586,65,97,498,721,4588,772,8413,3404}; 175de76a5adSDamjan Jovanovic String toCheck = new String(characters); 176de76a5adSDamjan Jovanovic String get = ""; 177de76a5adSDamjan Jovanovic String exp = ""; 178de76a5adSDamjan Jovanovic 179de76a5adSDamjan Jovanovic for (int i=0;i<7;i++) { 180de76a5adSDamjan Jovanovic get = oObj.toLower(toCheck,0,toCheck.length(),getLocale(i)); 181de76a5adSDamjan Jovanovic exp = toCheck.toLowerCase( 182de76a5adSDamjan Jovanovic new java.util.Locale(languages[i],countries[i])); 183de76a5adSDamjan Jovanovic res &= get.equals(exp); 184de76a5adSDamjan Jovanovic if (!res) { 1852f709283SDamjan Jovanovic System.out.println("FAILED for: language=" + languages[i] 186de76a5adSDamjan Jovanovic + " ; country=" + countries[i]); 1872f709283SDamjan Jovanovic System.out.println("Expected: " + exp); 1882f709283SDamjan Jovanovic System.out.println("Gained : " + get); 189de76a5adSDamjan Jovanovic } 190de76a5adSDamjan Jovanovic } 1912f709283SDamjan Jovanovic Assert.assertTrue("toLower()", res); 192de76a5adSDamjan Jovanovic } 193de76a5adSDamjan Jovanovic 194de76a5adSDamjan Jovanovic /** 195de76a5adSDamjan Jovanovic * Test calls the method for different locales. Then each result is compared 196de76a5adSDamjan Jovanovic * with a string, converted to a title case using 197de76a5adSDamjan Jovanovic * <code>java.lang.Character</code> method <code>toTitleCase()</code>.<p> 198de76a5adSDamjan Jovanovic * Has <b> OK </b> status if string, returned by the method is equal to 199de76a5adSDamjan Jovanovic * a string that was converted using Character.toTitleCase() for all locales. 200de76a5adSDamjan Jovanovic */ 2012f709283SDamjan Jovanovic @Test _toTitle()202de76a5adSDamjan Jovanovic public void _toTitle() { 203de76a5adSDamjan Jovanovic boolean res = true; 204de76a5adSDamjan Jovanovic String toCheck = new String(new char[]{8112}); 205de76a5adSDamjan Jovanovic String get = ""; 206de76a5adSDamjan Jovanovic String exp = ""; 207de76a5adSDamjan Jovanovic 208de76a5adSDamjan Jovanovic for (int i=0;i<7;i++) { 209de76a5adSDamjan Jovanovic get = oObj.toTitle(toCheck, 0, 1, getLocale(i)); 210de76a5adSDamjan Jovanovic exp = new String( 211de76a5adSDamjan Jovanovic new char[]{Character.toTitleCase(toCheck.toCharArray()[0])}); 212de76a5adSDamjan Jovanovic res &= get.equals(exp); 213de76a5adSDamjan Jovanovic if (!res) { 2142f709283SDamjan Jovanovic System.out.println("FAILED for: language=" + languages[i] 215de76a5adSDamjan Jovanovic + " ; country=" + countries[i]); 2162f709283SDamjan Jovanovic System.out.println("Expected: " + exp); 2172f709283SDamjan Jovanovic System.out.println("Gained : " + get); 218de76a5adSDamjan Jovanovic } 219de76a5adSDamjan Jovanovic } 2202f709283SDamjan Jovanovic Assert.assertTrue("toTitle()", res); 221de76a5adSDamjan Jovanovic } 222de76a5adSDamjan Jovanovic 223de76a5adSDamjan Jovanovic /** 224de76a5adSDamjan Jovanovic * At first we define <code>int[]</code> and <code>char[]</code> arrays of 225de76a5adSDamjan Jovanovic * unicode symbol numbers, arranged as sequences, where symbols are sorted 226de76a5adSDamjan Jovanovic * by type, so the character of <code>i<sup><small>th</small></sup></code> 227de76a5adSDamjan Jovanovic * type is located on <code>i<sup><small>th</small></sup></code> position.<p> 228de76a5adSDamjan Jovanovic * Has <b> OK </b> status if for all 30 types the method returns value, that 229de76a5adSDamjan Jovanovic * is equal to an element number.<p> 230de76a5adSDamjan Jovanovic * @see com.sun.star.i18n.CharType 231de76a5adSDamjan Jovanovic */ 2322f709283SDamjan Jovanovic @Test _getType()233de76a5adSDamjan Jovanovic public void _getType() { 234de76a5adSDamjan Jovanovic boolean res = true; 23524ef62edSDamjan Jovanovic // If or when this list gets out of date again, 23624ef62edSDamjan Jovanovic // find new characters of the required type with: 23724ef62edSDamjan Jovanovic // for (int i = 30; i <= 0xffff; i++) { 23824ef62edSDamjan Jovanovic // String s = new String("" + (char)i); 23924ef62edSDamjan Jovanovic // int type = oObj.getType(s, 0); 24024ef62edSDamjan Jovanovic // System.out.println("character " + i + " has type " + charstyles_office[type]); 24124ef62edSDamjan Jovanovic // } 24224ef62edSDamjan Jovanovic char[] characters = new char[]{888,65,97,498,721,4588,772,8413,3404, 24324ef62edSDamjan Jovanovic 48,8544,179,32,8232,8233,144,8204,57344,56320,45,40,41,95,3852,247, 244de76a5adSDamjan Jovanovic 3647,901,3896,171,187}; 245de76a5adSDamjan Jovanovic String toCheck = new String(characters); 246de76a5adSDamjan Jovanovic 247de76a5adSDamjan Jovanovic for (int i=0;i<characters.length;i++) { 248de76a5adSDamjan Jovanovic int get = oObj.getType(toCheck, i); 249de76a5adSDamjan Jovanovic res &= (charstyles_office[get] == charstyles_office[i]); 250de76a5adSDamjan Jovanovic if (!res) { 25124ef62edSDamjan Jovanovic System.out.println("Code: " + Integer.toHexString((int)characters[i])); 2522f709283SDamjan Jovanovic System.out.println("Gained: " + charstyles_office[get]); 2532f709283SDamjan Jovanovic System.out.println("Expected: " + charstyles_office[i]); 254de76a5adSDamjan Jovanovic } 255de76a5adSDamjan Jovanovic } 2562f709283SDamjan Jovanovic Assert.assertTrue("getType()", res); 257de76a5adSDamjan Jovanovic } 258de76a5adSDamjan Jovanovic 259de76a5adSDamjan Jovanovic /** 260de76a5adSDamjan Jovanovic * After defining string to be checked and array of expected types, test 261de76a5adSDamjan Jovanovic * calls the method for each character of a string and for all locales.<p> 262de76a5adSDamjan Jovanovic * Has <b> OK </b> status if the method returns type, expected for a given 263de76a5adSDamjan Jovanovic * character and locale. 264de76a5adSDamjan Jovanovic */ 2652f709283SDamjan Jovanovic @Test _getCharacterType()266de76a5adSDamjan Jovanovic public void _getCharacterType() { 267de76a5adSDamjan Jovanovic boolean res = true; 2685c977050SDamjan Jovanovic // If or when this list gets out of date again, 2695c977050SDamjan Jovanovic // find new characters of the required type with: 2705c977050SDamjan Jovanovic //for (int i = 32; i <= 0xffff; i++) { 2715c977050SDamjan Jovanovic // int charType = oObj.getCharacterType("" + (char)i, 0, getLocale(1)); 2725c977050SDamjan Jovanovic // if (charType == 32) { 2735c977050SDamjan Jovanovic // System.out.println("character " + i + " has type 32"); 2745c977050SDamjan Jovanovic // } 2755c977050SDamjan Jovanovic //} 2765c977050SDamjan Jovanovic String toCheck = "Ab0*"; 277de76a5adSDamjan Jovanovic int[] expected = new int[]{226,228,97,32}; 278de76a5adSDamjan Jovanovic 279de76a5adSDamjan Jovanovic for (int i=0;i<toCheck.length();i++) { 280de76a5adSDamjan Jovanovic for (int j=1;j<7;j++) { 281de76a5adSDamjan Jovanovic int get = oObj.getCharacterType(toCheck, i, getLocale(j)); 282de76a5adSDamjan Jovanovic res &= (get == expected[i]); 283de76a5adSDamjan Jovanovic if (!res) { 2842f709283SDamjan Jovanovic System.out.println("FAILED for: language=" + languages[j] + 285de76a5adSDamjan Jovanovic " ; country=" + countries[j]); 2868619c510SDamjan Jovanovic System.out.println("Symbol: " + toCheck.toCharArray()[i]); 2872f709283SDamjan Jovanovic System.out.println("Gained: " + get); 2882f709283SDamjan Jovanovic System.out.println("Expected: " + expected[i]); 289de76a5adSDamjan Jovanovic } 290de76a5adSDamjan Jovanovic } 291de76a5adSDamjan Jovanovic } 2922f709283SDamjan Jovanovic Assert.assertTrue("getCharacterType()", res); 293de76a5adSDamjan Jovanovic } 294de76a5adSDamjan Jovanovic 295de76a5adSDamjan Jovanovic /** 296de76a5adSDamjan Jovanovic * After defining array of strings to be checked and array of expected types, 297de76a5adSDamjan Jovanovic * test calls the method for each string of an array and for all locales.<p> 298de76a5adSDamjan Jovanovic * Has <b> OK </b> status if the method returns type, expected for a given 299de76a5adSDamjan Jovanovic * string and locale. 300de76a5adSDamjan Jovanovic */ 3012f709283SDamjan Jovanovic @Test _getStringType()302de76a5adSDamjan Jovanovic public void _getStringType() { 303de76a5adSDamjan Jovanovic boolean res = true; 304de76a5adSDamjan Jovanovic String[] toCheck = new String[]{"01234","AAAAA","bbbbb","AA()bb"}; 305de76a5adSDamjan Jovanovic int[] exp = new int[]{97,226,228,230}; 306de76a5adSDamjan Jovanovic 307de76a5adSDamjan Jovanovic for (int j=0;j<toCheck.length;j++) { 308de76a5adSDamjan Jovanovic for (int i=0;i<7;i++) { 309de76a5adSDamjan Jovanovic int get = oObj.getStringType(toCheck[j], 0, 310de76a5adSDamjan Jovanovic toCheck[j].length(), getLocale(i)); 311de76a5adSDamjan Jovanovic res &= (get == exp[j]); 312de76a5adSDamjan Jovanovic if (!res) { 3132f709283SDamjan Jovanovic System.out.println("FAILED for: language=" + languages[i] + 314de76a5adSDamjan Jovanovic " ; country=" + countries[i]); 3152f709283SDamjan Jovanovic System.out.println("Expected: " + exp[j]); 3162f709283SDamjan Jovanovic System.out.println("Gained : " + get); 317de76a5adSDamjan Jovanovic } 318de76a5adSDamjan Jovanovic } 319de76a5adSDamjan Jovanovic } 3202f709283SDamjan Jovanovic Assert.assertTrue("getStringType()", res); 321de76a5adSDamjan Jovanovic } 322de76a5adSDamjan Jovanovic 323de76a5adSDamjan Jovanovic /** 324de76a5adSDamjan Jovanovic * After string to be checked is initialized (all symbols are sorted 325de76a5adSDamjan Jovanovic * by direction, so the character of <code>i<sup><small>th</small></sup></code> 326de76a5adSDamjan Jovanovic * direction is located on <code>i<sup><small>th</small></sup></code> 327de76a5adSDamjan Jovanovic * position), test calls the method for every character of that string. <p> 328de76a5adSDamjan Jovanovic * Has <b> OK </b> status if the method returns direction, that's equal to 329de76a5adSDamjan Jovanovic * a symbol position in the string. 330de76a5adSDamjan Jovanovic */ 3312f709283SDamjan Jovanovic @Test _getCharacterDirection()332de76a5adSDamjan Jovanovic public void _getCharacterDirection() { 333de76a5adSDamjan Jovanovic boolean res = true; 334cc5c65fbSDamjan Jovanovic String toCheck = new String(new char[]{65,1470,48,43,35,1632,44,10, 335de76a5adSDamjan Jovanovic 9,12,33,8234,8237,1563,8235,8238,8236,768,1}); 336de76a5adSDamjan Jovanovic for (short i=0;i<19;i++) { 337de76a5adSDamjan Jovanovic short get = oObj.getCharacterDirection(toCheck, i); 338de76a5adSDamjan Jovanovic res &= (get == i); 339de76a5adSDamjan Jovanovic if (!res) { 3402f709283SDamjan Jovanovic System.out.println("Code :" + toCheck.toCharArray()[i]); 3412f709283SDamjan Jovanovic System.out.println("Gained: " + get); 3422f709283SDamjan Jovanovic System.out.println("Expected: " + i); 343de76a5adSDamjan Jovanovic } 344de76a5adSDamjan Jovanovic } 3452f709283SDamjan Jovanovic Assert.assertTrue("getCharacterDirection()", res); 346de76a5adSDamjan Jovanovic } 347de76a5adSDamjan Jovanovic 348de76a5adSDamjan Jovanovic /** 349de76a5adSDamjan Jovanovic * At first we define <code>int[]</code> and <code>char[]</code> arrays of 350de76a5adSDamjan Jovanovic * unicode symbol numbers, arranged as sequences, where symbols are sorted 351de76a5adSDamjan Jovanovic * by type, so the character of <code>i<sup><small>th</small></sup></code> 352de76a5adSDamjan Jovanovic * type is located on <code>i<sup><small>th</small></sup></code> position.<p> 353de76a5adSDamjan Jovanovic * Has <b> OK </b> status if for each character method returns value, that 354de76a5adSDamjan Jovanovic * is equal to a number where element is located in array. Also method has 355de76a5adSDamjan Jovanovic * <b> OK </b> status for symbol with code 55296, because it doesn't work 356de76a5adSDamjan Jovanovic * since it hasn't the right neighborhood.<p> 357de76a5adSDamjan Jovanovic * @see "http://ppewww.ph.gla.ac.uk/~flavell/unicode/unidata.html" 358de76a5adSDamjan Jovanovic */ 3592f709283SDamjan Jovanovic @Test _getScript()360de76a5adSDamjan Jovanovic public void _getScript() { 361de76a5adSDamjan Jovanovic boolean res = true; 362de76a5adSDamjan Jovanovic char[] characters = new char[]{65,128,256,384,592,750,773,924,1030,1331,1448, 363de76a5adSDamjan Jovanovic 1569,1792,1936,2313,2465,2570,2707,2822,2972,3079,3240,3337,3464,3590, 364de76a5adSDamjan Jovanovic 3745,3906,4097,4274,4357,4621,5040,5200,5776,5806,6030,6155,7683,7943, 365de76a5adSDamjan Jovanovic 8202,8319,8352,8413,8452,8545,8616,8715,8965,9217,9281,9336,9474,9608,9719, 366de76a5adSDamjan Jovanovic 9734,9999,10247,11911,12034,12274,12294,12358,12456,12552,12605,12688,12727, 367de76a5adSDamjan Jovanovic 12806,13065,13312,19968,40964,42152,44032,55296,56192,56320,57344,63744, 368de76a5adSDamjan Jovanovic 64257,64370,65056,65073,65131,65146,65532,65288}; 369de76a5adSDamjan Jovanovic String toCheck = new String(characters); 370de76a5adSDamjan Jovanovic 371de76a5adSDamjan Jovanovic for (int i=0;i<characters.length;i++) { 372de76a5adSDamjan Jovanovic int get = oObj.getScript(toCheck, i); 373de76a5adSDamjan Jovanovic //The HIGH_SURROGATE 55296 doesn't work since it hasn't the right 37407b05676SDamjan Jovanovic //neighborhood. Neither does 56192 - it combines with 55296 into another code point. 37507b05676SDamjan Jovanovic if (toCheck.charAt(i) != 55296 && toCheck.charAt(i) != 56192) { 37607b05676SDamjan Jovanovic res &= (get == i); 37707b05676SDamjan Jovanovic } 378de76a5adSDamjan Jovanovic if (!res) { 3792f709283SDamjan Jovanovic System.out.println("-- " + toCheck.substring(i, i + 1).hashCode()); 38007b05676SDamjan Jovanovic System.out.println("Code: " + Integer.toHexString((int)characters[i])); 38107b05676SDamjan Jovanovic System.out.println("Gained: " + get + " (" + (0 <= get && get < unicode_script.length ? unicode_script[get] : "out of range") + ")"); 3822f709283SDamjan Jovanovic System.out.println("Expected: " + unicode_script[i]); 383de76a5adSDamjan Jovanovic } 384de76a5adSDamjan Jovanovic } 3852f709283SDamjan Jovanovic Assert.assertTrue("getScript()", res); 386de76a5adSDamjan Jovanovic } 387de76a5adSDamjan Jovanovic 388de76a5adSDamjan Jovanovic /** 389de76a5adSDamjan Jovanovic * After defining a string to be parsed and parse conditions (flags), test 390de76a5adSDamjan Jovanovic * calls the method for different locales three times with different parameters, 391de76a5adSDamjan Jovanovic * checking result after every call. <p> 392de76a5adSDamjan Jovanovic * Has <b> OK </b> status if the method returns right results all three 393de76a5adSDamjan Jovanovic * times. 394de76a5adSDamjan Jovanovic */ 3952f709283SDamjan Jovanovic @Test _parseAnyToken()396de76a5adSDamjan Jovanovic public void _parseAnyToken() { 397de76a5adSDamjan Jovanovic int nStartFlags = KParseTokens.ANY_ALPHA | KParseTokens.ASC_UNDERSCORE; 398de76a5adSDamjan Jovanovic int nContFlags = KParseTokens.ANY_ALNUM | KParseTokens.ASC_UNDERSCORE 399de76a5adSDamjan Jovanovic | KParseTokens.ASC_DOT; 400de76a5adSDamjan Jovanovic String toCheck = " 18 i18n ^"; 401de76a5adSDamjan Jovanovic ParseResult pRes = null; 402de76a5adSDamjan Jovanovic boolean res = true; 403de76a5adSDamjan Jovanovic 404de76a5adSDamjan Jovanovic for (int i=0;i<7;i++) { 405de76a5adSDamjan Jovanovic pRes = oObj.parseAnyToken(toCheck, 1, getLocale(i), 406de76a5adSDamjan Jovanovic nStartFlags, "", nContFlags, ""); 407de76a5adSDamjan Jovanovic res = ( (pRes.CharLen==2) 408de76a5adSDamjan Jovanovic && (pRes.TokenType==32) 409de76a5adSDamjan Jovanovic && (pRes.Value==18.0) ); 410de76a5adSDamjan Jovanovic pRes = oObj.parseAnyToken(toCheck, 4, getLocale(i), 411de76a5adSDamjan Jovanovic nStartFlags, "", nContFlags, ""); 412de76a5adSDamjan Jovanovic res &= ( (pRes.CharLen==4) 413de76a5adSDamjan Jovanovic && (pRes.TokenType==4) 414de76a5adSDamjan Jovanovic && (pRes.Value==0.0) ); 415de76a5adSDamjan Jovanovic pRes = oObj.parseAnyToken(toCheck, 9, getLocale(i), 416de76a5adSDamjan Jovanovic nStartFlags, "", nContFlags, ""); 417de76a5adSDamjan Jovanovic res &= ( (pRes.CharLen==1) 418de76a5adSDamjan Jovanovic && (pRes.TokenType==1) 419de76a5adSDamjan Jovanovic && (pRes.Value==0.0) ); 420de76a5adSDamjan Jovanovic } 4212f709283SDamjan Jovanovic Assert.assertTrue("parseAnyToken()", res); 422de76a5adSDamjan Jovanovic } 423de76a5adSDamjan Jovanovic 424de76a5adSDamjan Jovanovic /** 425de76a5adSDamjan Jovanovic * After defining a string to be parsed and parse conditions (flags), test 426de76a5adSDamjan Jovanovic * calls the method for different locales two times with different parameters, 427de76a5adSDamjan Jovanovic * checking result after every call. <p> 428de76a5adSDamjan Jovanovic * Has <b> OK </b> status if the method returns right results. 429de76a5adSDamjan Jovanovic */ 4302f709283SDamjan Jovanovic @Test _parsePredefinedToken()431de76a5adSDamjan Jovanovic public void _parsePredefinedToken() { 432de76a5adSDamjan Jovanovic int nStartFlags = KParseTokens.ANY_ALPHA | KParseTokens.ASC_UNDERSCORE; 433de76a5adSDamjan Jovanovic int nContFlags = nStartFlags; 434de76a5adSDamjan Jovanovic String toCheck = " 18 int"; 435de76a5adSDamjan Jovanovic ParseResult pRes = null; 436de76a5adSDamjan Jovanovic boolean res = true; 437de76a5adSDamjan Jovanovic 438de76a5adSDamjan Jovanovic for (int i=0;i<7;i++) { 439de76a5adSDamjan Jovanovic pRes = oObj.parsePredefinedToken(KParseType.IDENTNAME, toCheck, 440de76a5adSDamjan Jovanovic 1, getLocale(i), nStartFlags, "", nContFlags, ""); 441de76a5adSDamjan Jovanovic res = (pRes.CharLen==0); 442de76a5adSDamjan Jovanovic pRes = oObj.parsePredefinedToken(KParseType.IDENTNAME, toCheck, 443de76a5adSDamjan Jovanovic 4, getLocale(i), nStartFlags, "", nContFlags, ""); 444de76a5adSDamjan Jovanovic res &= ( (pRes.CharLen==3) 445de76a5adSDamjan Jovanovic && (pRes.TokenType==4) 446de76a5adSDamjan Jovanovic && (pRes.Value==0.0) ); 447de76a5adSDamjan Jovanovic } 4482f709283SDamjan Jovanovic Assert.assertTrue("parsePredefinedToken()", res); 449de76a5adSDamjan Jovanovic } 450de76a5adSDamjan Jovanovic 451de76a5adSDamjan Jovanovic 452de76a5adSDamjan Jovanovic /** 453de76a5adSDamjan Jovanovic * Method returns locale for a given language and country. 454de76a5adSDamjan Jovanovic * @param k index of needed locale. 455de76a5adSDamjan Jovanovic */ getLocale(int k)456de76a5adSDamjan Jovanovic private Locale getLocale(int k) { 457de76a5adSDamjan Jovanovic return new Locale(languages[k],countries[k],""); 458de76a5adSDamjan Jovanovic } 459de76a5adSDamjan Jovanovic 460de76a5adSDamjan Jovanovic 461de76a5adSDamjan Jovanovic } // end XCharacterClassification 462