xref: /trunk/test/testuno/source/api/i18n/XCharacterClassificationTest.java (revision 3309286857f19787ae62bd793a98b5af4edd2ad3)
1de76a5adSDamjan Jovanovic /**************************************************************
2de76a5adSDamjan Jovanovic  *
3de76a5adSDamjan Jovanovic  * Licensed to the Apache Software Foundation (ASF) under one
4de76a5adSDamjan Jovanovic  * or more contributor license agreements.  See the NOTICE file
5de76a5adSDamjan Jovanovic  * distributed with this work for additional information
6de76a5adSDamjan Jovanovic  * regarding copyright ownership.  The ASF licenses this file
7de76a5adSDamjan Jovanovic  * to you under the Apache License, Version 2.0 (the
8de76a5adSDamjan Jovanovic  * "License"); you may not use this file except in compliance
9de76a5adSDamjan Jovanovic  * with the License.  You may obtain a copy of the License at
10de76a5adSDamjan Jovanovic  *
11de76a5adSDamjan Jovanovic  *   http://www.apache.org/licenses/LICENSE-2.0
12de76a5adSDamjan Jovanovic  *
13de76a5adSDamjan Jovanovic  * Unless required by applicable law or agreed to in writing,
14de76a5adSDamjan Jovanovic  * software distributed under the License is distributed on an
15de76a5adSDamjan Jovanovic  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
16de76a5adSDamjan Jovanovic  * KIND, either express or implied.  See the License for the
17de76a5adSDamjan Jovanovic  * specific language governing permissions and limitations
18de76a5adSDamjan Jovanovic  * under the License.
19de76a5adSDamjan Jovanovic  *
20de76a5adSDamjan Jovanovic  *************************************************************/
21de76a5adSDamjan Jovanovic 
22de76a5adSDamjan Jovanovic 
23de76a5adSDamjan Jovanovic 
242f709283SDamjan Jovanovic package api.i18n;
25de76a5adSDamjan Jovanovic 
26de76a5adSDamjan Jovanovic import com.sun.star.i18n.KParseTokens;
27de76a5adSDamjan Jovanovic import com.sun.star.i18n.KParseType;
28de76a5adSDamjan Jovanovic import com.sun.star.i18n.ParseResult;
29de76a5adSDamjan Jovanovic import com.sun.star.i18n.XCharacterClassification;
30de76a5adSDamjan Jovanovic import com.sun.star.lang.Locale;
312f709283SDamjan Jovanovic import com.sun.star.uno.UnoRuntime;
322f709283SDamjan Jovanovic import com.sun.star.uno.XComponentContext;
332f709283SDamjan Jovanovic import org.junit.After;
342f709283SDamjan Jovanovic import org.junit.AfterClass;
352f709283SDamjan Jovanovic import org.junit.Before;
362f709283SDamjan Jovanovic import org.junit.BeforeClass;
372f709283SDamjan Jovanovic import org.junit.Assert;
38*daf711bfSDamjan Jovanovic import org.junit.Ignore;
392f709283SDamjan Jovanovic import org.junit.Test;
402f709283SDamjan Jovanovic import org.openoffice.test.uno.UnoApp;
41de76a5adSDamjan Jovanovic 
42de76a5adSDamjan Jovanovic /**
43de76a5adSDamjan Jovanovic  * Testing <code>com.sun.star.i18n.XCharacterClassification</code>
44de76a5adSDamjan Jovanovic  * interface methods:
45de76a5adSDamjan Jovanovic  * <ul>
46de76a5adSDamjan Jovanovic  *  <li><code> toUpper() </code></li>
47de76a5adSDamjan Jovanovic  *  <li><code> toLower() </code></li>
48de76a5adSDamjan Jovanovic  *  <li><code> toTitle() </code></li>
49de76a5adSDamjan Jovanovic  *  <li><code> getType() </code></li>
50de76a5adSDamjan Jovanovic  *  <li><code> getCharacterType() </code></li>
51de76a5adSDamjan Jovanovic  *  <li><code> getStringType() </code></li>
52de76a5adSDamjan Jovanovic  *  <li><code> getCharacterDirection() </code></li>
53de76a5adSDamjan Jovanovic  *  <li><code> getScript() </code></li>
54de76a5adSDamjan Jovanovic  *  <li><code> parseAnyToken() </code></li>
55de76a5adSDamjan Jovanovic  *  <li><code> parsePredefinedToken() </code></li>
56de76a5adSDamjan Jovanovic  * </ul><p>
57de76a5adSDamjan Jovanovic  * Test is <b> NOT </b> multithread compliant. <p>
58de76a5adSDamjan Jovanovic  * @see com.sun.star.i18n.XCharacterClassification
59de76a5adSDamjan Jovanovic  */
602f709283SDamjan Jovanovic public class XCharacterClassificationTest {
612f709283SDamjan Jovanovic     private static final UnoApp app = new UnoApp();
622f709283SDamjan Jovanovic 
632f709283SDamjan Jovanovic     private XComponentContext xContext = null;
64de76a5adSDamjan Jovanovic     public XCharacterClassification oObj = null;
65de76a5adSDamjan Jovanovic     public String[] languages = new String[]{"de","en","es","fr","ja","ko","zh"};
66de76a5adSDamjan Jovanovic     public String[] countries = new String[]{"DE","US","ES","FR","JP","KR","CN"};
67de76a5adSDamjan Jovanovic 
68de76a5adSDamjan Jovanovic     public String[] charstyles_java = new String[] {"UNASSIGNED","UPPERCASE_LETTER",
69de76a5adSDamjan Jovanovic         "LOWERCASE_LETTER","TITLECASE_LETTER","MODIFIER_LETTER","OTHER_LETTER",
70de76a5adSDamjan Jovanovic         "NON_SPACING_MARK","ENCLOSING_MARK","COMBINING_SPACING_MARK",
71de76a5adSDamjan Jovanovic         "DECIMAL_DIGIT_NUMBER","LETTER_NUMBER","OTHER_NUMBER","SPACE_SEPARATOR",
72de76a5adSDamjan Jovanovic         "LINE_SEPARATOR","PARAGRAPH_SEPARATOR","CONTROL","FORMAT","none17",
73de76a5adSDamjan Jovanovic         "PRIVATE_USE","none19","DASH_PUNCTUATION","START_PUNCTUATION","END_PUNCTUATION",
74de76a5adSDamjan Jovanovic         "CONNECTOR_PUNCTUATION","OTHER_PUNCTUATION","MATH_SYMBOL","CURRENCY_SYMBOL",
75de76a5adSDamjan Jovanovic         "MODIFIER_SYMBOL","OTHER_SYMBOL"};
76de76a5adSDamjan Jovanovic 
77de76a5adSDamjan Jovanovic     public String[] charstyles_office = new String[] {"UNASSIGNED","UPPERCASE_LETTER",
78de76a5adSDamjan Jovanovic         "LOWERCASE_LETTER","TITLECASE_LETTER","MODIFIER_LETTER","OTHER_LETTER",
79de76a5adSDamjan Jovanovic         "NON_SPACING_MARK","ENCLOSING_MARK","COMBINING_SPACING_MARK",
80de76a5adSDamjan Jovanovic         "DECIMAL_DIGIT_NUMBER","LETTER_NUMBER","OTHER_NUMBER","SPACE_SEPARATOR",
81de76a5adSDamjan Jovanovic         "LINE_SEPARATOR","PARAGRAPH_SEPARATOR","CONTROL","FORMAT","PRIVATE_USE",
82de76a5adSDamjan Jovanovic         "OTHER_PUNCTUATION","DASH_PUNCTUATION","START_PUNCTUATION","END_PUNCTUATION",
83de76a5adSDamjan Jovanovic         "CONNECTOR_PUNCTUATION",
84de76a5adSDamjan Jovanovic         "OTHER_PUNCTUATION","MATH_SYMBOL","CURRENCY_SYMBOL","MODIFIER_SYMBOL",
85de76a5adSDamjan Jovanovic         "OTHER_SYMBOL","INITIAL_PUNCTUATION","FINAL_PUNCTUATION","GENERAL_TYPES_COUNT"};
86de76a5adSDamjan Jovanovic 
87de76a5adSDamjan Jovanovic     public String[] unicode_script = new String[] {"U_BASIC_LATIN","U_LATIN_1_SUPPLEMENT",
88de76a5adSDamjan Jovanovic         "U_LATIN_EXTENDED_A","U_LATIN_EXTENDED_B","U_IPA_EXTENSIONS","U_SPACING_MODIFIER_LETTERS",
89de76a5adSDamjan Jovanovic         "U_COMBINING_DIACRITICAL_MARKS","U_GREEK","U_CYRILLIC","U_ARMENIAN","U_HEBREW",
90de76a5adSDamjan Jovanovic         "U_ARABIC","U_SYRIAC","U_THAANA","U_DEVANAGARI","U_BENGALI","U_GURMUKHI",
91de76a5adSDamjan Jovanovic         "U_GUJARATI","U_ORIYA","U_TAMIL","U_TELUGU","U_KANNADA","U_MALAYALAM",
92de76a5adSDamjan Jovanovic         "U_SINHALA","U_THAI","U_LAO","U_TIBETAN","U_MYANMAR","U_GEORGIAN",
93de76a5adSDamjan Jovanovic         "U_HANGUL_JAMO","U_ETHIOPIC","U_CHEROKEE","U_UNIFIED_CANADIAN_ABORIGINAL_SYLLABICS",
94de76a5adSDamjan Jovanovic         "U_OGHAM","U_RUNIC","U_KHMER","U_MONGOLIAN","U_LATIN_EXTENDED_ADDITIONAL",
95de76a5adSDamjan Jovanovic         "U_GREEK_EXTENDED","U_GENERAL_PUNCTUATION","U_SUPERSCRIPTS_AND_SUBSCRIPTS",
96de76a5adSDamjan Jovanovic         "U_CURRENCY_SYMBOLS","U_COMBINING_MARKS_FOR_SYMBOLS","U_LETTERLIKE_SYMBOLS",
97de76a5adSDamjan Jovanovic         "U_NUMBER_FORMS","U_ARROWS","U_MATHEMATICAL_OPERATORS","U_MISCELLANEOUS_TECHNICAL",
98de76a5adSDamjan Jovanovic         "U_CONTROL_PICTURES","U_OPTICAL_CHARACTER_RECOGNITION","U_ENCLOSED_ALPHANUMERICS",
99de76a5adSDamjan Jovanovic         "U_BOX_DRAWING","U_BLOCK_ELEMENTS","U_GEOMETRIC_SHAPES","U_MISCELLANEOUS_SYMBOLS",
100de76a5adSDamjan Jovanovic         "U_DINGBATS","U_BRAILLE_PATTERNS","U_CJK_RADICALS_SUPPLEMENT","U_KANGXI_RADICALS",
101de76a5adSDamjan Jovanovic         "U_IDEOGRAPHIC_DESCRIPTION_CHARACTERS","U_CJK_SYMBOLS_AND_PUNCTUATION",
102de76a5adSDamjan Jovanovic         "U_HIRAGANA","U_KATAKANA","U_BOPOMOFO","U_HANGUL_COMPATIBILITY_JAMO","U_KANBUN",
103de76a5adSDamjan Jovanovic         "U_BOPOMOFO_EXTENDED","U_ENCLOSED_CJK_LETTERS_AND_MONTHS","U_CJK_COMPATIBILITY",
104de76a5adSDamjan Jovanovic         "U_CJK_UNIFIED_IDEOGRAPHS_EXTENSION_A","U_CJK_UNIFIED_IDEOGRAPHS","U_YI_SYLLABLES",
105de76a5adSDamjan Jovanovic         "U_YI_RADICALS","U_HANGUL_SYLLABLES","U_HIGH_SURROGATES","U_HIGH_PRIVATE_USE_SURROGATES",
106de76a5adSDamjan Jovanovic         "U_LOW_SURROGATES","U_PRIVATE_USE_AREA","U_CJK_COMPATIBILITY_IDEOGRAPHS",
107de76a5adSDamjan Jovanovic         "U_ALPHABETIC_PRESENTATION_FORMS","U_ARABIC_PRESENTATION_FORMS_A","U_COMBINING_HALF_MARKS",
108de76a5adSDamjan Jovanovic         "U_CJK_COMPATIBILITY_FORMS","U_SMALL_FORM_VARIANTS","U_ARABIC_PRESENTATION_FORMS_B",
109de76a5adSDamjan Jovanovic         "U_SPECIALS","U_HALFWIDTH_AND_FULLWIDTH_FORMS","U_CHAR_SCRIPT_COUNT","U_NO_SCRIPT"};
110de76a5adSDamjan Jovanovic 
1112f709283SDamjan Jovanovic     // setup and close connections
1122f709283SDamjan Jovanovic     @BeforeClass
setUpConnection()1132f709283SDamjan Jovanovic     public static void setUpConnection() throws Exception
1142f709283SDamjan Jovanovic     {
1152f709283SDamjan Jovanovic         app.start();
1162f709283SDamjan Jovanovic     }
1172f709283SDamjan Jovanovic 
1182f709283SDamjan Jovanovic     @AfterClass
tearDownConnection()1192f709283SDamjan Jovanovic     public static void tearDownConnection() throws InterruptedException, com.sun.star.uno.Exception
1202f709283SDamjan Jovanovic     {
1212f709283SDamjan Jovanovic         app.close();
1222f709283SDamjan Jovanovic     }
1232f709283SDamjan Jovanovic 
1242f709283SDamjan Jovanovic     @Before
before()1252f709283SDamjan Jovanovic     public void before() throws Exception {
1262f709283SDamjan Jovanovic         xContext = app.getComponentContext();
1272f709283SDamjan Jovanovic         oObj = UnoRuntime.queryInterface(
1282f709283SDamjan Jovanovic             XCharacterClassification.class,
1292f709283SDamjan Jovanovic             xContext.getServiceManager().createInstanceWithContext("com.sun.star.i18n.CharacterClassification", xContext)
1302f709283SDamjan Jovanovic         );
1312f709283SDamjan Jovanovic     }
1322f709283SDamjan Jovanovic 
133de76a5adSDamjan Jovanovic     /**
134de76a5adSDamjan Jovanovic     * Test calls the method for different locales. Then each result is compared
135de76a5adSDamjan Jovanovic     * with a string, converted to a upper case using
136de76a5adSDamjan Jovanovic     * <code>java.lang.String</code> method <code>toUpperCase()</code>.<p>
137de76a5adSDamjan Jovanovic     * Has <b> OK </b> status if string, returned by the method is equal to
138de76a5adSDamjan Jovanovic     * a string that is returned by String.toUpperCase() for all locales.
139de76a5adSDamjan Jovanovic     */
1402f709283SDamjan Jovanovic     @Test
_toUpper()141de76a5adSDamjan Jovanovic     public void _toUpper() {
142de76a5adSDamjan Jovanovic         boolean res = true;
143de76a5adSDamjan Jovanovic         char[] characters = new char[]{586,65,97,498,721,4588,772,8413,3404};
144de76a5adSDamjan Jovanovic         String toCheck = new String(characters);
145de76a5adSDamjan Jovanovic         String get = "";
146de76a5adSDamjan Jovanovic         String exp = "";
147de76a5adSDamjan Jovanovic 
148de76a5adSDamjan Jovanovic         for (int i=0;i<7;i++) {
149de76a5adSDamjan Jovanovic             get = oObj.toUpper(toCheck, 0, toCheck.length(), getLocale(i));
150de76a5adSDamjan Jovanovic             exp = toCheck.toUpperCase(
151de76a5adSDamjan Jovanovic                 new java.util.Locale(languages[i], countries[i]));
152de76a5adSDamjan Jovanovic             res &= get.equals(exp);
153de76a5adSDamjan Jovanovic             if (!res) {
1542f709283SDamjan Jovanovic                 System.out.println("FAILED for: language=" + languages[i] +
155de76a5adSDamjan Jovanovic                     " ; country=" + countries[i]);
1562f709283SDamjan Jovanovic                 System.out.println("Expected: " + exp);
1572f709283SDamjan Jovanovic                 System.out.println("Gained : " + get);
158de76a5adSDamjan Jovanovic             }
159de76a5adSDamjan Jovanovic         }
1602f709283SDamjan Jovanovic         Assert.assertTrue("toUpper()", res);
161de76a5adSDamjan Jovanovic     }
162de76a5adSDamjan Jovanovic 
163de76a5adSDamjan Jovanovic     /**
164de76a5adSDamjan Jovanovic     * Test calls the method for different locales. Then each result is compared
165de76a5adSDamjan Jovanovic     * with a string, converted to a lower case using
166de76a5adSDamjan Jovanovic     * <code>java.lang.String</code> method <code>toLowerCase()</code>.<p>
167de76a5adSDamjan Jovanovic     * Has <b> OK </b> status if string, returned by the method is equal to
168de76a5adSDamjan Jovanovic     * a string that is returned by String.toLowerCase() for all locales.
169de76a5adSDamjan Jovanovic     */
1702f709283SDamjan Jovanovic     @Test
171*daf711bfSDamjan Jovanovic     @Ignore("Bug #87590 Incorrect casing for U+026A, U+0268, U+0197...")
_toLower()172de76a5adSDamjan Jovanovic     public void _toLower() {
173de76a5adSDamjan Jovanovic         boolean res = true;
174de76a5adSDamjan Jovanovic         char[] characters = new char[]{586,65,97,498,721,4588,772,8413,3404};
175de76a5adSDamjan Jovanovic         String toCheck = new String(characters);
176de76a5adSDamjan Jovanovic         String get = "";
177de76a5adSDamjan Jovanovic         String exp = "";
178de76a5adSDamjan Jovanovic 
179de76a5adSDamjan Jovanovic         for (int i=0;i<7;i++) {
180de76a5adSDamjan Jovanovic             get = oObj.toLower(toCheck,0,toCheck.length(),getLocale(i));
181de76a5adSDamjan Jovanovic             exp = toCheck.toLowerCase(
182de76a5adSDamjan Jovanovic                 new java.util.Locale(languages[i],countries[i]));
183de76a5adSDamjan Jovanovic             res &= get.equals(exp);
184de76a5adSDamjan Jovanovic             if (!res) {
1852f709283SDamjan Jovanovic                 System.out.println("FAILED for: language=" + languages[i]
186de76a5adSDamjan Jovanovic                     + " ; country=" + countries[i]);
1872f709283SDamjan Jovanovic                 System.out.println("Expected: " + exp);
1882f709283SDamjan Jovanovic                 System.out.println("Gained : " + get);
189de76a5adSDamjan Jovanovic             }
190de76a5adSDamjan Jovanovic         }
1912f709283SDamjan Jovanovic         Assert.assertTrue("toLower()", res);
192de76a5adSDamjan Jovanovic     }
193de76a5adSDamjan Jovanovic 
194de76a5adSDamjan Jovanovic     /**
195de76a5adSDamjan Jovanovic     * Test calls the method for different locales. Then each result is compared
196de76a5adSDamjan Jovanovic     * with a string, converted to a title case using
197de76a5adSDamjan Jovanovic     * <code>java.lang.Character</code> method <code>toTitleCase()</code>.<p>
198de76a5adSDamjan Jovanovic     * Has <b> OK </b> status if string, returned by the method is equal to
199de76a5adSDamjan Jovanovic     * a string that was converted using Character.toTitleCase() for all locales.
200de76a5adSDamjan Jovanovic     */
2012f709283SDamjan Jovanovic     @Test
_toTitle()202de76a5adSDamjan Jovanovic     public void _toTitle() {
203de76a5adSDamjan Jovanovic         boolean res = true;
204de76a5adSDamjan Jovanovic         String toCheck = new String(new char[]{8112});
205de76a5adSDamjan Jovanovic         String get = "";
206de76a5adSDamjan Jovanovic         String exp = "";
207de76a5adSDamjan Jovanovic 
208de76a5adSDamjan Jovanovic         for (int i=0;i<7;i++) {
209de76a5adSDamjan Jovanovic             get = oObj.toTitle(toCheck, 0, 1, getLocale(i));
210de76a5adSDamjan Jovanovic             exp = new String(
211de76a5adSDamjan Jovanovic                 new char[]{Character.toTitleCase(toCheck.toCharArray()[0])});
212de76a5adSDamjan Jovanovic             res &= get.equals(exp);
213de76a5adSDamjan Jovanovic             if (!res) {
2142f709283SDamjan Jovanovic                 System.out.println("FAILED for: language=" + languages[i]
215de76a5adSDamjan Jovanovic                     + " ; country=" + countries[i]);
2162f709283SDamjan Jovanovic                 System.out.println("Expected: " + exp);
2172f709283SDamjan Jovanovic                 System.out.println("Gained : " + get);
218de76a5adSDamjan Jovanovic             }
219de76a5adSDamjan Jovanovic         }
2202f709283SDamjan Jovanovic         Assert.assertTrue("toTitle()", res);
221de76a5adSDamjan Jovanovic     }
222de76a5adSDamjan Jovanovic 
223de76a5adSDamjan Jovanovic     /**
224de76a5adSDamjan Jovanovic     * At first we define <code>int[]</code> and <code>char[]</code> arrays of
225de76a5adSDamjan Jovanovic     * unicode symbol numbers, arranged as sequences, where symbols are sorted
226de76a5adSDamjan Jovanovic     * by type, so the character of <code>i<sup><small>th</small></sup></code>
227de76a5adSDamjan Jovanovic     * type is located on <code>i<sup><small>th</small></sup></code> position.<p>
228de76a5adSDamjan Jovanovic     * Has <b> OK </b> status if for all 30 types the method returns value, that
229de76a5adSDamjan Jovanovic     * is equal to an element number.<p>
230de76a5adSDamjan Jovanovic     * @see com.sun.star.i18n.CharType
231de76a5adSDamjan Jovanovic     */
2322f709283SDamjan Jovanovic     @Test
_getType()233de76a5adSDamjan Jovanovic     public void _getType() {
234de76a5adSDamjan Jovanovic         boolean res = true;
23524ef62edSDamjan Jovanovic         // If or when this list gets out of date again,
23624ef62edSDamjan Jovanovic         // find new characters of the required type with:
23724ef62edSDamjan Jovanovic         // for (int i = 30; i <= 0xffff; i++) {
23824ef62edSDamjan Jovanovic         //     String s = new String("" + (char)i);
23924ef62edSDamjan Jovanovic         //     int type = oObj.getType(s, 0);
24024ef62edSDamjan Jovanovic         //     System.out.println("character " + i + " has type " + charstyles_office[type]);
24124ef62edSDamjan Jovanovic         // }
24224ef62edSDamjan Jovanovic         char[] characters = new char[]{888,65,97,498,721,4588,772,8413,3404,
24324ef62edSDamjan Jovanovic             48,8544,179,32,8232,8233,144,8204,57344,56320,45,40,41,95,3852,247,
244de76a5adSDamjan Jovanovic             3647,901,3896,171,187};
245de76a5adSDamjan Jovanovic         String toCheck = new String(characters);
246de76a5adSDamjan Jovanovic 
247de76a5adSDamjan Jovanovic         for (int i=0;i<characters.length;i++) {
248de76a5adSDamjan Jovanovic             int get = oObj.getType(toCheck, i);
249de76a5adSDamjan Jovanovic             res &= (charstyles_office[get] == charstyles_office[i]);
250de76a5adSDamjan Jovanovic             if (!res) {
25124ef62edSDamjan Jovanovic                 System.out.println("Code: " + Integer.toHexString((int)characters[i]));
2522f709283SDamjan Jovanovic                 System.out.println("Gained: " + charstyles_office[get]);
2532f709283SDamjan Jovanovic                 System.out.println("Expected: " + charstyles_office[i]);
254de76a5adSDamjan Jovanovic             }
255de76a5adSDamjan Jovanovic         }
2562f709283SDamjan Jovanovic         Assert.assertTrue("getType()", res);
257de76a5adSDamjan Jovanovic     }
258de76a5adSDamjan Jovanovic 
259de76a5adSDamjan Jovanovic     /**
260de76a5adSDamjan Jovanovic     * After defining string to be checked and array of expected types, test
261de76a5adSDamjan Jovanovic     * calls the method for each character of a string and for all locales.<p>
262de76a5adSDamjan Jovanovic     * Has <b> OK </b> status if the method returns type, expected for a given
263de76a5adSDamjan Jovanovic     * character and locale.
264de76a5adSDamjan Jovanovic     */
2652f709283SDamjan Jovanovic     @Test
_getCharacterType()266de76a5adSDamjan Jovanovic     public void _getCharacterType() {
267de76a5adSDamjan Jovanovic         boolean res = true;
2685c977050SDamjan Jovanovic         // If or when this list gets out of date again,
2695c977050SDamjan Jovanovic         // find new characters of the required type with:
2705c977050SDamjan Jovanovic         //for (int i = 32; i <= 0xffff; i++) {
2715c977050SDamjan Jovanovic         //    int charType = oObj.getCharacterType("" + (char)i, 0, getLocale(1));
2725c977050SDamjan Jovanovic         //    if (charType == 32) {
2735c977050SDamjan Jovanovic         //        System.out.println("character " + i + " has type 32");
2745c977050SDamjan Jovanovic         //    }
2755c977050SDamjan Jovanovic         //}
2765c977050SDamjan Jovanovic         String toCheck = "Ab0*";
277de76a5adSDamjan Jovanovic         int[] expected = new int[]{226,228,97,32};
278de76a5adSDamjan Jovanovic 
279de76a5adSDamjan Jovanovic         for (int i=0;i<toCheck.length();i++) {
280de76a5adSDamjan Jovanovic             for (int j=1;j<7;j++) {
281de76a5adSDamjan Jovanovic                 int get = oObj.getCharacterType(toCheck, i, getLocale(j));
282de76a5adSDamjan Jovanovic                 res &= (get == expected[i]);
283de76a5adSDamjan Jovanovic                 if (!res) {
2842f709283SDamjan Jovanovic                     System.out.println("FAILED for: language=" + languages[j] +
285de76a5adSDamjan Jovanovic                         " ; country=" + countries[j]);
2868619c510SDamjan Jovanovic                     System.out.println("Symbol: " + toCheck.toCharArray()[i]);
2872f709283SDamjan Jovanovic                     System.out.println("Gained: " + get);
2882f709283SDamjan Jovanovic                     System.out.println("Expected: " + expected[i]);
289de76a5adSDamjan Jovanovic                 }
290de76a5adSDamjan Jovanovic             }
291de76a5adSDamjan Jovanovic         }
2922f709283SDamjan Jovanovic         Assert.assertTrue("getCharacterType()", res);
293de76a5adSDamjan Jovanovic     }
294de76a5adSDamjan Jovanovic 
295de76a5adSDamjan Jovanovic     /**
296de76a5adSDamjan Jovanovic     * After defining array of strings to be checked and array of expected types,
297de76a5adSDamjan Jovanovic     * test calls the method for each string of an array and for all locales.<p>
298de76a5adSDamjan Jovanovic     * Has <b> OK </b> status if the method returns type, expected for a given
299de76a5adSDamjan Jovanovic     * string and locale.
300de76a5adSDamjan Jovanovic     */
3012f709283SDamjan Jovanovic     @Test
_getStringType()302de76a5adSDamjan Jovanovic     public void _getStringType() {
303de76a5adSDamjan Jovanovic         boolean res = true;
304de76a5adSDamjan Jovanovic         String[] toCheck = new String[]{"01234","AAAAA","bbbbb","AA()bb"};
305de76a5adSDamjan Jovanovic         int[] exp = new int[]{97,226,228,230};
306de76a5adSDamjan Jovanovic 
307de76a5adSDamjan Jovanovic         for (int j=0;j<toCheck.length;j++) {
308de76a5adSDamjan Jovanovic             for (int i=0;i<7;i++) {
309de76a5adSDamjan Jovanovic                 int get = oObj.getStringType(toCheck[j], 0,
310de76a5adSDamjan Jovanovic                     toCheck[j].length(), getLocale(i));
311de76a5adSDamjan Jovanovic                 res &= (get == exp[j]);
312de76a5adSDamjan Jovanovic                 if (!res) {
3132f709283SDamjan Jovanovic                     System.out.println("FAILED for: language=" + languages[i] +
314de76a5adSDamjan Jovanovic                         " ; country=" + countries[i]);
3152f709283SDamjan Jovanovic                     System.out.println("Expected: " + exp[j]);
3162f709283SDamjan Jovanovic                     System.out.println("Gained : " + get);
317de76a5adSDamjan Jovanovic                 }
318de76a5adSDamjan Jovanovic             }
319de76a5adSDamjan Jovanovic         }
3202f709283SDamjan Jovanovic         Assert.assertTrue("getStringType()", res);
321de76a5adSDamjan Jovanovic     }
322de76a5adSDamjan Jovanovic 
323de76a5adSDamjan Jovanovic     /**
324de76a5adSDamjan Jovanovic     * After string to be checked is initialized (all symbols are sorted
325de76a5adSDamjan Jovanovic     * by direction, so the character of <code>i<sup><small>th</small></sup></code>
326de76a5adSDamjan Jovanovic     * direction is located on <code>i<sup><small>th</small></sup></code>
327de76a5adSDamjan Jovanovic     * position), test calls the method for every character of that string. <p>
328de76a5adSDamjan Jovanovic     * Has <b> OK </b> status if the method returns direction, that's equal to
329de76a5adSDamjan Jovanovic     * a symbol position in the string.
330de76a5adSDamjan Jovanovic     */
3312f709283SDamjan Jovanovic     @Test
_getCharacterDirection()332de76a5adSDamjan Jovanovic     public void _getCharacterDirection() {
333de76a5adSDamjan Jovanovic         boolean res = true;
334cc5c65fbSDamjan Jovanovic         String toCheck = new String(new char[]{65,1470,48,43,35,1632,44,10,
335de76a5adSDamjan Jovanovic                                 9,12,33,8234,8237,1563,8235,8238,8236,768,1});
336de76a5adSDamjan Jovanovic         for (short i=0;i<19;i++) {
337de76a5adSDamjan Jovanovic             short get = oObj.getCharacterDirection(toCheck, i);
338de76a5adSDamjan Jovanovic             res &= (get == i);
339de76a5adSDamjan Jovanovic             if (!res) {
3402f709283SDamjan Jovanovic                 System.out.println("Code :" + toCheck.toCharArray()[i]);
3412f709283SDamjan Jovanovic                 System.out.println("Gained: " + get);
3422f709283SDamjan Jovanovic                 System.out.println("Expected: " + i);
343de76a5adSDamjan Jovanovic             }
344de76a5adSDamjan Jovanovic         }
3452f709283SDamjan Jovanovic         Assert.assertTrue("getCharacterDirection()", res);
346de76a5adSDamjan Jovanovic     }
347de76a5adSDamjan Jovanovic 
348de76a5adSDamjan Jovanovic     /**
349de76a5adSDamjan Jovanovic     * At first we define <code>int[]</code> and <code>char[]</code> arrays of
350de76a5adSDamjan Jovanovic     * unicode symbol numbers, arranged as sequences, where symbols are sorted
351de76a5adSDamjan Jovanovic     * by type, so the character of <code>i<sup><small>th</small></sup></code>
352de76a5adSDamjan Jovanovic     * type is located on <code>i<sup><small>th</small></sup></code> position.<p>
353de76a5adSDamjan Jovanovic     * Has <b> OK </b> status if for each character method returns value, that
354de76a5adSDamjan Jovanovic     * is equal to a number where element is located in array. Also method has
355de76a5adSDamjan Jovanovic     * <b> OK </b> status for symbol with code 55296, because it doesn't work
356de76a5adSDamjan Jovanovic     * since it hasn't the right neighborhood.<p>
357de76a5adSDamjan Jovanovic     * @see "http://ppewww.ph.gla.ac.uk/~flavell/unicode/unidata.html"
358de76a5adSDamjan Jovanovic     */
3592f709283SDamjan Jovanovic     @Test
_getScript()360de76a5adSDamjan Jovanovic     public void _getScript() {
361de76a5adSDamjan Jovanovic         boolean res = true;
362de76a5adSDamjan Jovanovic         char[] characters = new char[]{65,128,256,384,592,750,773,924,1030,1331,1448,
363de76a5adSDamjan Jovanovic             1569,1792,1936,2313,2465,2570,2707,2822,2972,3079,3240,3337,3464,3590,
364de76a5adSDamjan Jovanovic             3745,3906,4097,4274,4357,4621,5040,5200,5776,5806,6030,6155,7683,7943,
365de76a5adSDamjan Jovanovic             8202,8319,8352,8413,8452,8545,8616,8715,8965,9217,9281,9336,9474,9608,9719,
366de76a5adSDamjan Jovanovic             9734,9999,10247,11911,12034,12274,12294,12358,12456,12552,12605,12688,12727,
367de76a5adSDamjan Jovanovic             12806,13065,13312,19968,40964,42152,44032,55296,56192,56320,57344,63744,
368de76a5adSDamjan Jovanovic             64257,64370,65056,65073,65131,65146,65532,65288};
369de76a5adSDamjan Jovanovic         String toCheck = new String(characters);
370de76a5adSDamjan Jovanovic 
371de76a5adSDamjan Jovanovic         for (int i=0;i<characters.length;i++) {
372de76a5adSDamjan Jovanovic             int get = oObj.getScript(toCheck, i);
373de76a5adSDamjan Jovanovic             //The HIGH_SURROGATE 55296 doesn't work since it hasn't the right
37407b05676SDamjan Jovanovic             //neighborhood. Neither does 56192 - it combines with 55296 into another code point.
37507b05676SDamjan Jovanovic             if (toCheck.charAt(i) != 55296 && toCheck.charAt(i) != 56192) {
37607b05676SDamjan Jovanovic                 res &= (get == i);
37707b05676SDamjan Jovanovic             }
378de76a5adSDamjan Jovanovic             if (!res) {
3792f709283SDamjan Jovanovic                 System.out.println("-- " + toCheck.substring(i, i + 1).hashCode());
38007b05676SDamjan Jovanovic                 System.out.println("Code: " + Integer.toHexString((int)characters[i]));
38107b05676SDamjan Jovanovic                 System.out.println("Gained: " + get + " (" + (0 <= get && get < unicode_script.length ? unicode_script[get] : "out of range") + ")");
3822f709283SDamjan Jovanovic                 System.out.println("Expected: " + unicode_script[i]);
383de76a5adSDamjan Jovanovic             }
384de76a5adSDamjan Jovanovic         }
3852f709283SDamjan Jovanovic         Assert.assertTrue("getScript()", res);
386de76a5adSDamjan Jovanovic     }
387de76a5adSDamjan Jovanovic 
388de76a5adSDamjan Jovanovic     /**
389de76a5adSDamjan Jovanovic     * After defining a string to be parsed and parse conditions (flags), test
390de76a5adSDamjan Jovanovic     * calls the method for different locales three times with different parameters,
391de76a5adSDamjan Jovanovic     * checking result after every call.  <p>
392de76a5adSDamjan Jovanovic     * Has <b> OK </b> status if the method returns right results all three
393de76a5adSDamjan Jovanovic     * times.
394de76a5adSDamjan Jovanovic     */
3952f709283SDamjan Jovanovic     @Test
_parseAnyToken()396de76a5adSDamjan Jovanovic     public void _parseAnyToken() {
397de76a5adSDamjan Jovanovic         int nStartFlags = KParseTokens.ANY_ALPHA | KParseTokens.ASC_UNDERSCORE;
398de76a5adSDamjan Jovanovic         int nContFlags = KParseTokens.ANY_ALNUM | KParseTokens.ASC_UNDERSCORE
399de76a5adSDamjan Jovanovic                         | KParseTokens.ASC_DOT;
400de76a5adSDamjan Jovanovic         String toCheck = " 18 i18n ^";
401de76a5adSDamjan Jovanovic         ParseResult pRes = null;
402de76a5adSDamjan Jovanovic         boolean res = true;
403de76a5adSDamjan Jovanovic 
404de76a5adSDamjan Jovanovic         for (int i=0;i<7;i++) {
405de76a5adSDamjan Jovanovic             pRes = oObj.parseAnyToken(toCheck, 1, getLocale(i),
406de76a5adSDamjan Jovanovic                 nStartFlags, "", nContFlags, "");
407de76a5adSDamjan Jovanovic             res = ( (pRes.CharLen==2)
408de76a5adSDamjan Jovanovic                  && (pRes.TokenType==32)
409de76a5adSDamjan Jovanovic                  && (pRes.Value==18.0) );
410de76a5adSDamjan Jovanovic             pRes = oObj.parseAnyToken(toCheck, 4, getLocale(i),
411de76a5adSDamjan Jovanovic                 nStartFlags, "", nContFlags, "");
412de76a5adSDamjan Jovanovic             res &= ( (pRes.CharLen==4)
413de76a5adSDamjan Jovanovic                   && (pRes.TokenType==4)
414de76a5adSDamjan Jovanovic                   && (pRes.Value==0.0) );
415de76a5adSDamjan Jovanovic             pRes = oObj.parseAnyToken(toCheck, 9, getLocale(i),
416de76a5adSDamjan Jovanovic                 nStartFlags, "", nContFlags, "");
417de76a5adSDamjan Jovanovic             res &= ( (pRes.CharLen==1)
418de76a5adSDamjan Jovanovic                   && (pRes.TokenType==1)
419de76a5adSDamjan Jovanovic                   && (pRes.Value==0.0) );
420de76a5adSDamjan Jovanovic         }
4212f709283SDamjan Jovanovic         Assert.assertTrue("parseAnyToken()", res);
422de76a5adSDamjan Jovanovic     }
423de76a5adSDamjan Jovanovic 
424de76a5adSDamjan Jovanovic     /**
425de76a5adSDamjan Jovanovic     * After defining a string to be parsed and parse conditions (flags), test
426de76a5adSDamjan Jovanovic     * calls the method for different locales two times with different parameters,
427de76a5adSDamjan Jovanovic     * checking result after every call. <p>
428de76a5adSDamjan Jovanovic     * Has <b> OK </b> status if the method returns right results.
429de76a5adSDamjan Jovanovic     */
4302f709283SDamjan Jovanovic     @Test
_parsePredefinedToken()431de76a5adSDamjan Jovanovic     public void _parsePredefinedToken() {
432de76a5adSDamjan Jovanovic         int nStartFlags = KParseTokens.ANY_ALPHA | KParseTokens.ASC_UNDERSCORE;
433de76a5adSDamjan Jovanovic         int nContFlags = nStartFlags;
434de76a5adSDamjan Jovanovic         String toCheck = " 18 int";
435de76a5adSDamjan Jovanovic         ParseResult pRes = null;
436de76a5adSDamjan Jovanovic         boolean res = true;
437de76a5adSDamjan Jovanovic 
438de76a5adSDamjan Jovanovic         for (int i=0;i<7;i++) {
439de76a5adSDamjan Jovanovic             pRes = oObj.parsePredefinedToken(KParseType.IDENTNAME, toCheck,
440de76a5adSDamjan Jovanovic                 1, getLocale(i), nStartFlags, "", nContFlags, "");
441de76a5adSDamjan Jovanovic             res = (pRes.CharLen==0);
442de76a5adSDamjan Jovanovic             pRes = oObj.parsePredefinedToken(KParseType.IDENTNAME, toCheck,
443de76a5adSDamjan Jovanovic                 4, getLocale(i), nStartFlags, "", nContFlags, "");
444de76a5adSDamjan Jovanovic             res &= ( (pRes.CharLen==3)
445de76a5adSDamjan Jovanovic                   && (pRes.TokenType==4)
446de76a5adSDamjan Jovanovic                   && (pRes.Value==0.0) );
447de76a5adSDamjan Jovanovic         }
4482f709283SDamjan Jovanovic         Assert.assertTrue("parsePredefinedToken()", res);
449de76a5adSDamjan Jovanovic     }
450de76a5adSDamjan Jovanovic 
451de76a5adSDamjan Jovanovic 
452de76a5adSDamjan Jovanovic     /**
453de76a5adSDamjan Jovanovic     * Method returns locale for a given language and country.
454de76a5adSDamjan Jovanovic     * @param k index of needed locale.
455de76a5adSDamjan Jovanovic     */
getLocale(int k)456de76a5adSDamjan Jovanovic     private Locale getLocale(int k) {
457de76a5adSDamjan Jovanovic         return new Locale(languages[k],countries[k],"");
458de76a5adSDamjan Jovanovic     }
459de76a5adSDamjan Jovanovic 
460de76a5adSDamjan Jovanovic 
461de76a5adSDamjan Jovanovic } // end XCharacterClassification
462