1 // © 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4  *******************************************************************************
5  * Copyright (C) 1998-2004, International Business Machines Corporation and    *
6  * others. All Rights Reserved.                                                *
7  *******************************************************************************
8  *
9  * Created on Dec 3, 2003
10  *
11  *******************************************************************************
12  */
13 package com.ibm.icu.dev.tool.layout;
14 
15 import com.ibm.icu.lang.UCharacter;
16 import com.ibm.icu.lang.UProperty;
17 import com.ibm.icu.text.Normalizer;
18 import com.ibm.icu.text.UnicodeSet;
19 
20 public class ArabicCharacterData
21 {
22     public class Record
23     {
getCodePoint()24         public int getCodePoint()
25         {
26             return codePoint;
27         }
28 
getGeneralCategory()29         public int getGeneralCategory()
30         {
31             return generalCategory;
32         }
33 
getDecompositionType()34         public int getDecompositionType()
35         {
36             return decompositionType;
37         }
38 
getDecomposition()39         public String getDecomposition()
40         {
41             return decomposition;
42         }
43 
Record(int character)44         private Record(int character)
45         {
46             codePoint         = character;
47             generalCategory   = UCharacter.getType(character);
48             decompositionType = UCharacter.getIntPropertyValue(character, UProperty.DECOMPOSITION_TYPE);
49 
50             switch (decompositionType) {
51             case UCharacter.DecompositionType.FINAL:
52             case UCharacter.DecompositionType.INITIAL:
53             case UCharacter.DecompositionType.ISOLATED:
54             case UCharacter.DecompositionType.MEDIAL:
55                 decomposition = Normalizer.compose(UCharacter.toString(character), true);
56                 break;
57 
58             case UCharacter.DecompositionType.CANONICAL:
59                 decomposition = Normalizer.decompose(UCharacter.toString(character), true);
60                 break;
61 
62             default:
63                 decomposition = null;
64             }
65         }
66 
67         private int codePoint;
68         private int generalCategory;
69         private int decompositionType;
70         private String decomposition;
71     }
72 
ArabicCharacterData(int charCount)73     private ArabicCharacterData(int charCount)
74     {
75         records = new Record[charCount];
76     }
77 
add(int character)78     private void add(int character)
79     {
80         records[recordIndex++] = new Record(character);
81     }
82 
getRecord(int index)83     public Record getRecord(int index)
84     {
85         if (index < 0 || index >= records.length) {
86             return null;
87         }
88 
89         return records[index];
90     }
91 
countRecords()92     public int countRecords()
93     {
94         return records.length;
95     }
96 
97     // TODO: do we need to change this to use UnicodeSetIterator?
98     // That will mean not knowing the number of characters until
99     // after the iteration is done, so we'd have to use a vector
100     // to hold the Records at first and copy it to an array
101     // when we're done...
factory(UnicodeSet characterSet)102     public static ArabicCharacterData factory(UnicodeSet characterSet)
103     {
104         int charCount = characterSet.size();
105         ArabicCharacterData data = new ArabicCharacterData(charCount);
106 
107         for (int i = 0; i < charCount; i += 1) {
108             data.add(characterSet.charAt(i));
109         }
110 
111         return data;
112     }
113 
114     private Record[] records;
115     private int recordIndex = 0;
116 }
117