1 /*
2  *******************************************************************************
3  *
4  *   Copyright (C) 2004-2014, International Business Machines
5  *   Corporation and others.  All Rights Reserved.
6  *
7  *******************************************************************************
8  *   file name:  UBiDiProps.java
9  *   encoding:   US-ASCII
10  *   tab size:   8 (not used)
11  *   indentation:4
12  *
13  *   created on: 2005jan16
14  *   created by: Markus W. Scherer
15  *
16  *   Low-level Unicode bidi/shaping properties access.
17  *   Java port of ubidi_props.h/.c.
18  */
19 
20 package com.ibm.icu.impl;
21 
22 import java.io.IOException;
23 import java.nio.ByteBuffer;
24 import java.util.Iterator;
25 
26 import com.ibm.icu.lang.UCharacter;
27 import com.ibm.icu.lang.UProperty;
28 import com.ibm.icu.text.UnicodeSet;
29 import com.ibm.icu.util.ICUUncheckedIOException;
30 
31 public final class UBiDiProps {
32     // constructors etc. --------------------------------------------------- ***
33 
34     // port of ubidi_openProps()
UBiDiProps()35     private UBiDiProps() throws IOException{
36         ByteBuffer bytes=ICUBinary.getData(DATA_FILE_NAME);
37         readData(bytes);
38     }
39 
readData(ByteBuffer bytes)40     private void readData(ByteBuffer bytes) throws IOException {
41         // read the header
42         ICUBinary.readHeader(bytes, FMT, new IsAcceptable());
43 
44         // read indexes[]
45         int i, count;
46         count=bytes.getInt();
47         if(count<IX_TOP) {
48             throw new IOException("indexes[0] too small in "+DATA_FILE_NAME);
49         }
50         indexes=new int[count];
51 
52         indexes[0]=count;
53         for(i=1; i<count; ++i) {
54             indexes[i]=bytes.getInt();
55         }
56 
57         // read the trie
58         trie=Trie2_16.createFromSerialized(bytes);
59         int expectedTrieLength=indexes[IX_TRIE_SIZE];
60         int trieLength=trie.getSerializedLength();
61         if(trieLength>expectedTrieLength) {
62             throw new IOException(DATA_FILE_NAME+": not enough bytes for the trie");
63         }
64         // skip padding after trie bytes
65         ICUBinary.skipBytes(bytes, expectedTrieLength-trieLength);
66 
67         // read mirrors[]
68         count=indexes[IX_MIRROR_LENGTH];
69         if(count>0) {
70             mirrors=new int[count];
71             for(i=0; i<count; ++i) {
72                 mirrors[i]=bytes.getInt();
73             }
74         }
75 
76         // read jgArray[]
77         count=indexes[IX_JG_LIMIT]-indexes[IX_JG_START];
78         jgArray=new byte[count];
79         for(i=0; i<count; ++i) {
80             jgArray[i]=bytes.get();
81         }
82 
83         // read jgArray2[]
84         count=indexes[IX_JG_LIMIT2]-indexes[IX_JG_START2];
85         jgArray2=new byte[count];
86         for(i=0; i<count; ++i) {
87             jgArray2[i]=bytes.get();
88         }
89     }
90 
91     // implement ICUBinary.Authenticate
92     private final static class IsAcceptable implements ICUBinary.Authenticate {
isDataVersionAcceptable(byte version[])93         public boolean isDataVersionAcceptable(byte version[]) {
94             return version[0]==2;
95         }
96     }
97 
98     // set of property starts for UnicodeSet ------------------------------- ***
99 
addPropertyStarts(UnicodeSet set)100     public final void addPropertyStarts(UnicodeSet set) {
101         int i, length;
102         int c, start, limit;
103 
104         byte prev, jg;
105 
106         /* add the start code point of each same-value range of the trie */
107         Iterator<Trie2.Range> trieIterator=trie.iterator();
108         Trie2.Range range;
109         while(trieIterator.hasNext() && !(range=trieIterator.next()).leadSurrogate) {
110             set.add(range.startCodePoint);
111         }
112 
113         /* add the code points from the bidi mirroring table */
114         length=indexes[IX_MIRROR_LENGTH];
115         for(i=0; i<length; ++i) {
116             c=getMirrorCodePoint(mirrors[i]);
117             set.add(c, c+1);
118         }
119 
120         /* add the code points from the Joining_Group array where the value changes */
121         start=indexes[IX_JG_START];
122         limit=indexes[IX_JG_LIMIT];
123         byte[] jga=jgArray;
124         for(;;) {
125             length=limit-start;
126             prev=0;
127             for(i=0; i<length; ++i) {
128                 jg=jga[i];
129                 if(jg!=prev) {
130                     set.add(start);
131                     prev=jg;
132                 }
133                 ++start;
134             }
135             if(prev!=0) {
136                 /* add the limit code point if the last value was not 0 (it is now start==limit) */
137                 set.add(limit);
138             }
139             if(limit==indexes[IX_JG_LIMIT]) {
140                 /* switch to the second Joining_Group range */
141                 start=indexes[IX_JG_START2];
142                 limit=indexes[IX_JG_LIMIT2];
143                 jga=jgArray2;
144             } else {
145                 break;
146             }
147         }
148 
149         /* add code points with hardcoded properties, plus the ones following them */
150 
151         /* (none right now) */
152     }
153 
154     // property access functions ------------------------------------------- ***
155 
getMaxValue(int which)156     public final int getMaxValue(int which) {
157         int max;
158 
159         max=indexes[IX_MAX_VALUES];
160         switch(which) {
161         case UProperty.BIDI_CLASS:
162             return (max&CLASS_MASK);
163         case UProperty.JOINING_GROUP:
164             return (max&MAX_JG_MASK)>>MAX_JG_SHIFT;
165         case UProperty.JOINING_TYPE:
166             return (max&JT_MASK)>>JT_SHIFT;
167         case UProperty.BIDI_PAIRED_BRACKET_TYPE:
168             return (max&BPT_MASK)>>BPT_SHIFT;
169         default:
170             return -1; /* undefined */
171         }
172     }
173 
getClass(int c)174     public final int getClass(int c) {
175         return getClassFromProps(trie.get(c));
176     }
177 
isMirrored(int c)178     public final boolean isMirrored(int c) {
179         return getFlagFromProps(trie.get(c), IS_MIRRORED_SHIFT);
180     }
181 
getMirror(int c, int props)182     private final int getMirror(int c, int props) {
183         int delta=getMirrorDeltaFromProps(props);
184         if(delta!=ESC_MIRROR_DELTA) {
185             return c+delta;
186         } else {
187             /* look for mirror code point in the mirrors[] table */
188             int m;
189             int i, length;
190             int c2;
191 
192             length=indexes[IX_MIRROR_LENGTH];
193 
194             /* linear search */
195             for(i=0; i<length; ++i) {
196                 m=mirrors[i];
197                 c2=getMirrorCodePoint(m);
198                 if(c==c2) {
199                     /* found c, return its mirror code point using the index in m */
200                     return getMirrorCodePoint(mirrors[getMirrorIndex(m)]);
201                 } else if(c<c2) {
202                     break;
203                 }
204             }
205 
206             /* c not found, return it itself */
207             return c;
208         }
209     }
210 
getMirror(int c)211     public final int getMirror(int c) {
212         int props=trie.get(c);
213         return getMirror(c, props);
214     }
215 
isBidiControl(int c)216     public final boolean isBidiControl(int c) {
217         return getFlagFromProps(trie.get(c), BIDI_CONTROL_SHIFT);
218     }
219 
isJoinControl(int c)220     public final boolean isJoinControl(int c) {
221         return getFlagFromProps(trie.get(c), JOIN_CONTROL_SHIFT);
222     }
223 
getJoiningType(int c)224     public final int getJoiningType(int c) {
225         return (trie.get(c)&JT_MASK)>>JT_SHIFT;
226     }
227 
getJoiningGroup(int c)228     public final int getJoiningGroup(int c) {
229         int start, limit;
230 
231         start=indexes[IX_JG_START];
232         limit=indexes[IX_JG_LIMIT];
233         if(start<=c && c<limit) {
234             return (int)jgArray[c-start]&0xff;
235         }
236         start=indexes[IX_JG_START2];
237         limit=indexes[IX_JG_LIMIT2];
238         if(start<=c && c<limit) {
239             return (int)jgArray2[c-start]&0xff;
240         }
241         return UCharacter.JoiningGroup.NO_JOINING_GROUP;
242     }
243 
getPairedBracketType(int c)244     public final int getPairedBracketType(int c) {
245         return (trie.get(c)&BPT_MASK)>>BPT_SHIFT;
246     }
247 
getPairedBracket(int c)248     public final int getPairedBracket(int c) {
249         int props=trie.get(c);
250         if((props&BPT_MASK)==0) {
251             return c;
252         } else {
253             return getMirror(c, props);
254         }
255     }
256 
257     // data members -------------------------------------------------------- ***
258     private int indexes[];
259     private int mirrors[];
260     private byte jgArray[];
261     private byte jgArray2[];
262 
263     private Trie2_16 trie;
264 
265     // data format constants ----------------------------------------------- ***
266     private static final String DATA_NAME="ubidi";
267     private static final String DATA_TYPE="icu";
268     private static final String DATA_FILE_NAME=DATA_NAME+"."+DATA_TYPE;
269 
270     /* format "BiDi" */
271     private static final int FMT=0x42694469;
272 
273     /* indexes into indexes[] */
274     //private static final int IX_INDEX_TOP=0;
275     //private static final int IX_LENGTH=1;
276     private static final int IX_TRIE_SIZE=2;
277     private static final int IX_MIRROR_LENGTH=3;
278 
279     private static final int IX_JG_START=4;
280     private static final int IX_JG_LIMIT=5;
281     private static final int IX_JG_START2=6;  /* new in format version 2.2, ICU 54 */
282     private static final int IX_JG_LIMIT2=7;
283 
284     private static final int IX_MAX_VALUES=15;
285     private static final int IX_TOP=16;
286 
287     // definitions for 16-bit bidi/shaping properties word ----------------- ***
288 
289                           /* CLASS_SHIFT=0, */     /* bidi class: 5 bits (4..0) */
290     private static final int JT_SHIFT=5;           /* joining type: 3 bits (7..5) */
291 
292     private static final int BPT_SHIFT=8;          /* Bidi_Paired_Bracket_Type(bpt): 2 bits (9..8) */
293 
294     private static final int JOIN_CONTROL_SHIFT=10;
295     private static final int BIDI_CONTROL_SHIFT=11;
296 
297     private static final int IS_MIRRORED_SHIFT=12;         /* 'is mirrored' */
298     private static final int MIRROR_DELTA_SHIFT=13;        /* bidi mirroring delta: 3 bits (15..13) */
299 
300     private static final int MAX_JG_SHIFT=16;              /* max JG value in indexes[MAX_VALUES_INDEX] bits 23..16 */
301 
302     private static final int CLASS_MASK=    0x0000001f;
303     private static final int JT_MASK=       0x000000e0;
304     private static final int BPT_MASK=      0x00000300;
305 
306     private static final int MAX_JG_MASK=   0x00ff0000;
307 
getClassFromProps(int props)308     private static final int getClassFromProps(int props) {
309         return props&CLASS_MASK;
310     }
getFlagFromProps(int props, int shift)311     private static final boolean getFlagFromProps(int props, int shift) {
312         return ((props>>shift)&1)!=0;
313     }
getMirrorDeltaFromProps(int props)314     private static final int getMirrorDeltaFromProps(int props) {
315         return (short)props>>MIRROR_DELTA_SHIFT;
316     }
317 
318     private static final int ESC_MIRROR_DELTA=-4;
319     //private static final int MIN_MIRROR_DELTA=-3;
320     //private static final int MAX_MIRROR_DELTA=3;
321 
322     // definitions for 32-bit mirror table entry --------------------------- ***
323 
324     /* the source Unicode code point takes 21 bits (20..0) */
325     private static final int MIRROR_INDEX_SHIFT=21;
326     //private static final int MAX_MIRROR_INDEX=0x7ff;
327 
getMirrorCodePoint(int m)328     private static final int getMirrorCodePoint(int m) {
329         return m&0x1fffff;
330     }
getMirrorIndex(int m)331     private static final int getMirrorIndex(int m) {
332         return m>>>MIRROR_INDEX_SHIFT;
333     }
334 
335 
336     /*
337      * public singleton instance
338      */
339     public static final UBiDiProps INSTANCE;
340 
341     // This static initializer block must be placed after
342     // other static member initialization
343     static {
344         try {
345             INSTANCE = new UBiDiProps();
346         } catch (IOException e) {
347             throw new ICUUncheckedIOException(e);
348         }
349     }
350 }
351