1 /*
2  *
3  * Copyright 2006, The Android Open Source Project
4  *
5  * Licensed under the Apache License, Version 2.0 (the "License");
6  * you may not use this file except in compliance with the License.
7  * You may obtain a copy of the License at
8  *
9  *     http://www.apache.org/licenses/LICENSE-2.0
10  *
11  * Unless required by applicable law or agreed to in writing, software
12  * distributed under the License is distributed on an "AS IS" BASIS,
13  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14  * See the License for the specific language governing permissions and
15  * limitations under the License.
16  */
17 
18 // Old implementation for phone_number_compare(), which has used in cupcake, but once replaced with
19 // the new, more strict version, and reverted again.
20 
21 #include <string.h>
22 
23 namespace android {
24 
25 static int MIN_MATCH = 7;
26 
27 /** True if c is ISO-LATIN characters 0-9 */
isISODigit(char c)28 static bool isISODigit (char c)
29 {
30     return c >= '0' && c <= '9';
31 }
32 
33 /** True if c is ISO-LATIN characters 0-9, *, # , +  */
isNonSeparator(char c)34 static bool isNonSeparator(char c)
35 {
36     return (c >= '0' && c <= '9') || c == '*' || c == '#' || c == '+';
37 }
38 
39 /**
40  * Phone numbers are stored in "lookup" form in the database
41  * as reversed strings to allow for caller ID lookup
42  *
43  * This method takes a phone number and makes a valid SQL "LIKE"
44  * string that will match the lookup form
45  *
46  */
47 /** all of a up to len must be an international prefix or
48  *  separators/non-dialing digits
49  */
matchIntlPrefix(const char * a,int len)50 static bool matchIntlPrefix(const char* a, int len)
51 {
52     /* '([^0-9*#+]\+[^0-9*#+] | [^0-9*#+]0(0|11)[^0-9*#+] )$' */
53     /*        0    1                     2 3 45               */
54 
55     int state = 0;
56     for (int i = 0 ; i < len ; i++) {
57         char c = a[i];
58 
59         switch (state) {
60             case 0:
61                 if      (c == '+') state = 1;
62                 else if (c == '0') state = 2;
63                 else if (isNonSeparator(c)) return false;
64             break;
65 
66             case 2:
67                 if      (c == '0') state = 3;
68                 else if (c == '1') state = 4;
69                 else if (isNonSeparator(c)) return false;
70             break;
71 
72             case 4:
73                 if      (c == '1') state = 5;
74                 else if (isNonSeparator(c)) return false;
75             break;
76 
77             default:
78                 if (isNonSeparator(c)) return false;
79             break;
80 
81         }
82     }
83 
84     return state == 1 || state == 3 || state == 5;
85 }
86 
87 /** all of 'a' up to len must match non-US trunk prefix ('0') */
matchTrunkPrefix(const char * a,int len)88 static bool matchTrunkPrefix(const char* a, int len)
89 {
90     bool found;
91 
92     found = false;
93 
94     for (int i = 0 ; i < len ; i++) {
95         char c = a[i];
96 
97         if (c == '0' && !found) {
98             found = true;
99         } else if (isNonSeparator(c)) {
100             return false;
101         }
102     }
103 
104     return found;
105 }
106 
107 /** all of 'a' up to len must be a (+|00|011)country code)
108  *  We're fast and loose with the country code. Any \d{1,3} matches */
matchIntlPrefixAndCC(const char * a,int len)109 static bool matchIntlPrefixAndCC(const char* a, int len)
110 {
111     /*  [^0-9*#+]*(\+|0(0|11)\d\d?\d? [^0-9*#+] $ */
112     /*      0       1 2 3 45  6 7  8              */
113 
114     int state = 0;
115     for (int i = 0 ; i < len ; i++ ) {
116         char c = a[i];
117 
118         switch (state) {
119             case 0:
120                 if      (c == '+') state = 1;
121                 else if (c == '0') state = 2;
122                 else if (isNonSeparator(c)) return false;
123             break;
124 
125             case 2:
126                 if      (c == '0') state = 3;
127                 else if (c == '1') state = 4;
128                 else if (isNonSeparator(c)) return false;
129             break;
130 
131             case 4:
132                 if      (c == '1') state = 5;
133                 else if (isNonSeparator(c)) return false;
134             break;
135 
136             case 1:
137             case 3:
138             case 5:
139                 if      (isISODigit(c)) state = 6;
140                 else if (isNonSeparator(c)) return false;
141             break;
142 
143             case 6:
144             case 7:
145                 if      (isISODigit(c)) state++;
146                 else if (isNonSeparator(c)) return false;
147             break;
148 
149             default:
150                 if (isNonSeparator(c)) return false;
151         }
152     }
153 
154     return state == 6 || state == 7 || state == 8;
155 }
156 
157 /**
158  * Compare phone numbers a and b, return true if they're identical
159  * enough for caller ID purposes.
160  *
161  * - Compares from right to left
162  * - requires minimum characters to match
163  * - handles common trunk prefixes and international prefixes
164  *   (basically, everything except the Russian trunk prefix)
165  *
166  * Tolerates nulls
167  */
phone_number_compare_loose_with_minmatch(const char * a,const char * b,int min_match)168 bool phone_number_compare_loose_with_minmatch(const char* a, const char* b, int min_match)
169 {
170     int ia, ib;
171     int matched;
172     int numSeparatorCharsInA = 0;
173     int numSeparatorCharsInB = 0;
174 
175     if (a == NULL || b == NULL) {
176         return false;
177     }
178 
179     ia = strlen(a);
180     ib = strlen(b);
181     if (ia == 0 || ib == 0) {
182         return false;
183     }
184 
185     // Compare from right to left
186     ia--;
187     ib--;
188 
189     matched = 0;
190 
191     while (ia >= 0 && ib >=0) {
192         char ca, cb;
193         bool skipCmp = false;
194 
195         ca = a[ia];
196 
197         if (!isNonSeparator(ca)) {
198             ia--;
199             skipCmp = true;
200             numSeparatorCharsInA++;
201         }
202 
203         cb = b[ib];
204 
205         if (!isNonSeparator(cb)) {
206             ib--;
207             skipCmp = true;
208             numSeparatorCharsInB++;
209         }
210 
211         if (!skipCmp) {
212             if (cb != ca) {
213                 break;
214             }
215             ia--; ib--; matched++;
216         }
217     }
218 
219     if (matched < min_match) {
220         const int effectiveALen = strlen(a) - numSeparatorCharsInA;
221         const int effectiveBLen = strlen(b) - numSeparatorCharsInB;
222 
223         // if the number of dialable chars in a and b match, but the matched chars < min_match,
224         // treat them as equal (i.e. 404-04 and 40404)
225         if (effectiveALen == effectiveBLen && effectiveALen == matched) {
226             return true;
227         }
228 
229         return false;
230     }
231 
232     // At least one string has matched completely;
233     if (matched >= min_match && (ia < 0 || ib < 0)) {
234         return true;
235     }
236 
237     /*
238      * Now, what remains must be one of the following for a
239      * match:
240      *
241      *  - a '+' on one and a '00' or a '011' on the other
242      *  - a '0' on one and a (+,00)<country code> on the other
243      *     (for this, a '0' and a '00' prefix would have succeeded above)
244      */
245 
246     if (matchIntlPrefix(a, ia + 1) && matchIntlPrefix(b, ib + 1)) {
247         return true;
248     }
249 
250     if (matchTrunkPrefix(a, ia + 1) && matchIntlPrefixAndCC(b, ib + 1)) {
251         return true;
252     }
253 
254     if (matchTrunkPrefix(b, ib + 1) && matchIntlPrefixAndCC(a, ia + 1)) {
255         return true;
256     }
257 
258     /*
259      * Last resort: if the number of unmatched characters on both sides is less than or equal
260      * to the length of the longest country code and only one number starts with a + accept
261      * the match. This is because some countries like France and Russia have an extra prefix
262      * digit that is used when dialing locally in country that does not show up when you dial
263      * the number using the country code. In France this prefix digit is used to determine
264      * which land line carrier to route the call over.
265      */
266     bool aPlusFirst = (*a == '+');
267     bool bPlusFirst = (*b == '+');
268     bool aIgnoreUnmatched = aPlusFirst && (ia - ib) >= 0 && (ia - ib) <= 1;
269     bool bIgnoreUnmatched = bPlusFirst && (ib - ia) >= 0 && (ib - ia) <= 1;
270     if (ia < 4 && ib < 4 && (aIgnoreUnmatched || bIgnoreUnmatched) && !(aPlusFirst && bPlusFirst)) {
271         return true;
272     }
273 
274     return false;
275 }
276 
phone_number_compare_loose(const char * a,const char * b)277 bool phone_number_compare_loose(const char* a, const char* b)
278 {
279     return phone_number_compare_loose_with_minmatch(a, b, MIN_MATCH);
280 }
281 
282 }  // namespace android
283