blob: baeb3fec838a5eb437b571db195516633f8cec97 [file] [log] [blame]
Daisuke Miyakawa948a1192009-09-19 19:19:53 -07001/*
2 *
3 * Copyright 2006, The Android Open Source Project
4 *
5 * Licensed under the Apache License, Version 2.0 (the "License");
6 * you may not use this file except in compliance with the License.
7 * You may obtain a copy of the License at
8 *
9 * http://www.apache.org/licenses/LICENSE-2.0
10 *
11 * Unless required by applicable law or agreed to in writing, software
12 * distributed under the License is distributed on an "AS IS" BASIS,
13 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14 * See the License for the specific language governing permissions and
15 * limitations under the License.
16 */
17
// Old implementation of phone_number_compare(). It was used in cupcake, was later replaced by
// the new, stricter version, and was then restored.
20
21#include <string.h>
22
23namespace android {
24
/**
 * Number of trailing non-separator characters that phone_number_compare_loose()
 * requires to agree before it applies its prefix rules. Declared const because
 * nothing in this file modifies it.
 */
static const int MIN_MATCH = 7;
Daisuke Miyakawa948a1192009-09-19 19:19:53 -070026
/** Returns true when c is one of the decimal digit characters '0' through '9'. */
static bool isISODigit(char c)
{
    if (c < '0') {
        return false;
    }
    return c <= '9';
}
32
/**
 * Returns true when c is a character that takes part in number comparison:
 * a digit '0'-'9', or one of '*', '#', '+'. Every other character is
 * treated as a separator by the callers in this file.
 */
static bool isNonSeparator(char c)
{
    switch (c) {
    case '*':
    case '#':
    case '+':
        return true;
    default:
        return '0' <= c && c <= '9';
    }
}
38
/*
 * Phone numbers are stored in "lookup" form in the database
 * as reversed strings to allow for caller ID lookup.
 *
 * NOTE: this comment originally described a method that takes a phone
 * number and makes a valid SQL "LIKE" string that will match the lookup
 * form. No such method is defined in this file; the text is kept for
 * context only.
 */
47/** all of a up to len must be an international prefix or
48 * separators/non-dialing digits
49 */
50static bool matchIntlPrefix(const char* a, int len)
51{
52 /* '([^0-9*#+]\+[^0-9*#+] | [^0-9*#+]0(0|11)[^0-9*#+] )$' */
53 /* 0 1 2 3 45 */
54
55 int state = 0;
56 for (int i = 0 ; i < len ; i++) {
57 char c = a[i];
58
59 switch (state) {
60 case 0:
61 if (c == '+') state = 1;
62 else if (c == '0') state = 2;
63 else if (isNonSeparator(c)) return false;
64 break;
65
66 case 2:
67 if (c == '0') state = 3;
68 else if (c == '1') state = 4;
69 else if (isNonSeparator(c)) return false;
70 break;
71
72 case 4:
73 if (c == '1') state = 5;
74 else if (isNonSeparator(c)) return false;
75 break;
76
77 default:
78 if (isNonSeparator(c)) return false;
79 break;
80
81 }
82 }
83
84 return state == 1 || state == 3 || state == 5;
85}
86
87/** all of 'a' up to len must match non-US trunk prefix ('0') */
88static bool matchTrunkPrefix(const char* a, int len)
89{
90 bool found;
91
92 found = false;
93
94 for (int i = 0 ; i < len ; i++) {
95 char c = a[i];
96
97 if (c == '0' && !found) {
98 found = true;
99 } else if (isNonSeparator(c)) {
100 return false;
101 }
102 }
103
104 return found;
105}
106
107/** all of 'a' up to len must be a (+|00|011)country code)
108 * We're fast and loose with the country code. Any \d{1,3} matches */
109static bool matchIntlPrefixAndCC(const char* a, int len)
110{
111 /* [^0-9*#+]*(\+|0(0|11)\d\d?\d? [^0-9*#+] $ */
112 /* 0 1 2 3 45 6 7 8 */
113
114 int state = 0;
115 for (int i = 0 ; i < len ; i++ ) {
116 char c = a[i];
117
118 switch (state) {
119 case 0:
120 if (c == '+') state = 1;
121 else if (c == '0') state = 2;
122 else if (isNonSeparator(c)) return false;
123 break;
124
125 case 2:
126 if (c == '0') state = 3;
127 else if (c == '1') state = 4;
128 else if (isNonSeparator(c)) return false;
129 break;
130
131 case 4:
132 if (c == '1') state = 5;
133 else if (isNonSeparator(c)) return false;
134 break;
135
136 case 1:
137 case 3:
138 case 5:
139 if (isISODigit(c)) state = 6;
140 else if (isNonSeparator(c)) return false;
141 break;
142
143 case 6:
144 case 7:
145 if (isISODigit(c)) state++;
146 else if (isNonSeparator(c)) return false;
147 break;
148
149 default:
150 if (isNonSeparator(c)) return false;
151 }
152 }
153
154 return state == 6 || state == 7 || state == 8;
155}
156
/**
 * Returns the smaller of the two arguments that are non-negative.
 * If only one argument is non-negative that one is returned; if both are
 * negative the result is -1. Zero counts as non-negative.
 */
static int minPositive(int a, int b)
{
    if (a < 0) {
        return (b < 0) ? -1 : b;
    }
    if (b < 0) {
        return a;
    }
    return (b < a) ? b : a;
}
170
/**
 * Return the offset into a of the first appearance of b, or -1 if there
 * is no such character in a.
 *
 * The search is done with strchr(), so the terminating NUL counts as part
 * of the string: indexOf(a, '\0') yields the length of a.
 *
 * @param a NUL-terminated string to search; must not be NULL
 * @param b character to look for
 * @return zero-based offset of the first match, or -1 when b is absent
 */
static int indexOf(const char *a, char b) {
    /* Keep the result const-qualified: a is const, and the C++ overload of
     * strchr() for a const argument returns a const pointer. */
    const char *ix = strchr(a, b);

    if (ix == NULL) {
        return -1;
    }
    return (int)(ix - a);
}
183
184/**
185 * Compare phone numbers a and b, return true if they're identical
186 * enough for caller ID purposes.
187 *
188 * - Compares from right to left
Wei Huang3fffdd32009-09-20 16:54:10 -0700189 * - requires MIN_MATCH (7) characters to match
Daisuke Miyakawa948a1192009-09-19 19:19:53 -0700190 * - handles common trunk prefixes and international prefixes
191 * (basically, everything except the Russian trunk prefix)
192 *
193 * Tolerates nulls
194 */
195bool phone_number_compare_loose(const char* a, const char* b)
196{
197 int ia, ib;
198 int matched;
199
200 if (a == NULL || b == NULL) {
201 return false;
202 }
203
204 ia = strlen(a);
205 ib = strlen(b);
206 if (ia == 0 || ib == 0) {
207 return false;
208 }
209
210 // Compare from right to left
211 ia--;
212 ib--;
213
214 matched = 0;
215
216 while (ia >= 0 && ib >=0) {
217 char ca, cb;
218 bool skipCmp = false;
219
220 ca = a[ia];
221
222 if (!isNonSeparator(ca)) {
223 ia--;
224 skipCmp = true;
225 }
226
227 cb = b[ib];
228
229 if (!isNonSeparator(cb)) {
230 ib--;
231 skipCmp = true;
232 }
233
234 if (!skipCmp) {
235 if (cb != ca) {
236 break;
237 }
238 ia--; ib--; matched++;
239 }
240 }
241
242 if (matched < MIN_MATCH) {
243 int aLen = strlen(a);
244
245 // if the input strings match, but their lengths < MIN_MATCH,
246 // treat them as equal.
247 if (aLen == (int)strlen(b) && aLen == matched) {
248 return true;
249 }
250 return false;
251 }
252
253 // At least one string has matched completely;
254 if (matched >= MIN_MATCH && (ia < 0 || ib < 0)) {
255 return true;
256 }
257
258 /*
259 * Now, what remains must be one of the following for a
260 * match:
261 *
262 * - a '+' on one and a '00' or a '011' on the other
263 * - a '0' on one and a (+,00)<country code> on the other
264 * (for this, a '0' and a '00' prefix would have succeeded above)
265 */
266
267 if (matchIntlPrefix(a, ia + 1) && matchIntlPrefix(b, ib +1)) {
268 return true;
269 }
270
271 if (matchTrunkPrefix(a, ia + 1) && matchIntlPrefixAndCC(b, ib +1)) {
272 return true;
273 }
274
275 if (matchTrunkPrefix(b, ib + 1) && matchIntlPrefixAndCC(a, ia +1)) {
276 return true;
277 }
278
279 /*
280 * Last resort: if the number of unmatched characters on both sides is less than or equal
281 * to the length of the longest country code and only one number starts with a + accept
282 * the match. This is because some countries like France and Russia have an extra prefix
283 * digit that is used when dialing locally in country that does not show up when you dial
284 * the number using the country code. In France this prefix digit is used to determine
285 * which land line carrier to route the call over.
286 */
287 bool aPlusFirst = (*a == '+');
288 bool bPlusFirst = (*b == '+');
289 if (ia < 4 && ib < 4 && (aPlusFirst || bPlusFirst) && !(aPlusFirst && bPlusFirst)) {
290 return true;
291 }
292
293 return false;
294}
295
296} // namespace android