| /* |
| * Copyright (C) 2009 Google Inc. |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| package com.google.i18n.phonenumbers; |
| |
| import com.google.i18n.phonenumbers.Phonemetadata.NumberFormat; |
| import com.google.i18n.phonenumbers.Phonemetadata.PhoneMetadata; |
| import com.google.i18n.phonenumbers.Phonemetadata.PhoneMetadataCollection; |
| import com.google.i18n.phonenumbers.Phonemetadata.PhoneNumberDesc; |
| import com.google.i18n.phonenumbers.Phonenumber.PhoneNumber; |
| import com.google.i18n.phonenumbers.Phonenumber.PhoneNumber.CountryCodeSource; |
| |
| import java.io.IOException; |
| import java.io.InputStream; |
| import java.io.ObjectInputStream; |
| import java.util.ArrayList; |
| import java.util.Arrays; |
| import java.util.Collections; |
| import java.util.HashMap; |
| import java.util.HashSet; |
| import java.util.Iterator; |
| import java.util.List; |
| import java.util.Map; |
| import java.util.Set; |
| import java.util.logging.Level; |
| import java.util.logging.Logger; |
| import java.util.regex.Matcher; |
| import java.util.regex.Pattern; |
| |
| /** |
| * Utility for international phone numbers. Functionality includes formatting, parsing and |
| * validation. |
| * |
| * <p>If you use this library, and want to be notified about important changes, please sign up to |
| * our <a href="http://groups.google.com/group/libphonenumber-discuss/about">mailing list</a>. |
| * |
| * NOTE: A lot of methods in this class require Region Code strings. These must be provided using |
| * ISO 3166-1 two-letter country-code format. These should be in upper-case. The list of the codes |
| * can be found here: http://www.iso.org/iso/english_country_names_and_code_elements |
| * |
| * @author Shaopeng Jia |
| * @author Lara Rennie |
| */ |
| public class PhoneNumberUtil { |
| /** Flags to use when compiling regular expressions for phone numbers. */ |
| static final int REGEX_FLAGS = Pattern.UNICODE_CASE | Pattern.CASE_INSENSITIVE; |
| // The minimum and maximum length of the national significant number. |
| private static final int MIN_LENGTH_FOR_NSN = 3; |
| static final int MAX_LENGTH_FOR_NSN = 15; |
| // The maximum length of the country calling code. |
| static final int MAX_LENGTH_COUNTRY_CODE = 3; |
| static final String META_DATA_FILE_PREFIX = |
| "/com/google/i18n/phonenumbers/data/PhoneNumberMetadataProto"; |
| private String currentFilePrefix = META_DATA_FILE_PREFIX; |
| private static final Logger LOGGER = Logger.getLogger(PhoneNumberUtil.class.getName()); |
| |
| // A mapping from a country calling code to the region codes which denote the region represented |
| // by that country calling code. In the case of multiple regions sharing a calling code, such as |
| // the NANPA regions, the one indicated with "isMainCountryForCode" in the metadata should be |
| // first. |
| private Map<Integer, List<String>> countryCallingCodeToRegionCodeMap = null; |
| |
| // The set of regions the library supports. |
| // There are roughly 220 of them and we set the initial capacity of the HashSet to 300 to offer a |
| // load factor of roughly 0.75. |
| private final Set<String> supportedRegions = new HashSet<String>(300); |
| |
| // Region-code for the unknown region. |
| private static final String UNKNOWN_REGION = "ZZ"; |
| |
| // The set of regions that share country calling code 1. |
| // There are roughly 26 regions and we set the initial capacity of the HashSet to 35 to offer a |
| // load factor of roughly 0.75. |
| private final Set<String> nanpaRegions = new HashSet<String>(35); |
| private static final int NANPA_COUNTRY_CODE = 1; |
| |
| // The PLUS_SIGN signifies the international prefix. |
| static final char PLUS_SIGN = '+'; |
| |
| private static final String RFC3966_EXTN_PREFIX = ";ext="; |
| |
| // Only upper-case variants of alpha characters are stored. |
| private static final Map<Character, Character> ALPHA_MAPPINGS; |
| |
| // For performance reasons, amalgamate both into one map. |
| private static final Map<Character, Character> ALPHA_PHONE_MAPPINGS; |
| |
| // Separate map of all symbols that we wish to retain when formatting alpha numbers. This |
| // includes digits, ASCII letters and number grouping symbols such as "-" and " ". |
| private static final Map<Character, Character> ALL_PLUS_NUMBER_GROUPING_SYMBOLS; |
| |
| static { |
| // Simple ASCII digits map used to populate ALPHA_PHONE_MAPPINGS and |
| // ALL_PLUS_NUMBER_GROUPING_SYMBOLS. |
| HashMap<Character, Character> asciiDigitMappings = new HashMap<Character, Character>(); |
| asciiDigitMappings.put('0', '0'); |
| asciiDigitMappings.put('1', '1'); |
| asciiDigitMappings.put('2', '2'); |
| asciiDigitMappings.put('3', '3'); |
| asciiDigitMappings.put('4', '4'); |
| asciiDigitMappings.put('5', '5'); |
| asciiDigitMappings.put('6', '6'); |
| asciiDigitMappings.put('7', '7'); |
| asciiDigitMappings.put('8', '8'); |
| asciiDigitMappings.put('9', '9'); |
| |
| HashMap<Character, Character> alphaMap = new HashMap<Character, Character>(40); |
| alphaMap.put('A', '2'); |
| alphaMap.put('B', '2'); |
| alphaMap.put('C', '2'); |
| alphaMap.put('D', '3'); |
| alphaMap.put('E', '3'); |
| alphaMap.put('F', '3'); |
| alphaMap.put('G', '4'); |
| alphaMap.put('H', '4'); |
| alphaMap.put('I', '4'); |
| alphaMap.put('J', '5'); |
| alphaMap.put('K', '5'); |
| alphaMap.put('L', '5'); |
| alphaMap.put('M', '6'); |
| alphaMap.put('N', '6'); |
| alphaMap.put('O', '6'); |
| alphaMap.put('P', '7'); |
| alphaMap.put('Q', '7'); |
| alphaMap.put('R', '7'); |
| alphaMap.put('S', '7'); |
| alphaMap.put('T', '8'); |
| alphaMap.put('U', '8'); |
| alphaMap.put('V', '8'); |
| alphaMap.put('W', '9'); |
| alphaMap.put('X', '9'); |
| alphaMap.put('Y', '9'); |
| alphaMap.put('Z', '9'); |
| ALPHA_MAPPINGS = Collections.unmodifiableMap(alphaMap); |
| |
| HashMap<Character, Character> combinedMap = new HashMap<Character, Character>(100); |
| combinedMap.putAll(ALPHA_MAPPINGS); |
| combinedMap.putAll(asciiDigitMappings); |
| ALPHA_PHONE_MAPPINGS = Collections.unmodifiableMap(combinedMap); |
| |
| HashMap<Character, Character> allPlusNumberGroupings = new HashMap<Character, Character>(); |
| // Put (lower letter -> upper letter) and (upper letter -> upper letter) mappings. |
| for (char c : ALPHA_MAPPINGS.keySet()) { |
| allPlusNumberGroupings.put(Character.toLowerCase(c), c); |
| allPlusNumberGroupings.put(c, c); |
| } |
| allPlusNumberGroupings.putAll(asciiDigitMappings); |
| // Put grouping symbols. |
| allPlusNumberGroupings.put('-', '-'); |
| allPlusNumberGroupings.put('\uFF0D', '-'); |
| allPlusNumberGroupings.put('\u2010', '-'); |
| allPlusNumberGroupings.put('\u2011', '-'); |
| allPlusNumberGroupings.put('\u2012', '-'); |
| allPlusNumberGroupings.put('\u2013', '-'); |
| allPlusNumberGroupings.put('\u2014', '-'); |
| allPlusNumberGroupings.put('\u2015', '-'); |
| allPlusNumberGroupings.put('\u2212', '-'); |
| allPlusNumberGroupings.put('/', '/'); |
| allPlusNumberGroupings.put('\uFF0F', '/'); |
| allPlusNumberGroupings.put(' ', ' '); |
| allPlusNumberGroupings.put('\u3000', ' '); |
| allPlusNumberGroupings.put('\u2060', ' '); |
| allPlusNumberGroupings.put('.', '.'); |
| allPlusNumberGroupings.put('\uFF0E', '.'); |
| ALL_PLUS_NUMBER_GROUPING_SYMBOLS = Collections.unmodifiableMap(allPlusNumberGroupings); |
| } |
| |
| // Pattern that makes it easy to distinguish whether a region has a unique international dialing |
| // prefix or not. If a region has a unique international prefix (e.g. 011 in USA), it will be |
| // represented as a string that contains a sequence of ASCII digits. If there are multiple |
| // available international prefixes in a region, they will be represented as a regex string that |
| // always contains character(s) other than ASCII digits. |
| // Note this regex also includes tilde, which signals waiting for the tone. |
| private static final Pattern UNIQUE_INTERNATIONAL_PREFIX = |
| Pattern.compile("[\\d]+(?:[~\u2053\u223C\uFF5E][\\d]+)?"); |
| |
| // Regular expression of acceptable punctuation found in phone numbers. This excludes punctuation |
| // found as a leading character only. |
| // This consists of dash characters, white space characters, full stops, slashes, |
| // square brackets, parentheses and tildes. It also includes the letter 'x' as that is found as a |
| // placeholder for carrier information in some phone numbers. Full-width variants are also |
| // present. |
| static final String VALID_PUNCTUATION = "-x\u2010-\u2015\u2212\u30FC\uFF0D-\uFF0F " + |
| "\u00A0\u200B\u2060\u3000()\uFF08\uFF09\uFF3B\uFF3D.\\[\\]/~\u2053\u223C\uFF5E"; |
| |
| private static final String DIGITS = "\\p{Nd}"; |
| // We accept alpha characters in phone numbers, ASCII only, upper and lower case. |
| private static final String VALID_ALPHA = |
| Arrays.toString(ALPHA_MAPPINGS.keySet().toArray()).replaceAll("[, \\[\\]]", "") + |
| Arrays.toString(ALPHA_MAPPINGS.keySet().toArray()).toLowerCase().replaceAll("[, \\[\\]]", ""); |
| static final String PLUS_CHARS = "+\uFF0B"; |
| static final Pattern PLUS_CHARS_PATTERN = Pattern.compile("[" + PLUS_CHARS + "]+"); |
| private static final Pattern SEPARATOR_PATTERN = Pattern.compile("[" + VALID_PUNCTUATION + "]+"); |
| private static final Pattern CAPTURING_DIGIT_PATTERN = Pattern.compile("(" + DIGITS + ")"); |
| |
| // Regular expression of acceptable characters that may start a phone number for the purposes of |
| // parsing. This allows us to strip away meaningless prefixes to phone numbers that may be |
| // mistakenly given to us. This consists of digits, the plus symbol and arabic-indic digits. This |
| // does not contain alpha characters, although they may be used later in the number. It also does |
| // not include other punctuation, as this will be stripped later during parsing and is of no |
| // information value when parsing a number. |
| private static final String VALID_START_CHAR = "[" + PLUS_CHARS + DIGITS + "]"; |
| private static final Pattern VALID_START_CHAR_PATTERN = Pattern.compile(VALID_START_CHAR); |
| |
| // Regular expression of characters typically used to start a second phone number for the purposes |
| // of parsing. This allows us to strip off parts of the number that are actually the start of |
| // another number, such as for: (530) 583-6985 x302/x2303 -> the second extension here makes this |
| // actually two phone numbers, (530) 583-6985 x302 and (530) 583-6985 x2303. We remove the second |
| // extension so that the first number is parsed correctly. |
| private static final String SECOND_NUMBER_START = "[\\\\/] *x"; |
| static final Pattern SECOND_NUMBER_START_PATTERN = Pattern.compile(SECOND_NUMBER_START); |
| |
| // Regular expression of trailing characters that we want to remove. We remove all characters that |
| // are not alpha or numerical characters. The hash character is retained here, as it may signify |
| // the previous block was an extension. |
| private static final String UNWANTED_END_CHARS = "[[\\P{N}&&\\P{L}]&&[^#]]+$"; |
| static final Pattern UNWANTED_END_CHAR_PATTERN = Pattern.compile(UNWANTED_END_CHARS); |
| |
| // We use this pattern to check if the phone number has at least three letters in it - if so, then |
| // we treat it as a number where some phone-number digits are represented by letters. |
| private static final Pattern VALID_ALPHA_PHONE_PATTERN = Pattern.compile("(?:.*?[A-Za-z]){3}.*"); |
| |
| // Regular expression of viable phone numbers. This is location independent. Checks we have at |
| // least three leading digits, and only valid punctuation, alpha characters and |
| // digits in the phone number. Does not include extension data. |
| // The symbol 'x' is allowed here as valid punctuation since it is often used as a placeholder for |
| // carrier codes, for example in Brazilian phone numbers. We also allow multiple "+" characters at |
| // the start. |
| // Corresponds to the following: |
| // plus_sign*([punctuation]*[digits]){3,}([punctuation]|[digits]|[alpha])* |
| // Note VALID_PUNCTUATION starts with a -, so must be the first in the range. |
| private static final String VALID_PHONE_NUMBER = |
| "[" + PLUS_CHARS + "]*(?:[" + VALID_PUNCTUATION + "]*" + DIGITS + "){3,}[" + |
| VALID_PUNCTUATION + VALID_ALPHA + DIGITS + "]*"; |
| |
| // Default extension prefix to use when formatting. This will be put in front of any extension |
| // component of the number, after the main national number is formatted. For example, if you wish |
| // the default extension formatting to be " extn: 3456", then you should specify " extn: " here |
| // as the default extension prefix. This can be overridden by region-specific preferences. |
| private static final String DEFAULT_EXTN_PREFIX = " ext. "; |
| |
| // Regexp of all possible ways to write extensions, for use when parsing. This will be run as a |
| // case-insensitive regexp match. Wide character versions are also provided after each ASCII |
| // version. There are three regular expressions here. The first covers RFC 3966 format, where the |
| // extension is added using ";ext=". The second more generic one starts with optional white space |
| // and ends with an optional full stop (.), followed by zero or more spaces/tabs and then the |
| // numbers themselves. The other one covers the special case of American numbers where the |
| // extension is written with a hash at the end, such as "- 503#". |
| // Note that the only capturing groups should be around the digits that you want to capture as |
| // part of the extension, or else parsing will fail! |
| // Canonical-equivalence doesn't seem to be an option with Android java, so we allow two options |
| // for representing the accented o - the character itself, and one in the unicode decomposed form |
| // with the combining acute accent. |
| private static final String CAPTURING_EXTN_DIGITS = "(" + DIGITS + "{1,7})"; |
| static final String KNOWN_EXTN_PATTERNS = |
| RFC3966_EXTN_PREFIX + CAPTURING_EXTN_DIGITS + "|" + |
| "[ \u00A0\\t,]*(?:ext(?:ensi(?:o\u0301?|\u00F3))?n?|" + |
| "\uFF45\uFF58\uFF54\uFF4E?|[,x\uFF58#\uFF03~\uFF5E]|int|anexo|\uFF49\uFF4E\uFF54)" + |
| "[:\\.\uFF0E]?[ \u00A0\\t,-]*" + CAPTURING_EXTN_DIGITS + "#?|" + |
| "[- ]+(" + DIGITS + "{1,5})#"; |
| |
| // Regexp of all known extension prefixes used by different regions followed by 1 or more valid |
| // digits, for use when parsing. |
| private static final Pattern EXTN_PATTERN = |
| Pattern.compile("(?:" + KNOWN_EXTN_PATTERNS + ")$", REGEX_FLAGS); |
| |
| // We append optionally the extension pattern to the end here, as a valid phone number may |
| // have an extension prefix appended, followed by 1 or more digits. |
| private static final Pattern VALID_PHONE_NUMBER_PATTERN = |
| Pattern.compile(VALID_PHONE_NUMBER + "(?:" + KNOWN_EXTN_PATTERNS + ")?", REGEX_FLAGS); |
| |
| private static final Pattern NON_DIGITS_PATTERN = Pattern.compile("(\\D+)"); |
| |
| // The FIRST_GROUP_PATTERN was originally set to $1 but there are some countries for which the |
| // first group is not used in the national pattern (e.g. Argentina) so the $1 group does not match |
| // correctly. Therefore, we use \d, so that the first group actually used in the pattern will be |
| // matched. |
| private static final Pattern FIRST_GROUP_PATTERN = Pattern.compile("(\\$\\d)"); |
| private static final Pattern NP_PATTERN = Pattern.compile("\\$NP"); |
| private static final Pattern FG_PATTERN = Pattern.compile("\\$FG"); |
| private static final Pattern CC_PATTERN = Pattern.compile("\\$CC"); |
| |
| private static PhoneNumberUtil instance = null; |
| |
| // A mapping from a region code to the PhoneMetadata for that region. |
| private Map<String, PhoneMetadata> regionToMetadataMap = new HashMap<String, PhoneMetadata>(); |
| |
| // A cache for frequently used region-specific regular expressions. |
| // As most people use phone numbers primarily from one to two countries, and there are roughly 60 |
| // regular expressions needed, the initial capacity of 100 offers a rough load factor of 0.75. |
| private RegexCache regexCache = new RegexCache(100); |
| |
| /** |
| * INTERNATIONAL and NATIONAL formats are consistent with the definition in ITU-T Recommendation |
| * E123. For example, the number of the Google Switzerland office will be written as |
| * "+41 44 668 1800" in INTERNATIONAL format, and as "044 668 1800" in NATIONAL format. |
| * E164 format is as per INTERNATIONAL format but with no formatting applied, e.g. +41446681800. |
| * RFC3966 is as per INTERNATIONAL format, but with all spaces and other separating symbols |
| * replaced with a hyphen, and with any phone number extension appended with ";ext=". |
| * |
| * Note: If you are considering storing the number in a neutral format, you are highly advised to |
| * use the PhoneNumber class. |
| */ |
| public enum PhoneNumberFormat { |
| E164, |
| INTERNATIONAL, |
| NATIONAL, |
| RFC3966 |
| } |
| |
| /** |
| * Type of phone numbers. |
| */ |
| public enum PhoneNumberType { |
| FIXED_LINE, |
| MOBILE, |
| // In some regions (e.g. the USA), it is impossible to distinguish between fixed-line and |
| // mobile numbers by looking at the phone number itself. |
| FIXED_LINE_OR_MOBILE, |
| // Freephone lines |
| TOLL_FREE, |
| PREMIUM_RATE, |
| // The cost of this call is shared between the caller and the recipient, and is hence typically |
| // less than PREMIUM_RATE calls. See // http://en.wikipedia.org/wiki/Shared_Cost_Service for |
| // more information. |
| SHARED_COST, |
| // Voice over IP numbers. This includes TSoIP (Telephony Service over IP). |
| VOIP, |
| // A personal number is associated with a particular person, and may be routed to either a |
| // MOBILE or FIXED_LINE number. Some more information can be found here: |
| // http://en.wikipedia.org/wiki/Personal_Numbers |
| PERSONAL_NUMBER, |
| PAGER, |
| // Used for "Universal Access Numbers" or "Company Numbers". They may be further routed to |
| // specific offices, but allow one number to be used for a company. |
| UAN, |
| // A phone number is of type UNKNOWN when it does not fit any of the known patterns for a |
| // specific region. |
| UNKNOWN |
| } |
| |
| /** |
| * Types of phone number matches. See detailed description beside the isNumberMatch() method. |
| */ |
| public enum MatchType { |
| NOT_A_NUMBER, |
| NO_MATCH, |
| SHORT_NSN_MATCH, |
| NSN_MATCH, |
| EXACT_MATCH, |
| } |
| |
| /** |
| * Possible outcomes when testing if a PhoneNumber is possible. |
| */ |
| public enum ValidationResult { |
| IS_POSSIBLE, |
| INVALID_COUNTRY_CODE, |
| TOO_SHORT, |
| TOO_LONG, |
| } |
| |
| /** |
| * Leniency when {@linkplain PhoneNumberUtil#findNumbers finding} potential phone numbers in text |
| * segments. |
| */ |
| public enum Leniency { |
| /** |
| * Phone numbers accepted are {@linkplain PhoneNumberUtil#isPossibleNumber(PhoneNumber) |
| * possible}, but not necessarily {@linkplain PhoneNumberUtil#isValidNumber(PhoneNumber) valid}. |
| */ |
| POSSIBLE { |
| @Override |
| boolean verify(PhoneNumber number, PhoneNumberUtil util) { |
| return util.isPossibleNumber(number); |
| } |
| }, |
| /** |
| * Phone numbers accepted are {@linkplain PhoneNumberUtil#isPossibleNumber(PhoneNumber) |
| * possible} and {@linkplain PhoneNumberUtil#isValidNumber(PhoneNumber) valid}. |
| */ |
| VALID { |
| @Override |
| boolean verify(PhoneNumber number, PhoneNumberUtil util) { |
| return util.isValidNumber(number); |
| } |
| }; |
| |
| /** Returns true if {@code number} is a verified number according to this leniency. */ |
| abstract boolean verify(PhoneNumber number, PhoneNumberUtil util); |
| } |
| |
| /** |
| * This class implements a singleton, so the only constructor is private. |
| */ |
| private PhoneNumberUtil() { |
| } |
| |
| private void init(String filePrefix) { |
| currentFilePrefix = filePrefix; |
| for (List<String> regionCodes : countryCallingCodeToRegionCodeMap.values()) { |
| supportedRegions.addAll(regionCodes); |
| } |
| nanpaRegions.addAll(countryCallingCodeToRegionCodeMap.get(NANPA_COUNTRY_CODE)); |
| } |
| |
| private void loadMetadataForRegionFromFile(String filePrefix, String regionCode) { |
| InputStream source = |
| PhoneNumberUtil.class.getResourceAsStream(filePrefix + "_" + regionCode); |
| ObjectInputStream in; |
| try { |
| in = new ObjectInputStream(source); |
| PhoneMetadataCollection metadataCollection = new PhoneMetadataCollection(); |
| metadataCollection.readExternal(in); |
| for (PhoneMetadata metadata : metadataCollection.getMetadataList()) { |
| regionToMetadataMap.put(regionCode, metadata); |
| } |
| } catch (IOException e) { |
| LOGGER.log(Level.WARNING, e.toString()); |
| } |
| } |
| |
| /** |
| * Attempts to extract a possible number from the string passed in. This currently strips all |
| * leading characters that cannot be used to start a phone number. Characters that can be used to |
| * start a phone number are defined in the VALID_START_CHAR_PATTERN. If none of these characters |
| * are found in the number passed in, an empty string is returned. This function also attempts to |
| * strip off any alternative extensions or endings if two or more are present, such as in the case |
| * of: (530) 583-6985 x302/x2303. The second extension here makes this actually two phone numbers, |
| * (530) 583-6985 x302 and (530) 583-6985 x2303. We remove the second extension so that the first |
| * number is parsed correctly. |
| * |
| * @param number the string that might contain a phone number |
| * @return the number, stripped of any non-phone-number prefix (such as "Tel:") or an empty |
| * string if no character used to start phone numbers (such as + or any digit) is |
| * found in the number |
| */ |
| static String extractPossibleNumber(String number) { |
| Matcher m = VALID_START_CHAR_PATTERN.matcher(number); |
| if (m.find()) { |
| number = number.substring(m.start()); |
| // Remove trailing non-alpha non-numerical characters. |
| Matcher trailingCharsMatcher = UNWANTED_END_CHAR_PATTERN.matcher(number); |
| if (trailingCharsMatcher.find()) { |
| number = number.substring(0, trailingCharsMatcher.start()); |
| LOGGER.log(Level.FINER, "Stripped trailing characters: " + number); |
| } |
| // Check for extra numbers at the end. |
| Matcher secondNumber = SECOND_NUMBER_START_PATTERN.matcher(number); |
| if (secondNumber.find()) { |
| number = number.substring(0, secondNumber.start()); |
| } |
| return number; |
| } else { |
| return ""; |
| } |
| } |
| |
| /** |
| * Checks to see if the string of characters could possibly be a phone number at all. At the |
| * moment, checks to see that the string begins with at least 3 digits, ignoring any punctuation |
| * commonly found in phone numbers. |
| * This method does not require the number to be normalized in advance - but does assume that |
| * leading non-number symbols have been removed, such as by the method extractPossibleNumber. |
| * |
| * @param number string to be checked for viability as a phone number |
| * @return true if the number could be a phone number of some sort, otherwise false |
| */ |
| static boolean isViablePhoneNumber(String number) { |
| if (number.length() < MIN_LENGTH_FOR_NSN) { |
| return false; |
| } |
| Matcher m = VALID_PHONE_NUMBER_PATTERN.matcher(number); |
| return m.matches(); |
| } |
| |
| /** |
| * Normalizes a string of characters representing a phone number. This performs the following |
| * conversions: |
| * Punctuation is stripped. |
| * For ALPHA/VANITY numbers: |
| * Letters are converted to their numeric representation on a telephone keypad. The keypad |
| * used here is the one defined in ITU Recommendation E.161. This is only done if there are |
| * 3 or more letters in the number, to lessen the risk that such letters are typos. |
| * For other numbers: |
| * Wide-ascii digits are converted to normal ASCII (European) digits. |
| * Arabic-Indic numerals are converted to European numerals. |
| * Spurious alpha characters are stripped. |
| * |
| * @param number a string of characters representing a phone number |
| * @return the normalized string version of the phone number |
| */ |
| static String normalize(String number) { |
| Matcher m = VALID_ALPHA_PHONE_PATTERN.matcher(number); |
| if (m.matches()) { |
| return normalizeHelper(number, ALPHA_PHONE_MAPPINGS, true); |
| } else { |
| return normalizeDigitsOnly(number); |
| } |
| } |
| |
| /** |
| * Normalizes a string of characters representing a phone number. This is a wrapper for |
| * normalize(String number) but does in-place normalization of the StringBuilder provided. |
| * |
| * @param number a StringBuilder of characters representing a phone number that will be |
| * normalized in place |
| */ |
| static void normalize(StringBuilder number) { |
| String normalizedNumber = normalize(number.toString()); |
| number.replace(0, number.length(), normalizedNumber); |
| } |
| |
| /** |
| * Normalizes a string of characters representing a phone number. This converts wide-ascii and |
| * arabic-indic numerals to European numerals, and strips punctuation and alpha characters. |
| * |
| * @param number a string of characters representing a phone number |
| * @return the normalized string version of the phone number |
| */ |
| public static String normalizeDigitsOnly(String number) { |
| int numberLength = number.length(); |
| StringBuilder normalizedDigits = new StringBuilder(numberLength); |
| for (int i = 0; i < numberLength; i++) { |
| int d = Character.digit(number.charAt(i), 10); |
| if (d != -1) { |
| normalizedDigits.append(d); |
| } |
| } |
| return normalizedDigits.toString(); |
| } |
| |
| /** |
| * Converts all alpha characters in a number to their respective digits on a keypad, but retains |
| * existing formatting. |
| */ |
| public static String convertAlphaCharactersInNumber(String number) { |
| return normalizeHelper(number, ALPHA_PHONE_MAPPINGS, false); |
| } |
| |
| /** |
| * Gets the length of the geographical area code in the {@code nationalNumber_} field of the |
| * PhoneNumber object passed in, so that clients could use it to split a national significant |
| * number into geographical area code and subscriber number. It works in such a way that the |
| * resultant subscriber number should be diallable, at least on some devices. An example of how |
| * this could be used: |
| * |
| * <pre> |
| * PhoneNumberUtil phoneUtil = PhoneNumberUtil.getInstance(); |
| * PhoneNumber number = phoneUtil.parse("16502530000", "US"); |
| * String nationalSignificantNumber = phoneUtil.getNationalSignificantNumber(number); |
| * String areaCode; |
| * String subscriberNumber; |
| * |
| * int areaCodeLength = phoneUtil.getLengthOfGeographicalAreaCode(number); |
| * if (areaCodeLength > 0) { |
| * areaCode = nationalSignificantNumber.substring(0, areaCodeLength); |
| * subscriberNumber = nationalSignificantNumber.substring(areaCodeLength); |
| * } else { |
| * areaCode = ""; |
| * subscriberNumber = nationalSignificantNumber; |
| * } |
| * </pre> |
| * |
| * N.B.: area code is a very ambiguous concept, so the I18N team generally recommends against |
| * using it for most purposes, but recommends using the more general {@code national_number} |
| * instead. Read the following carefully before deciding to use this method: |
| * <ul> |
| * <li> geographical area codes change over time, and this method honors those changes; |
| * therefore, it doesn't guarantee the stability of the result it produces. |
| * <li> subscriber numbers may not be diallable from all devices (notably mobile devices, which |
| * typically requires the full national_number to be dialled in most regions). |
| * <li> most non-geographical numbers have no area codes. |
| * <li> some geographical numbers have no area codes. |
| * </ul> |
| * @param number the PhoneNumber object for which clients want to know the length of the area |
| * code. |
| * @return the length of area code of the PhoneNumber object passed in. |
| */ |
| public int getLengthOfGeographicalAreaCode(PhoneNumber number) { |
| String regionCode = getRegionCodeForNumber(number); |
| if (!isValidRegionCode(regionCode)) { |
| return 0; |
| } |
| PhoneMetadata metadata = getMetadataForRegion(regionCode); |
| if (!metadata.hasNationalPrefix()) { |
| return 0; |
| } |
| |
| PhoneNumberType type = getNumberTypeHelper(getNationalSignificantNumber(number), |
| metadata); |
| // Most numbers other than the two types below have to be dialled in full. |
| if (type != PhoneNumberType.FIXED_LINE && type != PhoneNumberType.FIXED_LINE_OR_MOBILE) { |
| return 0; |
| } |
| |
| return getLengthOfNationalDestinationCode(number); |
| } |
| |
| /** |
| * Gets the length of the national destination code (NDC) from the PhoneNumber object passed in, |
| * so that clients could use it to split a national significant number into NDC and subscriber |
| * number. The NDC of a phone number is normally the first group of digit(s) right after the |
| * country calling code when the number is formatted in the international format, if there is a |
| * subscriber number part that follows. An example of how this could be used: |
| * |
| * <pre> |
| * PhoneNumberUtil phoneUtil = PhoneNumberUtil.getInstance(); |
| * PhoneNumber number = phoneUtil.parse("18002530000", "US"); |
| * String nationalSignificantNumber = phoneUtil.getNationalSignificantNumber(number); |
| * String nationalDestinationCode; |
| * String subscriberNumber; |
| * |
| * int nationalDestinationCodeLength = phoneUtil.getLengthOfNationalDestinationCode(number); |
| * if (nationalDestinationCodeLength > 0) { |
| * nationalDestinationCode = nationalSignificantNumber.substring(0, |
| * nationalDestinationCodeLength); |
| * subscriberNumber = nationalSignificantNumber.substring(nationalDestinationCodeLength); |
| * } else { |
| * nationalDestinationCode = ""; |
| * subscriberNumber = nationalSignificantNumber; |
| * } |
| * </pre> |
| * |
| * Refer to the unittests to see the difference between this function and |
| * {@link #getLengthOfGeographicalAreaCode}. |
| * |
| * @param number the PhoneNumber object for which clients want to know the length of the NDC. |
| * @return the length of NDC of the PhoneNumber object passed in. |
| */ |
| public int getLengthOfNationalDestinationCode(PhoneNumber number) { |
| PhoneNumber copiedProto; |
| if (number.hasExtension()) { |
| // We don't want to alter the proto given to us, but we don't want to include the extension |
| // when we format it, so we copy it and clear the extension here. |
| copiedProto = new PhoneNumber(); |
| copiedProto.mergeFrom(number); |
| copiedProto.clearExtension(); |
| } else { |
| copiedProto = number; |
| } |
| |
| String nationalSignificantNumber = format(copiedProto, |
| PhoneNumberUtil.PhoneNumberFormat.INTERNATIONAL); |
| String[] numberGroups = NON_DIGITS_PATTERN.split(nationalSignificantNumber); |
| // The pattern will start with "+COUNTRY_CODE " so the first group will always be the empty |
| // string (before the + symbol) and the second group will be the country calling code. The third |
| // group will be area code if it is not the last group. |
| if (numberGroups.length <= 3) { |
| return 0; |
| } |
| |
| if (getRegionCodeForNumber(number).equals("AR") && |
| getNumberType(number) == PhoneNumberType.MOBILE) { |
| // Argentinian mobile numbers, when formatted in the international format, are in the form of |
| // +54 9 NDC XXXX.... As a result, we take the length of the third group (NDC) and add 1 for |
| // the digit 9, which also forms part of the national significant number. |
| // |
| // TODO: Investigate the possibility of better modeling the metadata to make it |
| // easier to obtain the NDC. |
| return numberGroups[3].length() + 1; |
| } |
| return numberGroups[2].length(); |
| } |
| |
| /** |
| * Normalizes a string of characters representing a phone number by replacing all characters found |
| * in the accompanying map with the values therein, and stripping all other characters if |
| * removeNonMatches is true. |
| * |
| * @param number a string of characters representing a phone number |
| * @param normalizationReplacements a mapping of characters to what they should be replaced by in |
| * the normalized version of the phone number |
| * @param removeNonMatches indicates whether characters that are not able to be replaced |
| * should be stripped from the number. If this is false, they |
| * will be left unchanged in the number. |
| * @return the normalized string version of the phone number |
| */ |
| private static String normalizeHelper(String number, |
| Map<Character, Character> normalizationReplacements, |
| boolean removeNonMatches) { |
| StringBuilder normalizedNumber = new StringBuilder(number.length()); |
| char[] numberAsCharArray = number.toCharArray(); |
| for (char character : numberAsCharArray) { |
| Character newDigit = normalizationReplacements.get(Character.toUpperCase(character)); |
| if (newDigit != null) { |
| normalizedNumber.append(newDigit); |
| } else if (!removeNonMatches) { |
| normalizedNumber.append(character); |
| } |
| // If neither of the above are true, we remove this character. |
| } |
| return normalizedNumber.toString(); |
| } |
| |
| static synchronized PhoneNumberUtil getInstance( |
| String baseFileLocation, |
| Map<Integer, List<String>> countryCallingCodeToRegionCodeMap) { |
| if (instance == null) { |
| instance = new PhoneNumberUtil(); |
| instance.countryCallingCodeToRegionCodeMap = countryCallingCodeToRegionCodeMap; |
| instance.init(baseFileLocation); |
| } |
| return instance; |
| } |
| |
| /** |
| * Used for testing purposes only to reset the PhoneNumberUtil singleton to null. |
| */ |
| static synchronized void resetInstance() { |
| instance = null; |
| } |
| |
| /** |
| * Convenience method to enable tests to get a list of what regions the library has metadata for. |
| */ |
| public Set<String> getSupportedRegions() { |
| return supportedRegions; |
| } |
| |
| /** |
| * Gets a {@link PhoneNumberUtil} instance to carry out international phone number formatting, |
| * parsing, or validation. The instance is loaded with phone number metadata for a number of most |
| * commonly used regions. |
| * |
| * <p>The {@link PhoneNumberUtil} is implemented as a singleton. Therefore, calling getInstance |
| * multiple times will only result in one instance being created. |
| * |
| * @return a PhoneNumberUtil instance |
| */ |
| public static synchronized PhoneNumberUtil getInstance() { |
| if (instance == null) { |
| return getInstance(META_DATA_FILE_PREFIX, |
| CountryCodeToRegionCodeMap.getCountryCodeToRegionCodeMap()); |
| } |
| return instance; |
| } |
| |
| /** |
| * Helper function to check region code is not unknown or null. |
| */ |
| private boolean isValidRegionCode(String regionCode) { |
| return regionCode != null && supportedRegions.contains(regionCode); |
| } |
| |
| /** |
| * Helper function to check region code is not unknown or null and log an error message. The |
| * {@code countryCallingCode} and {@code number} supplied is used only for the resultant log |
| * message. |
| */ |
| private boolean hasValidRegionCode(String regionCode, |
| int countryCallingCode, String number) { |
| if (!isValidRegionCode(regionCode)) { |
| LOGGER.log(Level.WARNING, |
| "Number " + number + " has invalid or missing country calling code (" |
| + countryCallingCode + ")"); |
| return false; |
| } |
| return true; |
| } |
| |
| /** |
| * Formats a phone number in the specified format using default rules. Note that this does not |
| * promise to produce a phone number that the user can dial from where they are - although we do |
| * format in either 'national' or 'international' format depending on what the client asks for, we |
| * do not currently support a more abbreviated format, such as for users in the same "area" who |
| * could potentially dial the number without area code. Note that if the phone number has a |
| * country calling code of 0 or an otherwise invalid country calling code, we cannot work out |
| * which formatting rules to apply so we return the national significant number with no formatting |
| * applied. |
| * |
| * @param number the phone number to be formatted |
| * @param numberFormat the format the phone number should be formatted into |
| * @return the formatted phone number |
| */ |
| public String format(PhoneNumber number, PhoneNumberFormat numberFormat) { |
| StringBuilder formattedNumber = new StringBuilder(20); |
| format(number, numberFormat, formattedNumber); |
| return formattedNumber.toString(); |
| } |
| |
| /** |
| * Same as {@link #format(PhoneNumber, PhoneNumberFormat)}, but accepts a mutable StringBuilder as |
| * a parameter to decrease object creation when invoked many times. |
| */ |
| public void format(PhoneNumber number, PhoneNumberFormat numberFormat, |
| StringBuilder formattedNumber) { |
| // Clear the StringBuilder first. |
| formattedNumber.setLength(0); |
| int countryCallingCode = number.getCountryCode(); |
| String nationalSignificantNumber = getNationalSignificantNumber(number); |
| if (numberFormat == PhoneNumberFormat.E164) { |
| // Early exit for E164 case since no formatting of the national number needs to be applied. |
| // Extensions are not formatted. |
| formattedNumber.append(nationalSignificantNumber); |
| formatNumberByFormat(countryCallingCode, PhoneNumberFormat.E164, formattedNumber); |
| return; |
| } |
| // Note getRegionCodeForCountryCode() is used because formatting information for regions which |
| // share a country calling code is contained by only one region for performance reasons. For |
| // example, for NANPA regions it will be contained in the metadata for US. |
| String regionCode = getRegionCodeForCountryCode(countryCallingCode); |
| if (!isValidRegionCode(regionCode)) { |
| formattedNumber.append(nationalSignificantNumber); |
| return; |
| } |
| |
| formattedNumber.append(formatNationalNumber(nationalSignificantNumber, |
| regionCode, numberFormat)); |
| maybeGetFormattedExtension(number, regionCode, numberFormat, formattedNumber); |
| formatNumberByFormat(countryCallingCode, numberFormat, formattedNumber); |
| } |
| |
| /** |
| * Formats a phone number in the specified format using client-defined formatting rules. Note that |
| * if the phone number has a country calling code of zero or an otherwise invalid country calling |
| * code, we cannot work out things like whether there should be a national prefix applied, or how |
| * to format extensions, so we return the national significant number with no formatting applied. |
| * |
| * @param number the phone number to be formatted |
| * @param numberFormat the format the phone number should be formatted into |
| * @param userDefinedFormats formatting rules specified by clients |
| * @return the formatted phone number |
| */ |
| public String formatByPattern(PhoneNumber number, |
| PhoneNumberFormat numberFormat, |
| List<NumberFormat> userDefinedFormats) { |
| int countryCallingCode = number.getCountryCode(); |
| String nationalSignificantNumber = getNationalSignificantNumber(number); |
| // Note getRegionCodeForCountryCode() is used because formatting information for regions which |
| // share a country calling code is contained by only one region for performance reasons. For |
| // example, for NANPA regions it will be contained in the metadata for US. |
| String regionCode = getRegionCodeForCountryCode(countryCallingCode); |
| if (!hasValidRegionCode(regionCode, countryCallingCode, nationalSignificantNumber)) { |
| return nationalSignificantNumber; |
| } |
| List<NumberFormat> userDefinedFormatsCopy = |
| new ArrayList<NumberFormat>(userDefinedFormats.size()); |
| for (NumberFormat numFormat : userDefinedFormats) { |
| String nationalPrefixFormattingRule = numFormat.getNationalPrefixFormattingRule(); |
| if (nationalPrefixFormattingRule.length() > 0) { |
| // Before we do a replacement of the national prefix pattern $NP with the national prefix, |
| // we need to copy the rule so that subsequent replacements for different numbers have the |
| // appropriate national prefix. |
| NumberFormat numFormatCopy = new NumberFormat(); |
| numFormatCopy.mergeFrom(numFormat); |
| String nationalPrefix = getMetadataForRegion(regionCode).getNationalPrefix(); |
| if (nationalPrefix.length() > 0) { |
| // Replace $NP with national prefix and $FG with the first group ($1). |
| nationalPrefixFormattingRule = |
| NP_PATTERN.matcher(nationalPrefixFormattingRule).replaceFirst(nationalPrefix); |
| nationalPrefixFormattingRule = |
| FG_PATTERN.matcher(nationalPrefixFormattingRule).replaceFirst("\\$1"); |
| numFormatCopy.setNationalPrefixFormattingRule(nationalPrefixFormattingRule); |
| } else { |
| // We don't want to have a rule for how to format the national prefix if there isn't one. |
| numFormatCopy.clearNationalPrefixFormattingRule(); |
| } |
| userDefinedFormatsCopy.add(numFormatCopy); |
| } else { |
| // Otherwise, we just add the original rule to the modified list of formats. |
| userDefinedFormatsCopy.add(numFormat); |
| } |
| } |
| |
| StringBuilder formattedNumber = |
| new StringBuilder(formatAccordingToFormats(nationalSignificantNumber, |
| userDefinedFormatsCopy, |
| numberFormat)); |
| maybeGetFormattedExtension(number, regionCode, numberFormat, formattedNumber); |
| formatNumberByFormat(countryCallingCode, numberFormat, formattedNumber); |
| return formattedNumber.toString(); |
| } |
| |
| /** |
| * Formats a phone number in national format for dialing using the carrier as specified in the |
| * {@code carrierCode}. The {@code carrierCode} will always be used regardless of whether the |
| * phone number already has a preferred domestic carrier code stored. If {@code carrierCode} |
| * contains an empty string, returns the number in national format without any carrier code. |
| * |
| * @param number the phone number to be formatted |
| * @param carrierCode the carrier selection code to be used |
| * @return the formatted phone number in national format for dialing using the carrier as |
| * specified in the {@code carrierCode} |
| */ |
| public String formatNationalNumberWithCarrierCode(PhoneNumber number, String carrierCode) { |
| int countryCallingCode = number.getCountryCode(); |
| String nationalSignificantNumber = getNationalSignificantNumber(number); |
| // Note getRegionCodeForCountryCode() is used because formatting information for regions which |
| // share a country calling code is contained by only one region for performance reasons. For |
| // example, for NANPA regions it will be contained in the metadata for US. |
| String regionCode = getRegionCodeForCountryCode(countryCallingCode); |
| if (!hasValidRegionCode(regionCode, countryCallingCode, nationalSignificantNumber)) { |
| return nationalSignificantNumber; |
| } |
| |
| StringBuilder formattedNumber = new StringBuilder(20); |
| formattedNumber.append(formatNationalNumber(nationalSignificantNumber, |
| regionCode, |
| PhoneNumberFormat.NATIONAL, |
| carrierCode)); |
| maybeGetFormattedExtension(number, regionCode, PhoneNumberFormat.NATIONAL, formattedNumber); |
| formatNumberByFormat(countryCallingCode, PhoneNumberFormat.NATIONAL, formattedNumber); |
| return formattedNumber.toString(); |
| } |
| |
| /** |
| * Formats a phone number in national format for dialing using the carrier as specified in the |
| * preferredDomesticCarrierCode field of the PhoneNumber object passed in. If that is missing, |
| * use the {@code fallbackCarrierCode} passed in instead. If there is no |
| * {@code preferredDomesticCarrierCode}, and the {@code fallbackCarrierCode} contains an empty |
| * string, return the number in national format without any carrier code. |
| * |
| * <p>Use {@link #formatNationalNumberWithCarrierCode} instead if the carrier code passed in |
| * should take precedence over the number's {@code preferredDomesticCarrierCode} when formatting. |
| * |
| * @param number the phone number to be formatted |
| * @param fallbackCarrierCode the carrier selection code to be used, if none is found in the |
| * phone number itself |
| * @return the formatted phone number in national format for dialing using the number's |
| * {@code preferredDomesticCarrierCode}, or the {@code fallbackCarrierCode} passed in if |
| * none is found |
| */ |
| public String formatNationalNumberWithPreferredCarrierCode(PhoneNumber number, |
| String fallbackCarrierCode) { |
| return formatNationalNumberWithCarrierCode(number, number.hasPreferredDomesticCarrierCode() |
| ? number.getPreferredDomesticCarrierCode() |
| : fallbackCarrierCode); |
| } |
| |
| /** |
| * Formats a phone number for out-of-country dialing purposes. If no regionCallingFrom is |
| * supplied, we format the number in its INTERNATIONAL format. If the country calling code is the |
| * same as that of the region where the number is from, then NATIONAL formatting will be applied. |
| * |
| * <p>If the number itself has a country calling code of zero or an otherwise invalid country |
| * calling code, then we return the number with no formatting applied. |
| * |
| * <p>Note this function takes care of the case for calling inside of NANPA and between Russia and |
| * Kazakhstan (who share the same country calling code). In those cases, no international prefix |
| * is used. For regions which have multiple international prefixes, the number in its |
| * INTERNATIONAL format will be returned instead. |
| * |
| * @param number the phone number to be formatted |
| * @param regionCallingFrom the region where the call is being placed |
| * @return the formatted phone number |
| */ |
| public String formatOutOfCountryCallingNumber(PhoneNumber number, |
| String regionCallingFrom) { |
| if (!isValidRegionCode(regionCallingFrom)) { |
| return format(number, PhoneNumberFormat.INTERNATIONAL); |
| } |
| int countryCallingCode = number.getCountryCode(); |
| String regionCode = getRegionCodeForCountryCode(countryCallingCode); |
| String nationalSignificantNumber = getNationalSignificantNumber(number); |
| if (!hasValidRegionCode(regionCode, countryCallingCode, nationalSignificantNumber)) { |
| return nationalSignificantNumber; |
| } |
| if (countryCallingCode == NANPA_COUNTRY_CODE) { |
| if (isNANPACountry(regionCallingFrom)) { |
| // For NANPA regions, return the national format for these regions but prefix it with the |
| // country calling code. |
| return countryCallingCode + " " + format(number, PhoneNumberFormat.NATIONAL); |
| } |
| } else if (countryCallingCode == getCountryCodeForRegion(regionCallingFrom)) { |
| // For regions that share a country calling code, the country calling code need not be dialled. |
| // This also applies when dialling within a region, so this if clause covers both these cases. |
| // Technically this is the case for dialling from La Reunion to other overseas departments of |
| // France (French Guiana, Martinique, Guadeloupe), but not vice versa - so we don't cover this |
| // edge case for now and for those cases return the version including country calling code. |
| // Details here: http://www.petitfute.com/voyage/225-info-pratiques-reunion |
| return format(number, PhoneNumberFormat.NATIONAL); |
| } |
| String formattedNationalNumber = |
| formatNationalNumber(nationalSignificantNumber, |
| regionCode, PhoneNumberFormat.INTERNATIONAL); |
| PhoneMetadata metadata = getMetadataForRegion(regionCallingFrom); |
| String internationalPrefix = metadata.getInternationalPrefix(); |
| |
| // For regions that have multiple international prefixes, the international format of the |
| // number is returned, unless there is a preferred international prefix. |
| String internationalPrefixForFormatting = ""; |
| if (UNIQUE_INTERNATIONAL_PREFIX.matcher(internationalPrefix).matches()) { |
| internationalPrefixForFormatting = internationalPrefix; |
| } else if (metadata.hasPreferredInternationalPrefix()) { |
| internationalPrefixForFormatting = metadata.getPreferredInternationalPrefix(); |
| } |
| |
| StringBuilder formattedNumber = new StringBuilder(formattedNationalNumber); |
| maybeGetFormattedExtension(number, regionCode, PhoneNumberFormat.INTERNATIONAL, |
| formattedNumber); |
| if (internationalPrefixForFormatting.length() > 0) { |
| formattedNumber.insert(0, " ").insert(0, countryCallingCode).insert(0, " ") |
| .insert(0, internationalPrefixForFormatting); |
| } else { |
| formatNumberByFormat(countryCallingCode, |
| PhoneNumberFormat.INTERNATIONAL, |
| formattedNumber); |
| } |
| return formattedNumber.toString(); |
| } |
| |
| /** |
| * Formats a phone number using the original phone number format that the number is parsed from. |
| * The original format is embedded in the country_code_source field of the PhoneNumber object |
| * passed in. If such information is missing, the number will be formatted into the NATIONAL |
| * format by default. |
| * |
| * @param number the phone number that needs to be formatted in its original number format |
| * @param regionCallingFrom the region whose IDD needs to be prefixed if the original number |
| * has one |
| * @return the formatted phone number in its original number format |
| */ |
| public String formatInOriginalFormat(PhoneNumber number, String regionCallingFrom) { |
| if (!number.hasCountryCodeSource()) { |
| return format(number, PhoneNumberFormat.NATIONAL); |
| } |
| switch (number.getCountryCodeSource()) { |
| case FROM_NUMBER_WITH_PLUS_SIGN: |
| return format(number, PhoneNumberFormat.INTERNATIONAL); |
| case FROM_NUMBER_WITH_IDD: |
| return formatOutOfCountryCallingNumber(number, regionCallingFrom); |
| case FROM_NUMBER_WITHOUT_PLUS_SIGN: |
| return format(number, PhoneNumberFormat.INTERNATIONAL).substring(1); |
| case FROM_DEFAULT_COUNTRY: |
| default: |
| return format(number, PhoneNumberFormat.NATIONAL); |
| } |
| } |
| |
| /** |
| * Formats a phone number for out-of-country dialing purposes. |
| * |
| * Note that in this version, if the number was entered originally using alpha characters and |
| * this version of the number is stored in raw_input, this representation of the number will be |
| * used rather than the digit representation. Grouping information, as specified by characters |
| * such as "-" and " ", will be retained. |
| * |
| * <p><b>Caveats:</b></p> |
| * <ul> |
| * <li> This will not produce good results if the country calling code is both present in the raw |
| * input _and_ is the start of the national number. This is not a problem in the regions |
| * which typically use alpha numbers. |
| * <li> This will also not produce good results if the raw input has any grouping information |
| * within the first three digits of the national number, and if the function needs to strip |
| * preceding digits/words in the raw input before these digits. Normally people group the |
| * first three digits together so this is not a huge problem - and will be fixed if it |
| * proves to be so. |
| * </ul> |
| * |
| * @param number the phone number that needs to be formatted |
| * @param regionCallingFrom the region where the call is being placed |
| * @return the formatted phone number |
| */ |
| public String formatOutOfCountryKeepingAlphaChars(PhoneNumber number, |
| String regionCallingFrom) { |
| String rawInput = number.getRawInput(); |
| // If there is no raw input, then we can't keep alpha characters because there aren't any. |
| // In this case, we return formatOutOfCountryCallingNumber. |
| if (rawInput.length() == 0) { |
| return formatOutOfCountryCallingNumber(number, regionCallingFrom); |
| } |
| int countryCode = number.getCountryCode(); |
| String regionCode = getRegionCodeForCountryCode(countryCode); |
| if (!hasValidRegionCode(regionCode, countryCode, rawInput)) { |
| return rawInput; |
| } |
| // Strip any prefix such as country calling code, IDD, that was present. We do this by comparing |
| // the number in raw_input with the parsed number. |
| // To do this, first we normalize punctuation. We retain number grouping symbols such as " " |
| // only. |
| rawInput = normalizeHelper(rawInput, ALL_PLUS_NUMBER_GROUPING_SYMBOLS, true); |
| // Now we trim everything before the first three digits in the parsed number. We choose three |
| // because all valid alpha numbers have 3 digits at the start - if it does not, then we don't |
| // trim anything at all. Similarly, if the national number was less than three digits, we don't |
| // trim anything at all. |
| String nationalNumber = getNationalSignificantNumber(number); |
| if (nationalNumber.length() > 3) { |
| int firstNationalNumberDigit = rawInput.indexOf(nationalNumber.substring(0, 3)); |
| if (firstNationalNumberDigit != -1) { |
| rawInput = rawInput.substring(firstNationalNumberDigit); |
| } |
| } |
| PhoneMetadata metadata = getMetadataForRegion(regionCallingFrom); |
| if (countryCode == NANPA_COUNTRY_CODE) { |
| if (isNANPACountry(regionCallingFrom)) { |
| return countryCode + " " + rawInput; |
| } |
| } else if (countryCode == getCountryCodeForRegion(regionCallingFrom)) { |
| // Here we copy the formatting rules so we can modify the pattern we expect to match against. |
| List<NumberFormat> availableFormats = |
| new ArrayList<NumberFormat>(metadata.numberFormatSize()); |
| for (NumberFormat format : metadata.numberFormats()) { |
| NumberFormat newFormat = new NumberFormat(); |
| newFormat.mergeFrom(format); |
| // The first group is the first group of digits that the user determined. |
| newFormat.setPattern("(\\d+)(.*)"); |
| // Here we just concatenate them back together after the national prefix has been fixed. |
| newFormat.setFormat("$1$2"); |
| availableFormats.add(newFormat); |
| } |
| // Now we format using these patterns instead of the default pattern, but with the national |
| // prefix prefixed if necessary, by choosing the format rule based on the leading digits |
| // present in the unformatted national number. |
| // This will not work in the cases where the pattern (and not the leading digits) decide |
| // whether a national prefix needs to be used, since we have overridden the pattern to match |
| // anything, but that is not the case in the metadata to date. |
| return formatAccordingToFormats(rawInput, availableFormats, PhoneNumberFormat.NATIONAL); |
| } |
| String internationalPrefix = metadata.getInternationalPrefix(); |
| // For countries that have multiple international prefixes, the international format of the |
| // number is returned, unless there is a preferred international prefix. |
| String internationalPrefixForFormatting = |
| UNIQUE_INTERNATIONAL_PREFIX.matcher(internationalPrefix).matches() |
| ? internationalPrefix |
| : metadata.getPreferredInternationalPrefix(); |
| StringBuilder formattedNumber = new StringBuilder(rawInput); |
| maybeGetFormattedExtension(number, regionCode, PhoneNumberFormat.INTERNATIONAL, |
| formattedNumber); |
| if (internationalPrefixForFormatting.length() > 0) { |
| formattedNumber.insert(0, " ").insert(0, countryCode).insert(0, " ") |
| .insert(0, internationalPrefixForFormatting); |
| } else { |
| formatNumberByFormat(countryCode, |
| PhoneNumberFormat.INTERNATIONAL, |
| formattedNumber); |
| } |
| return formattedNumber.toString(); |
| } |
| |
| /** |
| * Gets the national significant number of the a phone number. Note a national significant number |
| * doesn't contain a national prefix or any formatting. |
| * |
| * @param number the phone number for which the national significant number is needed |
| * @return the national significant number of the PhoneNumber object passed in |
| */ |
| public String getNationalSignificantNumber(PhoneNumber number) { |
| // The leading zero in the national (significant) number of an Italian phone number has a |
| // special meaning. Unlike the rest of the world, it indicates the number is a landline |
| // number. There have been plans to migrate landline numbers to start with the digit two since |
| // December 2000, but it has not yet happened. |
| // See http://en.wikipedia.org/wiki/%2B39 for more details. |
| // Other regions such as Cote d'Ivoire and Gabon use this for their mobile numbers. |
| StringBuilder nationalNumber = new StringBuilder( |
| (number.hasItalianLeadingZero() && |
| number.isItalianLeadingZero() && |
| isLeadingZeroPossible(number.getCountryCode())) |
| ? "0" : "" |
| ); |
| nationalNumber.append(number.getNationalNumber()); |
| return nationalNumber.toString(); |
| } |
| |
| /** |
| * A helper function that is used by format and formatByPattern. |
| */ |
| private void formatNumberByFormat(int countryCallingCode, |
| PhoneNumberFormat numberFormat, |
| StringBuilder formattedNumber) { |
| switch (numberFormat) { |
| case E164: |
| formattedNumber.insert(0, countryCallingCode).insert(0, PLUS_SIGN); |
| return; |
| case INTERNATIONAL: |
| formattedNumber.insert(0, " ").insert(0, countryCallingCode).insert(0, PLUS_SIGN); |
| return; |
| case RFC3966: |
| formattedNumber.insert(0, "-").insert(0, countryCallingCode) .insert(0, PLUS_SIGN); |
| return; |
| case NATIONAL: |
| default: |
| return; |
| } |
| } |
| |
| // Simple wrapper of formatNationalNumber for the common case of no carrier code. |
| private String formatNationalNumber(String number, |
| String regionCode, |
| PhoneNumberFormat numberFormat) { |
| return formatNationalNumber(number, regionCode, numberFormat, null); |
| } |
| |
| // Note in some regions, the national number can be written in two completely different ways |
| // depending on whether it forms part of the NATIONAL format or INTERNATIONAL format. The |
| // numberFormat parameter here is used to specify which format to use for those cases. If a |
| // carrierCode is specified, this will be inserted into the formatted string to replace $CC. |
| private String formatNationalNumber(String number, |
| String regionCode, |
| PhoneNumberFormat numberFormat, |
| String carrierCode) { |
| PhoneMetadata metadata = getMetadataForRegion(regionCode); |
| List<NumberFormat> intlNumberFormats = metadata.intlNumberFormats(); |
| // When the intlNumberFormats exists, we use that to format national number for the |
| // INTERNATIONAL format instead of using the numberDesc.numberFormats. |
| List<NumberFormat> availableFormats = |
| (intlNumberFormats.size() == 0 || numberFormat == PhoneNumberFormat.NATIONAL) |
| ? metadata.numberFormats() |
| : metadata.intlNumberFormats(); |
| String formattedNationalNumber = |
| formatAccordingToFormats(number, availableFormats, numberFormat, carrierCode); |
| if (numberFormat == PhoneNumberFormat.RFC3966) { |
| formattedNationalNumber = |
| SEPARATOR_PATTERN.matcher(formattedNationalNumber).replaceAll("-"); |
| } |
| return formattedNationalNumber; |
| } |
| |
| // Simple wrapper of formatAccordingToFormats for the common case of no carrier code. |
| private String formatAccordingToFormats(String nationalNumber, |
| List<NumberFormat> availableFormats, |
| PhoneNumberFormat numberFormat) { |
| return formatAccordingToFormats(nationalNumber, availableFormats, numberFormat, null); |
| } |
| |
| // Note that carrierCode is optional - if NULL or an empty string, no carrier code replacement |
| // will take place. |
| private String formatAccordingToFormats(String nationalNumber, |
| List<NumberFormat> availableFormats, |
| PhoneNumberFormat numberFormat, |
| String carrierCode) { |
| for (NumberFormat numFormat : availableFormats) { |
| int size = numFormat.leadingDigitsPatternSize(); |
| if (size == 0 || regexCache.getPatternForRegex( |
| // We always use the last leading_digits_pattern, as it is the most detailed. |
| numFormat.getLeadingDigitsPattern(size - 1)).matcher(nationalNumber).lookingAt()) { |
| Matcher m = regexCache.getPatternForRegex(numFormat.getPattern()).matcher(nationalNumber); |
| if (m.matches()) { |
| String numberFormatRule = numFormat.getFormat(); |
| if (numberFormat == PhoneNumberFormat.NATIONAL && |
| carrierCode != null && carrierCode.length() > 0 && |
| numFormat.getDomesticCarrierCodeFormattingRule().length() > 0) { |
| // Replace the $CC in the formatting rule with the desired carrier code. |
| String carrierCodeFormattingRule = numFormat.getDomesticCarrierCodeFormattingRule(); |
| carrierCodeFormattingRule = |
| CC_PATTERN.matcher(carrierCodeFormattingRule).replaceFirst(carrierCode); |
| // Now replace the $FG in the formatting rule with the first group and the carrier code |
| // combined in the appropriate way. |
| numberFormatRule = FIRST_GROUP_PATTERN.matcher(numberFormatRule) |
| .replaceFirst(carrierCodeFormattingRule); |
| return m.replaceAll(numberFormatRule); |
| } else { |
| // Use the national prefix formatting rule instead. |
| String nationalPrefixFormattingRule = numFormat.getNationalPrefixFormattingRule(); |
| if (numberFormat == PhoneNumberFormat.NATIONAL && |
| nationalPrefixFormattingRule != null && |
| nationalPrefixFormattingRule.length() > 0) { |
| Matcher firstGroupMatcher = FIRST_GROUP_PATTERN.matcher(numberFormatRule); |
| return m.replaceAll(firstGroupMatcher.replaceFirst(nationalPrefixFormattingRule)); |
| } else { |
| return m.replaceAll(numberFormatRule); |
| } |
| } |
| } |
| } |
| } |
| |
| // If no pattern above is matched, we format the number as a whole. |
| return nationalNumber; |
| } |
| |
| /** |
| * Gets a valid number for the specified region. |
| * |
| * @param regionCode the region for which an example number is needed |
| * @return a valid fixed-line number for the specified region. Returns null when the metadata |
| * does not contain such information. |
| */ |
| public PhoneNumber getExampleNumber(String regionCode) { |
| return getExampleNumberForType(regionCode, PhoneNumberType.FIXED_LINE); |
| } |
| |
| /** |
| * Gets a valid number for the specified region and number type. |
| * |
| * @param regionCode the region for which an example number is needed |
| * @param type the type of number that is needed |
| * @return a valid number for the specified region and type. Returns null when the metadata |
| * does not contain such information or if an invalid region was entered. |
| */ |
| public PhoneNumber getExampleNumberForType(String regionCode, PhoneNumberType type) { |
| // Check the region code is valid. |
| if (!isValidRegionCode(regionCode)) { |
| LOGGER.log(Level.WARNING, "Invalid or unknown region code provided."); |
| return null; |
| } |
| PhoneNumberDesc desc = getNumberDescByType(getMetadataForRegion(regionCode), type); |
| try { |
| if (desc.hasExampleNumber()) { |
| return parse(desc.getExampleNumber(), regionCode); |
| } |
| } catch (NumberParseException e) { |
| LOGGER.log(Level.SEVERE, e.toString()); |
| } |
| return null; |
| } |
| |
| /** |
| * Appends the formatted extension of a phone number to formattedNumber, if the phone number had |
| * an extension specified. |
| */ |
| private void maybeGetFormattedExtension(PhoneNumber number, String regionCode, |
| PhoneNumberFormat numberFormat, |
| StringBuilder formattedNumber) { |
| if (number.hasExtension() && number.getExtension().length() > 0) { |
| if (numberFormat == PhoneNumberFormat.RFC3966) { |
| formattedNumber.append(RFC3966_EXTN_PREFIX).append(number.getExtension()); |
| } else { |
| formatExtension(number.getExtension(), regionCode, formattedNumber); |
| } |
| } |
| } |
| |
| /** |
| * Formats the extension part of the phone number by prefixing it with the appropriate extension |
| * prefix. This will be the default extension prefix, unless overridden by a preferred |
| * extension prefix for this region. |
| */ |
| private void formatExtension(String extensionDigits, String regionCode, |
| StringBuilder extension) { |
| PhoneMetadata metadata = getMetadataForRegion(regionCode); |
| if (metadata.hasPreferredExtnPrefix()) { |
| extension.append(metadata.getPreferredExtnPrefix()).append(extensionDigits); |
| } else { |
| extension.append(DEFAULT_EXTN_PREFIX).append(extensionDigits); |
| } |
| } |
| |
| PhoneNumberDesc getNumberDescByType(PhoneMetadata metadata, PhoneNumberType type) { |
| switch (type) { |
| case PREMIUM_RATE: |
| return metadata.getPremiumRate(); |
| case TOLL_FREE: |
| return metadata.getTollFree(); |
| case MOBILE: |
| return metadata.getMobile(); |
| case FIXED_LINE: |
| case FIXED_LINE_OR_MOBILE: |
| return metadata.getFixedLine(); |
| case SHARED_COST: |
| return metadata.getSharedCost(); |
| case VOIP: |
| return metadata.getVoip(); |
| case PERSONAL_NUMBER: |
| return metadata.getPersonalNumber(); |
| case PAGER: |
| return metadata.getPager(); |
| case UAN: |
| return metadata.getUan(); |
| default: |
| return metadata.getGeneralDesc(); |
| } |
| } |
| |
| /** |
| * Gets the type of a phone number. |
| * |
| * @param number the phone number that we want to know the type |
| * @return the type of the phone number |
| */ |
| public PhoneNumberType getNumberType(PhoneNumber number) { |
| String regionCode = getRegionCodeForNumber(number); |
| if (!isValidRegionCode(regionCode)) { |
| return PhoneNumberType.UNKNOWN; |
| } |
| String nationalSignificantNumber = getNationalSignificantNumber(number); |
| return getNumberTypeHelper(nationalSignificantNumber, getMetadataForRegion(regionCode)); |
| } |
| |
| private PhoneNumberType getNumberTypeHelper(String nationalNumber, PhoneMetadata metadata) { |
| PhoneNumberDesc generalNumberDesc = metadata.getGeneralDesc(); |
| if (!generalNumberDesc.hasNationalNumberPattern() || |
| !isNumberMatchingDesc(nationalNumber, generalNumberDesc)) { |
| return PhoneNumberType.UNKNOWN; |
| } |
| |
| if (isNumberMatchingDesc(nationalNumber, metadata.getPremiumRate())) { |
| return PhoneNumberType.PREMIUM_RATE; |
| } |
| if (isNumberMatchingDesc(nationalNumber, metadata.getTollFree())) { |
| return PhoneNumberType.TOLL_FREE; |
| } |
| if (isNumberMatchingDesc(nationalNumber, metadata.getSharedCost())) { |
| return PhoneNumberType.SHARED_COST; |
| } |
| if (isNumberMatchingDesc(nationalNumber, metadata.getVoip())) { |
| return PhoneNumberType.VOIP; |
| } |
| if (isNumberMatchingDesc(nationalNumber, metadata.getPersonalNumber())) { |
| return PhoneNumberType.PERSONAL_NUMBER; |
| } |
| if (isNumberMatchingDesc(nationalNumber, metadata.getPager())) { |
| return PhoneNumberType.PAGER; |
| } |
| if (isNumberMatchingDesc(nationalNumber, metadata.getUan())) { |
| return PhoneNumberType.UAN; |
| } |
| |
| boolean isFixedLine = isNumberMatchingDesc(nationalNumber, metadata.getFixedLine()); |
| if (isFixedLine) { |
| if (metadata.isSameMobileAndFixedLinePattern()) { |
| return PhoneNumberType.FIXED_LINE_OR_MOBILE; |
| } else if (isNumberMatchingDesc(nationalNumber, metadata.getMobile())) { |
| return PhoneNumberType.FIXED_LINE_OR_MOBILE; |
| } |
| return PhoneNumberType.FIXED_LINE; |
| } |
| // Otherwise, test to see if the number is mobile. Only do this if certain that the patterns for |
| // mobile and fixed line aren't the same. |
| if (!metadata.isSameMobileAndFixedLinePattern() && |
| isNumberMatchingDesc(nationalNumber, metadata.getMobile())) { |
| return PhoneNumberType.MOBILE; |
| } |
| return PhoneNumberType.UNKNOWN; |
| } |
| |
| PhoneMetadata getMetadataForRegion(String regionCode) { |
| if (!isValidRegionCode(regionCode)) { |
| return null; |
| } |
| if (!regionToMetadataMap.containsKey(regionCode)) { |
| loadMetadataForRegionFromFile(currentFilePrefix, regionCode); |
| } |
| return regionToMetadataMap.get(regionCode); |
| } |
| |
| private boolean isNumberMatchingDesc(String nationalNumber, PhoneNumberDesc numberDesc) { |
| Matcher possibleNumberPatternMatcher = |
| regexCache.getPatternForRegex(numberDesc.getPossibleNumberPattern()) |
| .matcher(nationalNumber); |
| Matcher nationalNumberPatternMatcher = |
| regexCache.getPatternForRegex(numberDesc.getNationalNumberPattern()) |
| .matcher(nationalNumber); |
| return possibleNumberPatternMatcher.matches() && nationalNumberPatternMatcher.matches(); |
| } |
| |
| /** |
| * Tests whether a phone number matches a valid pattern. Note this doesn't verify the number |
| * is actually in use, which is impossible to tell by just looking at a number itself. |
| * |
| * @param number the phone number that we want to validate |
| * @return a boolean that indicates whether the number is of a valid pattern |
| */ |
| public boolean isValidNumber(PhoneNumber number) { |
| String regionCode = getRegionCodeForNumber(number); |
| return (isValidRegionCode(regionCode) && isValidNumberForRegion(number, regionCode)); |
| } |
| |
| /** |
| * Tests whether a phone number is valid for a certain region. Note this doesn't verify the number |
| * is actually in use, which is impossible to tell by just looking at a number itself. If the |
| * country calling code is not the same as the country calling code for the region, this |
| * immediately exits with false. After this, the specific number pattern rules for the region are |
| * examined. This is useful for determining for example whether a particular number is valid for |
| * Canada, rather than just a valid NANPA number. |
| * |
| * @param number the phone number that we want to validate |
| * @param regionCode the region that we want to validate the phone number for |
| * @return a boolean that indicates whether the number is of a valid pattern |
| */ |
| public boolean isValidNumberForRegion(PhoneNumber number, String regionCode) { |
| if (number.getCountryCode() != getCountryCodeForRegion(regionCode)) { |
| return false; |
| } |
| PhoneMetadata metadata = getMetadataForRegion(regionCode); |
| PhoneNumberDesc generalNumDesc = metadata.getGeneralDesc(); |
| String nationalSignificantNumber = getNationalSignificantNumber(number); |
| |
| // For regions where we don't have metadata for PhoneNumberDesc, we treat any number passed in |
| // as a valid number if its national significant number is between the minimum and maximum |
| // lengths defined by ITU for a national significant number. |
| if (!generalNumDesc.hasNationalNumberPattern()) { |
| int numberLength = nationalSignificantNumber.length(); |
| return numberLength > MIN_LENGTH_FOR_NSN && numberLength <= MAX_LENGTH_FOR_NSN; |
| } |
| return getNumberTypeHelper(nationalSignificantNumber, metadata) != PhoneNumberType.UNKNOWN; |
| } |
| |
| /** |
| * Returns the region where a phone number is from. This could be used for geocoding at the region |
| * level. |
| * |
| * @param number the phone number whose origin we want to know |
| * @return the region where the phone number is from, or null if no region matches this calling |
| * code |
| */ |
| public String getRegionCodeForNumber(PhoneNumber number) { |
| int countryCode = number.getCountryCode(); |
| List<String> regions = countryCallingCodeToRegionCodeMap.get(countryCode); |
| if (regions == null) { |
| return null; |
| } |
| if (regions.size() == 1) { |
| return regions.get(0); |
| } else { |
| return getRegionCodeForNumberFromRegionList(number, regions); |
| } |
| } |
| |
| private String getRegionCodeForNumberFromRegionList(PhoneNumber number, |
| List<String> regionCodes) { |
| String nationalNumber = getNationalSignificantNumber(number); |
| for (String regionCode : regionCodes) { |
| // If leadingDigits is present, use this. Otherwise, do full validation. |
| PhoneMetadata metadata = getMetadataForRegion(regionCode); |
| if (metadata.hasLeadingDigits()) { |
| if (regexCache.getPatternForRegex(metadata.getLeadingDigits()) |
| .matcher(nationalNumber).lookingAt()) { |
| return regionCode; |
| } |
| } else if (getNumberTypeHelper(nationalNumber, metadata) != PhoneNumberType.UNKNOWN) { |
| return regionCode; |
| } |
| } |
| return null; |
| } |
| |
| /** |
| * Returns the region code that matches the specific country calling code. In the case of no |
| * region code being found, ZZ will be returned. In the case of multiple regions, the one |
| * designated in the metadata as the "main" region for this calling code will be returned. |
| */ |
| public String getRegionCodeForCountryCode(int countryCallingCode) { |
| List<String> regionCodes = countryCallingCodeToRegionCodeMap.get(countryCallingCode); |
| return regionCodes == null ? UNKNOWN_REGION : regionCodes.get(0); |
| } |
| |
| /** |
| * Returns the country calling code for a specific region. For example, this would be 1 for the |
| * United States, and 64 for New Zealand. |
| * |
| * @param regionCode the region that we want to get the country calling code for |
| * @return the country calling code for the region denoted by regionCode |
| */ |
| public int getCountryCodeForRegion(String regionCode) { |
| if (!isValidRegionCode(regionCode)) { |
| return 0; |
| } |
| PhoneMetadata metadata = getMetadataForRegion(regionCode); |
| return metadata.getCountryCode(); |
| } |
| |
| /** |
| * Returns the national dialling prefix for a specific region. For example, this would be 1 for |
| * the United States, and 0 for New Zealand. Set stripNonDigits to true to strip symbols like "~" |
| * (which indicates a wait for a dialling tone) from the prefix returned. If no national prefix is |
| * present, we return null. |
| * |
| * <p>Warning: Do not use this method for do-your-own formatting - for some regions, the |
| * national dialling prefix is used only for certain types of numbers. Use the library's |
| * formatting functions to prefix the national prefix when required. |
| * |
| * @param regionCode the region that we want to get the dialling prefix for |
| * @param stripNonDigits true to strip non-digits from the national dialling prefix |
| * @return the dialling prefix for the region denoted by regionCode |
| */ |
| public String getNddPrefixForRegion(String regionCode, boolean stripNonDigits) { |
| if (!isValidRegionCode(regionCode)) { |
| LOGGER.log(Level.SEVERE, "Invalid or missing region code provided."); |
| return null; |
| } |
| PhoneMetadata metadata = getMetadataForRegion(regionCode); |
| String nationalPrefix = metadata.getNationalPrefix(); |
| // If no national prefix was found, we return null. |
| if (nationalPrefix.length() == 0) { |
| return null; |
| } |
| if (stripNonDigits) { |
| // Note: if any other non-numeric symbols are ever used in national prefixes, these would have |
| // to be removed here as well. |
| nationalPrefix = nationalPrefix.replace("~", ""); |
| } |
| return nationalPrefix; |
| } |
| |
| /** |
| * Checks if this is a region under the North American Numbering Plan Administration (NANPA). |
| * |
| * @return true if regionCode is one of the regions under NANPA |
| */ |
| public boolean isNANPACountry(String regionCode) { |
| return regionCode != null && nanpaRegions.contains(regionCode); |
| } |
| |
| /** |
| * Checks whether the country calling code is from a region whose national significant number |
| * could contain a leading zero. An example of such a region is Italy. Returns false if no |
| * metadata for the country is found. |
| */ |
| public boolean isLeadingZeroPossible(int countryCallingCode) { |
| PhoneMetadata mainMetadataForCallingCode = getMetadataForRegion( |
| getRegionCodeForCountryCode(countryCallingCode)); |
| if (mainMetadataForCallingCode == null) { |
| return false; |
| } |
| return mainMetadataForCallingCode.isLeadingZeroPossible(); |
| } |
| |
| /** |
| * Checks if the number is a valid vanity (alpha) number such as 800 MICROSOFT. A valid vanity |
| * number will start with at least 3 digits and will have three or more alpha characters. This |
| * does not do region-specific checks - to work out if this number is actually valid for a region, |
| * it should be parsed and methods such as {@link #isPossibleNumberWithReason} and |
| * {@link #isValidNumber} should be used. |
| * |
| * @param number the number that needs to be checked |
| * @return true if the number is a valid vanity number |
| */ |
| public boolean isAlphaNumber(String number) { |
| if (!isViablePhoneNumber(number)) { |
| // Number is too short, or doesn't match the basic phone number pattern. |
| return false; |
| } |
| StringBuilder strippedNumber = new StringBuilder(number); |
| maybeStripExtension(strippedNumber); |
| return VALID_ALPHA_PHONE_PATTERN.matcher(strippedNumber).matches(); |
| } |
| |
| /** |
| * Convenience wrapper around {@link #isPossibleNumberWithReason}. Instead of returning the reason |
| * for failure, this method returns a boolean value. |
| * @param number the number that needs to be checked |
| * @return true if the number is possible |
| */ |
| public boolean isPossibleNumber(PhoneNumber number) { |
| return isPossibleNumberWithReason(number) == ValidationResult.IS_POSSIBLE; |
| } |
| |
| /** |
| * Helper method to check a number against a particular pattern and determine whether it matches, |
| * or is too short or too long. Currently, if a number pattern suggests that numbers of length 7 |
| * and 10 are possible, and a number in between these possible lengths is entered, such as of |
| * length 8, this will return TOO_LONG. |
| */ |
| private ValidationResult testNumberLengthAgainstPattern(Pattern numberPattern, String number) { |
| Matcher numberMatcher = numberPattern.matcher(number); |
| if (numberMatcher.matches()) { |
| return ValidationResult.IS_POSSIBLE; |
| } |
| if (numberMatcher.lookingAt()) { |
| return ValidationResult.TOO_LONG; |
| } else { |
| return ValidationResult.TOO_SHORT; |
| } |
| } |
| |
| /** |
| * Check whether a phone number is a possible number. It provides a more lenient check than |
| * {@link #isValidNumber} in the following sense: |
| *<ol> |
| * <li> It only checks the length of phone numbers. In particular, it doesn't check starting |
| * digits of the number. |
| * <li> It doesn't attempt to figure out the type of the number, but uses general rules which |
| * applies to all types of phone numbers in a region. Therefore, it is much faster than |
| * isValidNumber. |
| * <li> For fixed line numbers, many regions have the concept of area code, which together with |
| * subscriber number constitute the national significant number. It is sometimes okay to dial |
| * the subscriber number only when dialing in the same area. This function will return |
| * true if the subscriber-number-only version is passed in. On the other hand, because |
| * isValidNumber validates using information on both starting digits (for fixed line |
| * numbers, that would most likely be area codes) and length (obviously includes the |
| * length of area codes for fixed line numbers), it will return false for the |
| * subscriber-number-only version. |
| * </ol |
| * @param number the number that needs to be checked |
| * @return a ValidationResult object which indicates whether the number is possible |
| */ |
| public ValidationResult isPossibleNumberWithReason(PhoneNumber number) { |
| String nationalNumber = getNationalSignificantNumber(number); |
| int countryCode = number.getCountryCode(); |
| // Note: For Russian Fed and NANPA numbers, we just use the rules from the default region (US or |
| // Russia) since the getRegionCodeForNumber will not work if the number is possible but not |
| // valid. This would need to be revisited if the possible number pattern ever differed between |
| // various regions within those plans. |
| String regionCode = getRegionCodeForCountryCode(countryCode); |
| if (!isValidRegionCode(regionCode)) { |
| return ValidationResult.INVALID_COUNTRY_CODE; |
| } |
| PhoneNumberDesc generalNumDesc = getMetadataForRegion(regionCode).getGeneralDesc(); |
| // Handling case of numbers with no metadata. |
| if (!generalNumDesc.hasNationalNumberPattern()) { |
| LOGGER.log(Level.FINER, "Checking if number is possible with incomplete metadata."); |
| int numberLength = nationalNumber.length(); |
| if (numberLength < MIN_LENGTH_FOR_NSN) { |
| return ValidationResult.TOO_SHORT; |
| } else if (numberLength > MAX_LENGTH_FOR_NSN) { |
| return ValidationResult.TOO_LONG; |
| } else { |
| return ValidationResult.IS_POSSIBLE; |
| } |
| } |
| Pattern possibleNumberPattern = |
| regexCache.getPatternForRegex(generalNumDesc.getPossibleNumberPattern()); |
| return testNumberLengthAgainstPattern(possibleNumberPattern, nationalNumber); |
| } |
| |
| /** |
| * Check whether a phone number is a possible number given a number in the form of a string, and |
| * the region where the number could be dialed from. It provides a more lenient check than |
| * {@link #isValidNumber}. See {@link #isPossibleNumber(PhoneNumber)} for details. |
| * |
| * <p>This method first parses the number, then invokes {@link #isPossibleNumber(PhoneNumber |
| * number)} with the resultant PhoneNumber object. |
| * |
| * @param number the number that needs to be checked, in the form of a string |
| * @param regionDialingFrom the region that we are expecting the number to be dialed from. |
| * Note this is different from the region where the number belongs. For example, the number |
| * +1 650 253 0000 is a number that belongs to US. When written in this form, it can be |
| * dialed from any region. When it is written as 00 1 650 253 0000, it can be dialed from any |
| * region which uses an international dialling prefix of 00. When it is written as |
| * 650 253 0000, it can only be dialed from within the US, and when written as 253 0000, it |
| * can only be dialed from within a smaller area in the US (Mountain View, CA, to be more |
| * specific). |
| * @return true if the number is possible |
| */ |
| public boolean isPossibleNumber(String number, String regionDialingFrom) { |
| try { |
| return isPossibleNumber(parse(number, regionDialingFrom)); |
| } catch (NumberParseException e) { |
| return false; |
| } |
| } |
| |
| /** |
| * Attempts to extract a valid number from a phone number that is too long to be valid, and resets |
| * the PhoneNumber object passed in to that valid version. If no valid number could be extracted, |
| * the PhoneNumber object passed in will not be modified. |
| * @param number a PhoneNumber object which contains a number that is too long to be valid. |
| * @return true if a valid phone number can be successfully extracted. |
| */ |
| public boolean truncateTooLongNumber(PhoneNumber number) { |
| if (isValidNumber(number)) { |
| return true; |
| } |
| PhoneNumber numberCopy = new PhoneNumber(); |
| numberCopy.mergeFrom(number); |
| long nationalNumber = number.getNationalNumber(); |
| do { |
| nationalNumber /= 10; |
| numberCopy.setNationalNumber(nationalNumber); |
| if (isPossibleNumberWithReason(numberCopy) == ValidationResult.TOO_SHORT || |
| nationalNumber == 0) { |
| return false; |
| } |
| } while (!isValidNumber(numberCopy)); |
| number.setNationalNumber(nationalNumber); |
| return true; |
| } |
| |
| /** |
| * Gets an {@link com.google.i18n.phonenumbers.AsYouTypeFormatter} for the specific region. |
| * |
| * @param regionCode the region where the phone number is being entered |
| * @return an {@link com.google.i18n.phonenumbers.AsYouTypeFormatter} object, which can be used |
| * to format phone numbers in the specific region "as you type" |
| */ |
| public AsYouTypeFormatter getAsYouTypeFormatter(String regionCode) { |
| return new AsYouTypeFormatter(regionCode); |
| } |
| |
| // Extracts country calling code from fullNumber, returns it and places the remaining number in |
| // nationalNumber. It assumes that the leading plus sign or IDD has already been removed. Returns |
| // 0 if fullNumber doesn't start with a valid country calling code, and leaves nationalNumber |
| // unmodified. |
| int extractCountryCode(StringBuilder fullNumber, StringBuilder nationalNumber) { |
| int potentialCountryCode; |
| int numberLength = fullNumber.length(); |
| for (int i = 1; i <= MAX_LENGTH_COUNTRY_CODE && i <= numberLength; i++) { |
| potentialCountryCode = Integer.parseInt(fullNumber.substring(0, i)); |
| if (countryCallingCodeToRegionCodeMap.containsKey(potentialCountryCode)) { |
| nationalNumber.append(fullNumber.substring(i)); |
| return potentialCountryCode; |
| } |
| } |
| return 0; |
| } |
| |
| /** |
| * Tries to extract a country calling code from a number. This method will return zero if no |
| * country calling code is considered to be present. Country calling codes are extracted in the |
| * following ways: |
| * <ul> |
| * <li> by stripping the international dialing prefix of the region the person is dialing from, |
| * if this is present in the number, and looking at the next digits |
| * <li> by stripping the '+' sign if present and then looking at the next digits |
| * <li> by comparing the start of the number and the country calling code of the default region. |
| * If the number is not considered possible for the numbering plan of the default region |
| * initially, but starts with the country calling code of this region, validation will be |
| * reattempted after stripping this country calling code. If this number is considered a |
| * possible number, then the first digits will be considered the country calling code and |
| * removed as such. |
| * </ul> |
| * It will throw a NumberParseException if the number starts with a '+' but the country calling |
| * code supplied after this does not match that of any known region. |
| * |
| * @param number non-normalized telephone number that we wish to extract a country calling |
| * code from - may begin with '+' |
| * @param defaultRegionMetadata metadata about the region this number may be from |
| * @param nationalNumber a string buffer to store the national significant number in, in the case |
| * that a country calling code was extracted. The number is appended to any existing contents. |
| * If no country calling code was extracted, this will be left unchanged. |
| * @param keepRawInput true if the country_code_source and preferred_carrier_code fields of |
| * phoneNumber should be populated. |
| * @param phoneNumber the PhoneNumber object where the country_code and country_code_source need |
| * to be populated. Note the country_code is always populated, whereas country_code_source is |
| * only populated when keepCountryCodeSource is true. |
| * @return the country calling code extracted or 0 if none could be extracted |
| */ |
| int maybeExtractCountryCode(String number, PhoneMetadata defaultRegionMetadata, |
| StringBuilder nationalNumber, boolean keepRawInput, |
| PhoneNumber phoneNumber) |
| throws NumberParseException { |
| if (number.length() == 0) { |
| return 0; |
| } |
| StringBuilder fullNumber = new StringBuilder(number); |
| // Set the default prefix to be something that will never match. |
| String possibleCountryIddPrefix = "NonMatch"; |
| if (defaultRegionMetadata != null) { |
| possibleCountryIddPrefix = defaultRegionMetadata.getInternationalPrefix(); |
| } |
| |
| CountryCodeSource countryCodeSource = |
| maybeStripInternationalPrefixAndNormalize(fullNumber, possibleCountryIddPrefix); |
| if (keepRawInput) { |
| phoneNumber.setCountryCodeSource(countryCodeSource); |
| } |
| if (countryCodeSource != CountryCodeSource.FROM_DEFAULT_COUNTRY) { |
| if (fullNumber.length() < MIN_LENGTH_FOR_NSN) { |
| throw new NumberParseException(NumberParseException.ErrorType.TOO_SHORT_AFTER_IDD, |
| "Phone number had an IDD, but after this was not " |
| + "long enough to be a viable phone number."); |
| } |
| int potentialCountryCode = extractCountryCode(fullNumber, nationalNumber); |
| if (potentialCountryCode != 0) { |
| phoneNumber.setCountryCode(potentialCountryCode); |
| return potentialCountryCode; |
| } |
| |
| // If this fails, they must be using a strange country calling code that we don't recognize, |
| // or that doesn't exist. |
| throw new NumberParseException(NumberParseException.ErrorType.INVALID_COUNTRY_CODE, |
| "Country calling code supplied was not recognised."); |
| } else if (defaultRegionMetadata != null) { |
| // Check to see if the number starts with the country calling code for the default region. If |
| // so, we remove the country calling code, and do some checks on the validity of the number |
| // before and after. |
| int defaultCountryCode = defaultRegionMetadata.getCountryCode(); |
| String defaultCountryCodeString = String.valueOf(defaultCountryCode); |
| String normalizedNumber = fullNumber.toString(); |
| if (normalizedNumber.startsWith(defaultCountryCodeString)) { |
| StringBuilder potentialNationalNumber = |
| new StringBuilder(normalizedNumber.substring(defaultCountryCodeString.length())); |
| PhoneNumberDesc generalDesc = defaultRegionMetadata.getGeneralDesc(); |
| Pattern validNumberPattern = |
| regexCache.getPatternForRegex(generalDesc.getNationalNumberPattern()); |
| maybeStripNationalPrefixAndCarrierCode(potentialNationalNumber, defaultRegionMetadata); |
| Pattern possibleNumberPattern = |
| regexCache.getPatternForRegex(generalDesc.getPossibleNumberPattern()); |
| // If the number was not valid before but is valid now, or if it was too long before, we |
| // consider the number with the country calling code stripped to be a better result and |
| // keep that instead. |
| if ((!validNumberPattern.matcher(fullNumber).matches() && |
| validNumberPattern.matcher(potentialNationalNumber).matches()) || |
| testNumberLengthAgainstPattern(possibleNumberPattern, fullNumber.toString()) |
| == ValidationResult.TOO_LONG) { |
| nationalNumber.append(potentialNationalNumber); |
| if (keepRawInput) { |
| phoneNumber.setCountryCodeSource(CountryCodeSource.FROM_NUMBER_WITHOUT_PLUS_SIGN); |
| } |
| phoneNumber.setCountryCode(defaultCountryCode); |
| return defaultCountryCode; |
| } |
| } |
| } |
| // No country calling code present. |
| phoneNumber.setCountryCode(0); |
| return 0; |
| } |
| |
| /** |
| * Strips the IDD from the start of the number if present. Helper function used by |
| * maybeStripInternationalPrefixAndNormalize. |
| */ |
| private boolean parsePrefixAsIdd(Pattern iddPattern, StringBuilder number) { |
| Matcher m = iddPattern.matcher(number); |
| if (m.lookingAt()) { |
| int matchEnd = m.end(); |
| // Only strip this if the first digit after the match is not a 0, since country calling codes |
| // cannot begin with 0. |
| Matcher digitMatcher = CAPTURING_DIGIT_PATTERN.matcher(number.substring(matchEnd)); |
| if (digitMatcher.find()) { |
| String normalizedGroup = normalizeDigitsOnly(digitMatcher.group(1)); |
| if (normalizedGroup.equals("0")) { |
| return false; |
| } |
| } |
| number.delete(0, matchEnd); |
| return true; |
| } |
| return false; |
| } |
| |
| /** |
| * Strips any international prefix (such as +, 00, 011) present in the number provided, normalizes |
| * the resulting number, and indicates if an international prefix was present. |
| * |
| * @param number the non-normalized telephone number that we wish to strip any international |
| * dialing prefix from. |
| * @param possibleIddPrefix the international direct dialing prefix from the region we |
| * think this number may be dialed in |
| * @return the corresponding CountryCodeSource if an international dialing prefix could be |
| * removed from the number, otherwise CountryCodeSource.FROM_DEFAULT_COUNTRY if the number did |
| * not seem to be in international format. |
| */ |
| CountryCodeSource maybeStripInternationalPrefixAndNormalize( |
| StringBuilder number, |
| String possibleIddPrefix) { |
| if (number.length() == 0) { |
| return CountryCodeSource.FROM_DEFAULT_COUNTRY; |
| } |
| // Check to see if the number begins with one or more plus signs. |
| Matcher m = PLUS_CHARS_PATTERN.matcher(number); |
| if (m.lookingAt()) { |
| number.delete(0, m.end()); |
| // Can now normalize the rest of the number since we've consumed the "+" sign at the start. |
| normalize(number); |
| return CountryCodeSource.FROM_NUMBER_WITH_PLUS_SIGN; |
| } |
| // Attempt to parse the first digits as an international prefix. |
| Pattern iddPattern = regexCache.getPatternForRegex(possibleIddPrefix); |
| if (parsePrefixAsIdd(iddPattern, number)) { |
| normalize(number); |
| return CountryCodeSource.FROM_NUMBER_WITH_IDD; |
| } |
| // If still not found, then try and normalize the number and then try again. This shouldn't be |
| // done before, since non-numeric characters (+ and ~) may legally be in the international |
| // prefix. |
| normalize(number); |
| return parsePrefixAsIdd(iddPattern, number) |
| ? CountryCodeSource.FROM_NUMBER_WITH_IDD |
| : CountryCodeSource.FROM_DEFAULT_COUNTRY; |
| } |
| |
| /** |
| * Strips any national prefix (such as 0, 1) present in the number provided. |
| * |
| * @param number the normalized telephone number that we wish to strip any national |
| * dialing prefix from |
| * @param metadata the metadata for the region that we think this number is from |
| * @return the carrier code extracted if it is present, otherwise return an empty string. |
| */ |
| String maybeStripNationalPrefixAndCarrierCode(StringBuilder number, PhoneMetadata metadata) { |
| String carrierCode = ""; |
| int numberLength = number.length(); |
| String possibleNationalPrefix = metadata.getNationalPrefixForParsing(); |
| if (numberLength == 0 || possibleNationalPrefix.length() == 0) { |
| // Early return for numbers of zero length. |
| return carrierCode; |
| } |
| // Attempt to parse the first digits as a national prefix. |
| Matcher prefixMatcher = regexCache.getPatternForRegex(possibleNationalPrefix).matcher(number); |
| if (prefixMatcher.lookingAt()) { |
| Pattern nationalNumberRule = |
| regexCache.getPatternForRegex(metadata.getGeneralDesc().getNationalNumberPattern()); |
| // prefixMatcher.group(numOfGroups) == null implies nothing was captured by the capturing |
| // groups in possibleNationalPrefix; therefore, no transformation is necessary, and we just |
| // remove the national prefix. |
| int numOfGroups = prefixMatcher.groupCount(); |
| String transformRule = metadata.getNationalPrefixTransformRule(); |
| if (transformRule == null || transformRule.length() == 0 || |
| prefixMatcher.group(numOfGroups) == null) { |
| // Check that the resultant number is viable. If not, return. |
| Matcher nationalNumber = nationalNumberRule.matcher(number.substring(prefixMatcher.end())); |
| if (!nationalNumber.matches()) { |
| return carrierCode; |
| } |
| if (numOfGroups > 0 && prefixMatcher.group(numOfGroups) != null) { |
| carrierCode = prefixMatcher.group(1); |
| } |
| number.delete(0, prefixMatcher.end()); |
| } else { |
| // Check that the resultant number is viable. If not, return. Check this by copying the |
| // string buffer and making the transformation on the copy first. |
| StringBuilder transformedNumber = new StringBuilder(number); |
| transformedNumber.replace(0, numberLength, prefixMatcher.replaceFirst(transformRule)); |
| Matcher nationalNumber = nationalNumberRule.matcher(transformedNumber.toString()); |
| if (!nationalNumber.matches()) { |
| return carrierCode; |
| } |
| if (numOfGroups > 1) { |
| carrierCode = prefixMatcher.group(1); |
| } |
| number.replace(0, number.length(), transformedNumber.toString()); |
| } |
| } |
| return carrierCode; |
| } |
| |
| /** |
| * Strips any extension (as in, the part of the number dialled after the call is connected, |
| * usually indicated with extn, ext, x or similar) from the end of the number, and returns it. |
| * |
| * @param number the non-normalized telephone number that we wish to strip the extension from |
| * @return the phone extension |
| */ |
| String maybeStripExtension(StringBuilder number) { |
| Matcher m = EXTN_PATTERN.matcher(number); |
| // If we find a potential extension, and the number preceding this is a viable number, we assume |
| // it is an extension. |
| if (m.find() && isViablePhoneNumber(number.substring(0, m.start()))) { |
| // The numbers are captured into groups in the regular expression. |
| for (int i = 1, length = m.groupCount(); i <= length; i++) { |
| if (m.group(i) != null) { |
| // We go through the capturing groups until we find one that captured some digits. If none |
| // did, then we will return the empty string. |
| String extension = m.group(i); |
| number.delete(m.start(), number.length()); |
| return extension; |
| } |
| } |
| } |
| return ""; |
| } |
| |
| /** |
| * Checks to see that the region code used is valid, or if it is not valid, that the number to |
| * parse starts with a + symbol so that we can attempt to infer the region from the number. |
| * Returns false if it cannot use the region provided and the region cannot be inferred. |
| */ |
| private boolean checkRegionForParsing(String numberToParse, String defaultRegion) { |
| if (!isValidRegionCode(defaultRegion)) { |
| // If the number is null or empty, we can't infer the region. |
| if (numberToParse == null || numberToParse.length() == 0 || |
| !PLUS_CHARS_PATTERN.matcher(numberToParse).lookingAt()) { |
| return false; |
| } |
| } |
| return true; |
| } |
| |
| /** |
| * Parses a string and returns it in proto buffer format. This method will throw a |
| * {@link com.google.i18n.phonenumbers.NumberParseException} if the number is not considered to be |
| * a possible number. Note that validation of whether the number is actually a valid number for a |
| * particular region is not performed. This can be done separately with {@link #isValidNumber}. |
| * |
| * @param numberToParse number that we are attempting to parse. This can contain formatting |
| * such as +, ( and -, as well as a phone number extension. |
| * @param defaultRegion region that we are expecting the number to be from. This is only used |
| * if the number being parsed is not written in international format. |
| * The country_code for the number in this case would be stored as that |
| * of the default region supplied. If the number is guaranteed to |
| * start with a '+' followed by the country calling code, then |
| * "ZZ" or null can be supplied. |
| * @return a phone number proto buffer filled with the parsed number |
| * @throws NumberParseException if the string is not considered to be a viable phone number or if |
| * no default region was supplied and the number is not in |
| * international format (does not start with +) |
| */ |
| public PhoneNumber parse(String numberToParse, String defaultRegion) |
| throws NumberParseException { |
| PhoneNumber phoneNumber = new PhoneNumber(); |
| parse(numberToParse, defaultRegion, phoneNumber); |
| return phoneNumber; |
| } |
| |
| /** |
| * Same as {@link #parse(String, String)}, but accepts mutable PhoneNumber as a parameter to |
| * decrease object creation when invoked many times. |
| */ |
| public void parse(String numberToParse, String defaultRegion, PhoneNumber phoneNumber) |
| throws NumberParseException { |
| parseHelper(numberToParse, defaultRegion, false, true, phoneNumber); |
| } |
| |
| /** |
| * Parses a string and returns it in proto buffer format. This method differs from {@link #parse} |
| * in that it always populates the raw_input field of the protocol buffer with numberToParse as |
| * well as the country_code_source field. |
| * |
| * @param numberToParse number that we are attempting to parse. This can contain formatting |
| * such as +, ( and -, as well as a phone number extension. |
| * @param defaultRegion region that we are expecting the number to be from. This is only used |
| * if the number being parsed is not written in international format. |
| * The country calling code for the number in this case would be stored |
| * as that of the default region supplied. |
| * @return a phone number proto buffer filled with the parsed number |
| * @throws NumberParseException if the string is not considered to be a viable phone number or if |
| * no default region was supplied |
| */ |
| public PhoneNumber parseAndKeepRawInput(String numberToParse, String defaultRegion) |
| throws NumberParseException { |
| PhoneNumber phoneNumber = new PhoneNumber(); |
| parseAndKeepRawInput(numberToParse, defaultRegion, phoneNumber); |
| return phoneNumber; |
| } |
| |
| /** |
| * Same as{@link #parseAndKeepRawInput(String, String)}, but accepts a mutable PhoneNumber as |
| * a parameter to decrease object creation when invoked many times. |
| */ |
| public void parseAndKeepRawInput(String numberToParse, String defaultRegion, |
| PhoneNumber phoneNumber) |
| throws NumberParseException { |
| parseHelper(numberToParse, defaultRegion, true, true, phoneNumber); |
| } |
| |
| /** |
| * Returns an iterable over all {@link PhoneNumberMatch PhoneNumberMatches} in {@code text}. This |
| * is a shortcut for {@link #findNumbers(CharSequence, String, Leniency, long) |
| * getMatcher(text, defaultRegion, Leniency.VALID, Long.MAX_VALUE)}. |
| * |
| * @param text the text to search for phone numbers, null for no text |
| * @param defaultRegion region that we are expecting the number to be from. This is only used |
| * if the number being parsed is not written in international format. The |
| * country_code for the number in this case would be stored as that of |
| * the default region supplied. May be null if only international |
| * numbers are expected. |
| */ |
| public Iterable<PhoneNumberMatch> findNumbers(CharSequence text, String defaultRegion) { |
| return findNumbers(text, defaultRegion, Leniency.VALID, Long.MAX_VALUE); |
| } |
| |
| /** |
| * Returns an iterable over all {@link PhoneNumberMatch PhoneNumberMatches} in {@code text}. |
| * |
| * @param text the text to search for phone numbers, null for no text |
| * @param defaultRegion region that we are expecting the number to be from. This is only used |
| * if the number being parsed is not written in international format. The |
| * country_code for the number in this case would be stored as that of |
| * the default region supplied. May be null if only international |
| * numbers are expected. |
| * @param leniency the leniency to use when evaluating candidate phone numbers |
| * @param maxTries the maximum number of invalid numbers to try before giving up on the |
| * text. This is to cover degenerate cases where the text has a lot of |
| * false positives in it. Must be {@code >= 0}. |
| */ |
| public Iterable<PhoneNumberMatch> findNumbers( |
| final CharSequence text, final String defaultRegion, final Leniency leniency, |
| final long maxTries) { |
| |
| return new Iterable<PhoneNumberMatch>() { |
| public Iterator<PhoneNumberMatch> iterator() { |
| return new PhoneNumberMatcher( |
| PhoneNumberUtil.this, text, defaultRegion, leniency, maxTries); |
| } |
| }; |
| } |
| |
| /** |
| * Parses a string and fills up the phoneNumber. This method is the same as the public |
| * parse() method, with the exception that it allows the default region to be null, for use by |
| * isNumberMatch(). checkRegion should be set to false if it is permitted for the default region |
| * to be null or unknown ("ZZ"). |
| */ |
| private void parseHelper(String numberToParse, String defaultRegion, boolean keepRawInput, |
| boolean checkRegion, PhoneNumber phoneNumber) |
| throws NumberParseException { |
| if (numberToParse == null) { |
| throw new NumberParseException(NumberParseException.ErrorType.NOT_A_NUMBER, |
| "The phone number supplied was null."); |
| } |
| // Extract a possible number from the string passed in (this strips leading characters that |
| // could not be the start of a phone number.) |
| String number = extractPossibleNumber(numberToParse); |
| if (!isViablePhoneNumber(number)) { |
| throw new NumberParseException(NumberParseException.ErrorType.NOT_A_NUMBER, |
| "The string supplied did not seem to be a phone number."); |
| } |
| |
| // Check the region supplied is valid, or that the extracted number starts with some sort of + |
| // sign so the number's region can be determined. |
| if (checkRegion && !checkRegionForParsing(number, defaultRegion)) { |
| throw new NumberParseException(NumberParseException.ErrorType.INVALID_COUNTRY_CODE, |
| "Missing or invalid default region."); |
| } |
| |
| if (keepRawInput) { |
| phoneNumber.setRawInput(numberToParse); |
| } |
| StringBuilder nationalNumber = new StringBuilder(number); |
| // Attempt to parse extension first, since it doesn't require region-specific data and we want |
| // to have the non-normalised number here. |
| String extension = maybeStripExtension(nationalNumber); |
| if (extension.length() > 0) { |
| phoneNumber.setExtension(extension); |
| } |
| |
| PhoneMetadata regionMetadata = getMetadataForRegion(defaultRegion); |
| // Check to see if the number is given in international format so we know whether this number is |
| // from the default region or not. |
| StringBuilder normalizedNationalNumber = new StringBuilder(); |
| int countryCode = maybeExtractCountryCode(nationalNumber.toString(), regionMetadata, |
| normalizedNationalNumber, keepRawInput, phoneNumber); |
| if (countryCode != 0) { |
| String phoneNumberRegion = getRegionCodeForCountryCode(countryCode); |
| if (!phoneNumberRegion.equals(defaultRegion)) { |
| regionMetadata = getMetadataForRegion(phoneNumberRegion); |
| } |
| } else { |
| // If no extracted country calling code, use the region supplied instead. The national number |
| // is just the normalized version of the number we were given to parse. |
| normalize(nationalNumber); |
| normalizedNationalNumber.append(nationalNumber); |
| if (defaultRegion != null) { |
| countryCode = regionMetadata.getCountryCode(); |
| phoneNumber.setCountryCode(countryCode); |
| } else if (keepRawInput) { |
| phoneNumber.clearCountryCodeSource(); |
| } |
| } |
| if (normalizedNationalNumber.length() < MIN_LENGTH_FOR_NSN) { |
| throw new NumberParseException(NumberParseException.ErrorType.TOO_SHORT_NSN, |
| "The string supplied is too short to be a phone number."); |
| } |
| if (regionMetadata != null) { |
| String carrierCode = |
| maybeStripNationalPrefixAndCarrierCode(normalizedNationalNumber, regionMetadata); |
| if (keepRawInput) { |
| phoneNumber.setPreferredDomesticCarrierCode(carrierCode); |
| } |
| } |
| int lengthOfNationalNumber = normalizedNationalNumber.length(); |
| if (lengthOfNationalNumber < MIN_LENGTH_FOR_NSN) { |
| throw new NumberParseException(NumberParseException.ErrorType.TOO_SHORT_NSN, |
| "The string supplied is too short to be a phone number."); |
| } |
| if (lengthOfNationalNumber > MAX_LENGTH_FOR_NSN) { |
| throw new NumberParseException(NumberParseException.ErrorType.TOO_LONG, |
| "The string supplied is too long to be a phone number."); |
| } |
| if (normalizedNationalNumber.charAt(0) == '0' && |
| regionMetadata != null && |
| regionMetadata.isLeadingZeroPossible()) { |
| phoneNumber.setItalianLeadingZero(true); |
| } |
| phoneNumber.setNationalNumber(Long.parseLong(normalizedNationalNumber.toString())); |
| } |
| |
| /** |
| * Takes two phone numbers and compares them for equality. |
| * |
| * <p>Returns EXACT_MATCH if the country_code, NSN, presence of a leading zero for Italian numbers |
| * and any extension present are the same. |
| * Returns NSN_MATCH if either or both has no region specified, and the NSNs and extensions are |
| * the same. |
| * Returns SHORT_NSN_MATCH if either or both has no region specified, or the region specified is |
| * the same, and one NSN could be a shorter version of the other number. This includes the case |
| * where one has an extension specified, and the other does not. |
| * Returns NO_MATCH otherwise. |
| * For example, the numbers +1 345 657 1234 and 657 1234 are a SHORT_NSN_MATCH. |
| * The numbers +1 345 657 1234 and 345 657 are a NO_MATCH. |
| * |
| * @param firstNumberIn first number to compare |
| * @param secondNumberIn second number to compare |
| * |
| * @return NO_MATCH, SHORT_NSN_MATCH, NSN_MATCH or EXACT_MATCH depending on the level of equality |
| * of the two numbers, described in the method definition. |
| */ |
| public MatchType isNumberMatch(PhoneNumber firstNumberIn, PhoneNumber secondNumberIn) { |
| // Make copies of the phone number so that the numbers passed in are not edited. |
| PhoneNumber firstNumber = new PhoneNumber(); |
| firstNumber.mergeFrom(firstNumberIn); |
| PhoneNumber secondNumber = new PhoneNumber(); |
| secondNumber.mergeFrom(secondNumberIn); |
| // First clear raw_input, country_code_source and preferred_domestic_carrier_code fields and any |
| // empty-string extensions so that we can use the proto-buffer equality method. |
| firstNumber.clearRawInput(); |
| firstNumber.clearCountryCodeSource(); |
| firstNumber.clearPreferredDomesticCarrierCode(); |
| secondNumber.clearRawInput(); |
| secondNumber.clearCountryCodeSource(); |
| secondNumber.clearPreferredDomesticCarrierCode(); |
| if (firstNumber.hasExtension() && |
| firstNumber.getExtension().length() == 0) { |
| firstNumber.clearExtension(); |
| } |
| if (secondNumber.hasExtension() && |
| secondNumber.getExtension().length() == 0) { |
| secondNumber.clearExtension(); |
| } |
| // Early exit if both had extensions and these are different. |
| if (firstNumber.hasExtension() && secondNumber.hasExtension() && |
| !firstNumber.getExtension().equals(secondNumber.getExtension())) { |
| return MatchType.NO_MATCH; |
| } |
| int firstNumberCountryCode = firstNumber.getCountryCode(); |
| int secondNumberCountryCode = secondNumber.getCountryCode(); |
| // Both had country_code specified. |
| if (firstNumberCountryCode != 0 && secondNumberCountryCode != 0) { |
| if (firstNumber.exactlySameAs(secondNumber)) { |
| return MatchType.EXACT_MATCH; |
| } else if (firstNumberCountryCode == secondNumberCountryCode && |
| isNationalNumberSuffixOfTheOther(firstNumber, secondNumber)) { |
| // A SHORT_NSN_MATCH occurs if there is a difference because of the presence or absence of |
| // an 'Italian leading zero', the presence or absence of an extension, or one NSN being a |
| // shorter variant of the other. |
| return MatchType.SHORT_NSN_MATCH; |
| } |
| // This is not a match. |
| return MatchType.NO_MATCH; |
| } |
| // Checks cases where one or both country_code fields were not specified. To make equality |
| // checks easier, we first set the country_code fields to be equal. |
| firstNumber.setCountryCode(secondNumberCountryCode); |
| // If all else was the same, then this is an NSN_MATCH. |
| if (firstNumber.exactlySameAs(secondNumber)) { |
| return MatchType.NSN_MATCH; |
| } |
| if (isNationalNumberSuffixOfTheOther(firstNumber, secondNumber)) { |
| return MatchType.SHORT_NSN_MATCH; |
| } |
| return MatchType.NO_MATCH; |
| } |
| |
| // Returns true when one national number is the suffix of the other or both are the same. |
| private boolean isNationalNumberSuffixOfTheOther(PhoneNumber firstNumber, |
| PhoneNumber secondNumber) { |
| String firstNumberNationalNumber = String.valueOf(firstNumber.getNationalNumber()); |
| String secondNumberNationalNumber = String.valueOf(secondNumber.getNationalNumber()); |
| // Note that endsWith returns true if the numbers are equal. |
| return firstNumberNationalNumber.endsWith(secondNumberNationalNumber) || |
| secondNumberNationalNumber.endsWith(firstNumberNationalNumber); |
| } |
| |
| /** |
| * Takes two phone numbers as strings and compares them for equality. This is a convenience |
| * wrapper for {@link #isNumberMatch(PhoneNumber, PhoneNumber)}. No default region is known. |
| * |
| * @param firstNumber first number to compare. Can contain formatting, and can have country |
| * calling code specified with + at the start. |
| * @param secondNumber second number to compare. Can contain formatting, and can have country |
| * calling code specified with + at the start. |
| * @return NOT_A_NUMBER, NO_MATCH, SHORT_NSN_MATCH, NSN_MATCH, EXACT_MATCH. See |
| * isNumberMatch(PhoneNumber firstNumber, PhoneNumber secondNumber) for more details. |
| */ |
| public MatchType isNumberMatch(String firstNumber, String secondNumber) { |
| try { |
| PhoneNumber firstNumberAsProto = parse(firstNumber, UNKNOWN_REGION); |
| return isNumberMatch(firstNumberAsProto, secondNumber); |
| } catch (NumberParseException e) { |
| if (e.getErrorType() == NumberParseException.ErrorType.INVALID_COUNTRY_CODE) { |
| try { |
| PhoneNumber secondNumberAsProto = parse(secondNumber, UNKNOWN_REGION); |
| return isNumberMatch(secondNumberAsProto, firstNumber); |
| } catch (NumberParseException e2) { |
| if (e2.getErrorType() == NumberParseException.ErrorType.INVALID_COUNTRY_CODE) { |
| try { |
| PhoneNumber firstNumberProto = new PhoneNumber(); |
| PhoneNumber secondNumberProto = new PhoneNumber(); |
| parseHelper(firstNumber, null, false, false, firstNumberProto); |
| parseHelper(secondNumber, null, false, false, secondNumberProto); |
| return isNumberMatch(firstNumberProto, secondNumberProto); |
| } catch (NumberParseException e3) { |
| // Fall through and return MatchType.NOT_A_NUMBER. |
| } |
| } |
| } |
| } |
| } |
| // One or more of the phone numbers we are trying to match is not a viable phone number. |
| return MatchType.NOT_A_NUMBER; |
| } |
| |
| /** |
| * Takes two phone numbers and compares them for equality. This is a convenience wrapper for |
| * {@link #isNumberMatch(PhoneNumber, PhoneNumber)}. No default region is known. |
| * |
| * @param firstNumber first number to compare in proto buffer format. |
| * @param secondNumber second number to compare. Can contain formatting, and can have country |
| * calling code specified with + at the start. |
| * @return NOT_A_NUMBER, NO_MATCH, SHORT_NSN_MATCH, NSN_MATCH, EXACT_MATCH. See |
| * isNumberMatch(PhoneNumber firstNumber, PhoneNumber secondNumber) for more details. |
| */ |
| public MatchType isNumberMatch(PhoneNumber firstNumber, String secondNumber) { |
| // First see if the second number has an implicit country calling code, by attempting to parse |
| // it. |
| try { |
| PhoneNumber secondNumberAsProto = parse(secondNumber, UNKNOWN_REGION); |
| return isNumberMatch(firstNumber, secondNumberAsProto); |
| } catch (NumberParseException e) { |
| if (e.getErrorType() == NumberParseException.ErrorType.INVALID_COUNTRY_CODE) { |
| // The second number has no country calling code. EXACT_MATCH is no longer possible. |
| // We parse it as if the region was the same as that for the first number, and if |
| // EXACT_MATCH is returned, we replace this with NSN_MATCH. |
| String firstNumberRegion = getRegionCodeForCountryCode(firstNumber.getCountryCode()); |
| try { |
| if (!firstNumberRegion.equals(UNKNOWN_REGION)) { |
| PhoneNumber secondNumberWithFirstNumberRegion = parse(secondNumber, firstNumberRegion); |
| MatchType match = isNumberMatch(firstNumber, secondNumberWithFirstNumberRegion); |
| if (match == MatchType.EXACT_MATCH) { |
| return MatchType.NSN_MATCH; |
| } |
| return match; |
| } else { |
| // If the first number didn't have a valid country calling code, then we parse the |
| // second number without one as well. |
| PhoneNumber secondNumberProto = new PhoneNumber(); |
| parseHelper(secondNumber, null, false, false, secondNumberProto); |
| return isNumberMatch(firstNumber, secondNumberProto); |
| } |
| } catch (NumberParseException e2) { |
| // Fall-through to return NOT_A_NUMBER. |
| } |
| } |
| } |
| // One or more of the phone numbers we are trying to match is not a viable phone number. |
| return MatchType.NOT_A_NUMBER; |
| } |
| |
| /** |
| * Returns true if the number can only be dialled from within the region. If unknown, or the |
| * number can be dialled from outside the region as well, returns false. Does not check the |
| * number is a valid number. |
| * TODO: Make this method public when we have enough metadata to make it worthwhile. Currently |
| * visible for testing purposes only. |
| * |
| * @param number the phone-number for which we want to know whether it is only diallable from |
| * within the region |
| */ |
| boolean canBeInternationallyDialled(PhoneNumber number) { |
| String regionCode = getRegionCodeForNumber(number); |
| String nationalSignificantNumber = getNationalSignificantNumber(number); |
| if (!hasValidRegionCode(regionCode, number.getCountryCode(), nationalSignificantNumber)) { |
| return true; |
| } |
| PhoneMetadata metadata = getMetadataForRegion(regionCode); |
| return !isNumberMatchingDesc(nationalSignificantNumber, metadata.getNoInternationalDialling()); |
| } |
| } |