All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.google.i18n.phonenumbers.PhoneNumberUtil Maven / Gradle / Ivy

/*
 * Copyright (C) 2009 The Libphonenumber Authors
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package com.google.i18n.phonenumbers;

import com.google.i18n.phonenumbers.Phonemetadata.NumberFormat;
import com.google.i18n.phonenumbers.Phonemetadata.PhoneMetadata;
import com.google.i18n.phonenumbers.Phonemetadata.PhoneNumberDesc;
import com.google.i18n.phonenumbers.Phonenumber.PhoneNumber;
import com.google.i18n.phonenumbers.Phonenumber.PhoneNumber.CountryCodeSource;
import com.google.i18n.phonenumbers.internal.MatcherApi;
import com.google.i18n.phonenumbers.internal.RegexBasedMatcher;
import com.google.i18n.phonenumbers.internal.RegexCache;

import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collections;
import java.util.EnumSet;
import java.util.HashMap;
import java.util.HashSet;
import java.util.Iterator;
import java.util.List;
import java.util.Map;
import java.util.Set;
import java.util.TreeSet;
import java.util.logging.Level;
import java.util.logging.Logger;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

/**
 * Utility for international phone numbers. Functionality includes formatting, parsing and
 * validation.
 *
 * 

If you use this library, and want to be notified about important changes, please sign up to * our mailing list. * * NOTE: A lot of methods in this class require Region Code strings. These must be provided using * CLDR two-letter region-code format. These should be in upper-case. The list of the codes * can be found here: * http://www.unicode.org/cldr/charts/30/supplemental/territory_information.html */ public class PhoneNumberUtil { private static final Logger logger = Logger.getLogger(PhoneNumberUtil.class.getName()); /** Flags to use when compiling regular expressions for phone numbers. */ static final int REGEX_FLAGS = Pattern.UNICODE_CASE | Pattern.CASE_INSENSITIVE; // The minimum and maximum length of the national significant number. private static final int MIN_LENGTH_FOR_NSN = 2; // The ITU says the maximum length should be 15, but we have found longer numbers in Germany. static final int MAX_LENGTH_FOR_NSN = 17; // The maximum length of the country calling code. static final int MAX_LENGTH_COUNTRY_CODE = 3; // We don't allow input strings for parsing to be longer than 250 chars. This prevents malicious // input from overflowing the regular-expression engine. private static final int MAX_INPUT_STRING_LENGTH = 250; // Region-code for the unknown region. private static final String UNKNOWN_REGION = "ZZ"; private static final int NANPA_COUNTRY_CODE = 1; // The prefix that needs to be inserted in front of a Colombian landline number when dialed from // a mobile phone in Colombia. private static final String COLOMBIA_MOBILE_TO_FIXED_LINE_PREFIX = "3"; // Map of country calling codes that use a mobile token before the area code. One example of when // this is relevant is when determining the length of the national destination code, which should // be the length of the area code plus the length of the mobile token. private static final Map MOBILE_TOKEN_MAPPINGS; // Set of country codes that have geographically assigned mobile numbers (see GEO_MOBILE_COUNTRIES // below) which are not based on *area codes*. For example, in China mobile numbers start with a // carrier indicator, and beyond that are geographically assigned: this carrier indicator is not // considered to be an area code. private static final Set GEO_MOBILE_COUNTRIES_WITHOUT_MOBILE_AREA_CODES; // Set of country calling codes that have geographically assigned mobile numbers. This may not be // complete; we add calling codes case by case, as we find geographical mobile numbers or hear // from user reports. Note that countries like the US, where we can't distinguish between // fixed-line or mobile numbers, are not listed here, since we consider FIXED_LINE_OR_MOBILE to be // a possibly geographically-related type anyway (like FIXED_LINE). private static final Set GEO_MOBILE_COUNTRIES; // The PLUS_SIGN signifies the international prefix. static final char PLUS_SIGN = '+'; private static final char STAR_SIGN = '*'; private static final String RFC3966_EXTN_PREFIX = ";ext="; private static final String RFC3966_PREFIX = "tel:"; private static final String RFC3966_PHONE_CONTEXT = ";phone-context="; private static final String RFC3966_ISDN_SUBADDRESS = ";isub="; // A map that contains characters that are essential when dialling. That means any of the // characters in this map must not be removed from a number when dialling, otherwise the call // will not reach the intended destination. private static final Map DIALLABLE_CHAR_MAPPINGS; // Only upper-case variants of alpha characters are stored. private static final Map ALPHA_MAPPINGS; // For performance reasons, amalgamate both into one map. private static final Map ALPHA_PHONE_MAPPINGS; // Separate map of all symbols that we wish to retain when formatting alpha numbers. This // includes digits, ASCII letters and number grouping symbols such as "-" and " ". private static final Map ALL_PLUS_NUMBER_GROUPING_SYMBOLS; static { HashMap mobileTokenMap = new HashMap(); mobileTokenMap.put(54, "9"); MOBILE_TOKEN_MAPPINGS = Collections.unmodifiableMap(mobileTokenMap); HashSet geoMobileCountriesWithoutMobileAreaCodes = new HashSet(); geoMobileCountriesWithoutMobileAreaCodes.add(86); // China GEO_MOBILE_COUNTRIES_WITHOUT_MOBILE_AREA_CODES = Collections.unmodifiableSet(geoMobileCountriesWithoutMobileAreaCodes); HashSet geoMobileCountries = new HashSet(); geoMobileCountries.add(52); // Mexico geoMobileCountries.add(54); // Argentina geoMobileCountries.add(55); // Brazil geoMobileCountries.add(62); // Indonesia: some prefixes only (fixed CMDA wireless) geoMobileCountries.addAll(geoMobileCountriesWithoutMobileAreaCodes); GEO_MOBILE_COUNTRIES = Collections.unmodifiableSet(geoMobileCountries); // Simple ASCII digits map used to populate ALPHA_PHONE_MAPPINGS and // ALL_PLUS_NUMBER_GROUPING_SYMBOLS. HashMap asciiDigitMappings = new HashMap(); asciiDigitMappings.put('0', '0'); asciiDigitMappings.put('1', '1'); asciiDigitMappings.put('2', '2'); asciiDigitMappings.put('3', '3'); asciiDigitMappings.put('4', '4'); asciiDigitMappings.put('5', '5'); asciiDigitMappings.put('6', '6'); asciiDigitMappings.put('7', '7'); asciiDigitMappings.put('8', '8'); asciiDigitMappings.put('9', '9'); HashMap alphaMap = new HashMap(40); alphaMap.put('A', '2'); alphaMap.put('B', '2'); alphaMap.put('C', '2'); alphaMap.put('D', '3'); alphaMap.put('E', '3'); alphaMap.put('F', '3'); alphaMap.put('G', '4'); alphaMap.put('H', '4'); alphaMap.put('I', '4'); alphaMap.put('J', '5'); alphaMap.put('K', '5'); alphaMap.put('L', '5'); alphaMap.put('M', '6'); alphaMap.put('N', '6'); alphaMap.put('O', '6'); alphaMap.put('P', '7'); alphaMap.put('Q', '7'); alphaMap.put('R', '7'); alphaMap.put('S', '7'); alphaMap.put('T', '8'); alphaMap.put('U', '8'); alphaMap.put('V', '8'); alphaMap.put('W', '9'); alphaMap.put('X', '9'); alphaMap.put('Y', '9'); alphaMap.put('Z', '9'); ALPHA_MAPPINGS = Collections.unmodifiableMap(alphaMap); HashMap combinedMap = new HashMap(100); combinedMap.putAll(ALPHA_MAPPINGS); combinedMap.putAll(asciiDigitMappings); ALPHA_PHONE_MAPPINGS = Collections.unmodifiableMap(combinedMap); HashMap diallableCharMap = new HashMap(); diallableCharMap.putAll(asciiDigitMappings); diallableCharMap.put(PLUS_SIGN, PLUS_SIGN); diallableCharMap.put('*', '*'); diallableCharMap.put('#', '#'); DIALLABLE_CHAR_MAPPINGS = Collections.unmodifiableMap(diallableCharMap); HashMap allPlusNumberGroupings = new HashMap(); // Put (lower letter -> upper letter) and (upper letter -> upper letter) mappings. for (char c : ALPHA_MAPPINGS.keySet()) { allPlusNumberGroupings.put(Character.toLowerCase(c), c); allPlusNumberGroupings.put(c, c); } allPlusNumberGroupings.putAll(asciiDigitMappings); // Put grouping symbols. allPlusNumberGroupings.put('-', '-'); allPlusNumberGroupings.put('\uFF0D', '-'); allPlusNumberGroupings.put('\u2010', '-'); allPlusNumberGroupings.put('\u2011', '-'); allPlusNumberGroupings.put('\u2012', '-'); allPlusNumberGroupings.put('\u2013', '-'); allPlusNumberGroupings.put('\u2014', '-'); allPlusNumberGroupings.put('\u2015', '-'); allPlusNumberGroupings.put('\u2212', '-'); allPlusNumberGroupings.put('/', '/'); allPlusNumberGroupings.put('\uFF0F', '/'); allPlusNumberGroupings.put(' ', ' '); allPlusNumberGroupings.put('\u3000', ' '); allPlusNumberGroupings.put('\u2060', ' '); allPlusNumberGroupings.put('.', '.'); allPlusNumberGroupings.put('\uFF0E', '.'); ALL_PLUS_NUMBER_GROUPING_SYMBOLS = Collections.unmodifiableMap(allPlusNumberGroupings); } // Pattern that makes it easy to distinguish whether a region has a single international dialing // prefix or not. If a region has a single international prefix (e.g. 011 in USA), it will be // represented as a string that contains a sequence of ASCII digits, and possibly a tilde, which // signals waiting for the tone. If there are multiple available international prefixes in a // region, they will be represented as a regex string that always contains one or more characters // that are not ASCII digits or a tilde. private static final Pattern SINGLE_INTERNATIONAL_PREFIX = Pattern.compile("[\\d]+(?:[~\u2053\u223C\uFF5E][\\d]+)?"); // Regular expression of acceptable punctuation found in phone numbers, used to find numbers in // text and to decide what is a viable phone number. This excludes diallable characters. // This consists of dash characters, white space characters, full stops, slashes, // square brackets, parentheses and tildes. It also includes the letter 'x' as that is found as a // placeholder for carrier information in some phone numbers. Full-width variants are also // present. static final String VALID_PUNCTUATION = "-x\u2010-\u2015\u2212\u30FC\uFF0D-\uFF0F " + "\u00A0\u00AD\u200B\u2060\u3000()\uFF08\uFF09\uFF3B\uFF3D.\\[\\]/~\u2053\u223C\uFF5E"; private static final String DIGITS = "\\p{Nd}"; // We accept alpha characters in phone numbers, ASCII only, upper and lower case. private static final String VALID_ALPHA = Arrays.toString(ALPHA_MAPPINGS.keySet().toArray()).replaceAll("[, \\[\\]]", "") + Arrays.toString(ALPHA_MAPPINGS.keySet().toArray()) .toLowerCase().replaceAll("[, \\[\\]]", ""); static final String PLUS_CHARS = "+\uFF0B"; static final Pattern PLUS_CHARS_PATTERN = Pattern.compile("[" + PLUS_CHARS + "]+"); private static final Pattern SEPARATOR_PATTERN = Pattern.compile("[" + VALID_PUNCTUATION + "]+"); private static final Pattern CAPTURING_DIGIT_PATTERN = Pattern.compile("(" + DIGITS + ")"); // Regular expression of acceptable characters that may start a phone number for the purposes of // parsing. This allows us to strip away meaningless prefixes to phone numbers that may be // mistakenly given to us. This consists of digits, the plus symbol and arabic-indic digits. This // does not contain alpha characters, although they may be used later in the number. It also does // not include other punctuation, as this will be stripped later during parsing and is of no // information value when parsing a number. private static final String VALID_START_CHAR = "[" + PLUS_CHARS + DIGITS + "]"; private static final Pattern VALID_START_CHAR_PATTERN = Pattern.compile(VALID_START_CHAR); // Regular expression of characters typically used to start a second phone number for the purposes // of parsing. This allows us to strip off parts of the number that are actually the start of // another number, such as for: (530) 583-6985 x302/x2303 -> the second extension here makes this // actually two phone numbers, (530) 583-6985 x302 and (530) 583-6985 x2303. We remove the second // extension so that the first number is parsed correctly. private static final String SECOND_NUMBER_START = "[\\\\/] *x"; static final Pattern SECOND_NUMBER_START_PATTERN = Pattern.compile(SECOND_NUMBER_START); // Regular expression of trailing characters that we want to remove. We remove all characters that // are not alpha or numerical characters. The hash character is retained here, as it may signify // the previous block was an extension. private static final String UNWANTED_END_CHARS = "[[\\P{N}&&\\P{L}]&&[^#]]+$"; static final Pattern UNWANTED_END_CHAR_PATTERN = Pattern.compile(UNWANTED_END_CHARS); // We use this pattern to check if the phone number has at least three letters in it - if so, then // we treat it as a number where some phone-number digits are represented by letters. private static final Pattern VALID_ALPHA_PHONE_PATTERN = Pattern.compile("(?:.*?[A-Za-z]){3}.*"); // Regular expression of viable phone numbers. This is location independent. Checks we have at // least three leading digits, and only valid punctuation, alpha characters and // digits in the phone number. Does not include extension data. // The symbol 'x' is allowed here as valid punctuation since it is often used as a placeholder for // carrier codes, for example in Brazilian phone numbers. We also allow multiple "+" characters at // the start. // Corresponds to the following: // [digits]{minLengthNsn}| // plus_sign*(([punctuation]|[star])*[digits]){3,}([punctuation]|[star]|[digits]|[alpha])* // // The first reg-ex is to allow short numbers (two digits long) to be parsed if they are entered // as "15" etc, but only if there is no punctuation in them. The second expression restricts the // number of digits to three or more, but then allows them to be in international form, and to // have alpha-characters and punctuation. // // Note VALID_PUNCTUATION starts with a -, so must be the first in the range. private static final String VALID_PHONE_NUMBER = DIGITS + "{" + MIN_LENGTH_FOR_NSN + "}" + "|" + "[" + PLUS_CHARS + "]*+(?:[" + VALID_PUNCTUATION + STAR_SIGN + "]*" + DIGITS + "){3,}[" + VALID_PUNCTUATION + STAR_SIGN + VALID_ALPHA + DIGITS + "]*"; // Default extension prefix to use when formatting. This will be put in front of any extension // component of the number, after the main national number is formatted. For example, if you wish // the default extension formatting to be " extn: 3456", then you should specify " extn: " here // as the default extension prefix. This can be overridden by region-specific preferences. private static final String DEFAULT_EXTN_PREFIX = " ext. "; // Regexp of all possible ways to write extensions, for use when parsing. This will be run as a // case-insensitive regexp match. Wide character versions are also provided after each ASCII // version. private static final String EXTN_PATTERNS_FOR_PARSING = createExtnPattern(true); static final String EXTN_PATTERNS_FOR_MATCHING = createExtnPattern(false); /** * Helper method for constructing regular expressions for parsing. Creates an expression that * captures up to maxLength digits. */ private static String extnDigits(int maxLength) { return "(" + DIGITS + "{1," + maxLength + "})"; } /** * Helper initialiser method to create the regular-expression pattern to match extensions. * Note that there are currently six capturing groups for the extension itself. If this number is * changed, MaybeStripExtension needs to be updated. */ private static String createExtnPattern(boolean forParsing) { // We cap the maximum length of an extension based on the ambiguity of the way the extension is // prefixed. As per ITU, the officially allowed length for extensions is actually 40, but we // don't support this since we haven't seen real examples and this introduces many false // interpretations as the extension labels are not standardized. int extLimitAfterExplicitLabel = 20; int extLimitAfterLikelyLabel = 15; int extLimitAfterAmbiguousChar = 9; int extLimitWhenNotSure = 6; String possibleSeparatorsBetweenNumberAndExtLabel = "[ \u00A0\\t,]*"; // Optional full stop (.) or colon, followed by zero or more spaces/tabs/commas. String possibleCharsAfterExtLabel = "[:\\.\uFF0E]?[ \u00A0\\t,-]*"; String optionalExtnSuffix = "#?"; // Here the extension is called out in more explicit way, i.e mentioning it obvious patterns // like "ext.". Canonical-equivalence doesn't seem to be an option with Android java, so we // allow two options for representing the accented o - the character itself, and one in the // unicode decomposed form with the combining acute accent. String explicitExtLabels = "(?:e?xt(?:ensi(?:o\u0301?|\u00F3))?n?|\uFF45?\uFF58\uFF54\uFF4E?|\u0434\u043E\u0431|anexo)"; // One-character symbols that can be used to indicate an extension, and less commonly used // or more ambiguous extension labels. String ambiguousExtLabels = "(?:[x\uFF58#\uFF03~\uFF5E]|int|\uFF49\uFF4E\uFF54)"; // When extension is not separated clearly. String ambiguousSeparator = "[- ]+"; String rfcExtn = RFC3966_EXTN_PREFIX + extnDigits(extLimitAfterExplicitLabel); String explicitExtn = possibleSeparatorsBetweenNumberAndExtLabel + explicitExtLabels + possibleCharsAfterExtLabel + extnDigits(extLimitAfterExplicitLabel) + optionalExtnSuffix; String ambiguousExtn = possibleSeparatorsBetweenNumberAndExtLabel + ambiguousExtLabels + possibleCharsAfterExtLabel + extnDigits(extLimitAfterAmbiguousChar) + optionalExtnSuffix; String americanStyleExtnWithSuffix = ambiguousSeparator + extnDigits(extLimitWhenNotSure) + "#"; // The first regular expression covers RFC 3966 format, where the extension is added using // ";ext=". The second more generic where extension is mentioned with explicit labels like // "ext:". In both the above cases we allow more numbers in extension than any other extension // labels. The third one captures when single character extension labels or less commonly used // labels are used. In such cases we capture fewer extension digits in order to reduce the // chance of falsely interpreting two numbers beside each other as a number + extension. The // fourth one covers the special case of American numbers where the extension is written with a // hash at the end, such as "- 503#". String extensionPattern = rfcExtn + "|" + explicitExtn + "|" + ambiguousExtn + "|" + americanStyleExtnWithSuffix; // Additional pattern that is supported when parsing extensions, not when matching. if (forParsing) { // This is same as possibleSeparatorsBetweenNumberAndExtLabel, but not matching comma as // extension label may have it. String possibleSeparatorsNumberExtLabelNoComma = "[ \u00A0\\t]*"; // ",," is commonly used for auto dialling the extension when connected. First comma is matched // through possibleSeparatorsBetweenNumberAndExtLabel, so we do not repeat it here. Semi-colon // works in Iphone and Android also to pop up a button with the extension number following. String autoDiallingAndExtLabelsFound = "(?:,{2}|;)"; String autoDiallingExtn = possibleSeparatorsNumberExtLabelNoComma + autoDiallingAndExtLabelsFound + possibleCharsAfterExtLabel + extnDigits(extLimitAfterLikelyLabel) + optionalExtnSuffix; String onlyCommasExtn = possibleSeparatorsNumberExtLabelNoComma + "(?:,)+" + possibleCharsAfterExtLabel + extnDigits(extLimitAfterAmbiguousChar) + optionalExtnSuffix; // Here the first pattern is exclusively for extension autodialling formats which are used // when dialling and in this case we accept longer extensions. However, the second pattern // is more liberal on the number of commas that acts as extension labels, so we have a strict // cap on the number of digits in such extensions. return extensionPattern + "|" + autoDiallingExtn + "|" + onlyCommasExtn; } return extensionPattern; } // Regexp of all known extension prefixes used by different regions followed by 1 or more valid // digits, for use when parsing. private static final Pattern EXTN_PATTERN = Pattern.compile("(?:" + EXTN_PATTERNS_FOR_PARSING + ")$", REGEX_FLAGS); // We append optionally the extension pattern to the end here, as a valid phone number may // have an extension prefix appended, followed by 1 or more digits. private static final Pattern VALID_PHONE_NUMBER_PATTERN = Pattern.compile(VALID_PHONE_NUMBER + "(?:" + EXTN_PATTERNS_FOR_PARSING + ")?", REGEX_FLAGS); static final Pattern NON_DIGITS_PATTERN = Pattern.compile("(\\D+)"); // The FIRST_GROUP_PATTERN was originally set to $1 but there are some countries for which the // first group is not used in the national pattern (e.g. Argentina) so the $1 group does not match // correctly. Therefore, we use \d, so that the first group actually used in the pattern will be // matched. private static final Pattern FIRST_GROUP_PATTERN = Pattern.compile("(\\$\\d)"); // Constants used in the formatting rules to represent the national prefix, first group and // carrier code respectively. private static final String NP_STRING = "$NP"; private static final String FG_STRING = "$FG"; private static final String CC_STRING = "$CC"; // A pattern that is used to determine if the national prefix formatting rule has the first group // only, i.e., does not start with the national prefix. Note that the pattern explicitly allows // for unbalanced parentheses. private static final Pattern FIRST_GROUP_ONLY_PREFIX_PATTERN = Pattern.compile("\\(?\\$1\\)?"); private static PhoneNumberUtil instance = null; public static final String REGION_CODE_FOR_NON_GEO_ENTITY = "001"; /** * INTERNATIONAL and NATIONAL formats are consistent with the definition in ITU-T Recommendation * E.123. However we follow local conventions such as using '-' instead of whitespace as * separators. For example, the number of the Google Switzerland office will be written as * "+41 44 668 1800" in INTERNATIONAL format, and as "044 668 1800" in NATIONAL format. E164 * format is as per INTERNATIONAL format but with no formatting applied, e.g. "+41446681800". * RFC3966 is as per INTERNATIONAL format, but with all spaces and other separating symbols * replaced with a hyphen, and with any phone number extension appended with ";ext=". It also * will have a prefix of "tel:" added, e.g. "tel:+41-44-668-1800". * * Note: If you are considering storing the number in a neutral format, you are highly advised to * use the PhoneNumber class. */ public enum PhoneNumberFormat { E164, INTERNATIONAL, NATIONAL, RFC3966 } /** * Type of phone numbers. */ public enum PhoneNumberType { FIXED_LINE, MOBILE, // In some regions (e.g. the USA), it is impossible to distinguish between fixed-line and // mobile numbers by looking at the phone number itself. FIXED_LINE_OR_MOBILE, // Freephone lines TOLL_FREE, PREMIUM_RATE, // The cost of this call is shared between the caller and the recipient, and is hence typically // less than PREMIUM_RATE calls. See // http://en.wikipedia.org/wiki/Shared_Cost_Service for // more information. SHARED_COST, // Voice over IP numbers. This includes TSoIP (Telephony Service over IP). VOIP, // A personal number is associated with a particular person, and may be routed to either a // MOBILE or FIXED_LINE number. Some more information can be found here: // http://en.wikipedia.org/wiki/Personal_Numbers PERSONAL_NUMBER, PAGER, // Used for "Universal Access Numbers" or "Company Numbers". They may be further routed to // specific offices, but allow one number to be used for a company. UAN, // Used for "Voice Mail Access Numbers". VOICEMAIL, // A phone number is of type UNKNOWN when it does not fit any of the known patterns for a // specific region. UNKNOWN } /** * Types of phone number matches. See detailed description beside the isNumberMatch() method. */ public enum MatchType { NOT_A_NUMBER, NO_MATCH, SHORT_NSN_MATCH, NSN_MATCH, EXACT_MATCH, } /** * Possible outcomes when testing if a PhoneNumber is possible. */ public enum ValidationResult { /** The number length matches that of valid numbers for this region. */ IS_POSSIBLE, /** * The number length matches that of local numbers for this region only (i.e. numbers that may * be able to be dialled within an area, but do not have all the information to be dialled from * anywhere inside or outside the country). */ IS_POSSIBLE_LOCAL_ONLY, /** The number has an invalid country calling code. */ INVALID_COUNTRY_CODE, /** The number is shorter than all valid numbers for this region. */ TOO_SHORT, /** * The number is longer than the shortest valid numbers for this region, shorter than the * longest valid numbers for this region, and does not itself have a number length that matches * valid numbers for this region. This can also be returned in the case where * isPossibleNumberForTypeWithReason was called, and there are no numbers of this type at all * for this region. */ INVALID_LENGTH, /** The number is longer than all valid numbers for this region. */ TOO_LONG, } /** * Leniency when {@linkplain PhoneNumberUtil#findNumbers finding} potential phone numbers in text * segments. The levels here are ordered in increasing strictness. */ public enum Leniency { /** * Phone numbers accepted are {@linkplain PhoneNumberUtil#isPossibleNumber(PhoneNumber) * possible}, but not necessarily {@linkplain PhoneNumberUtil#isValidNumber(PhoneNumber) valid}. */ POSSIBLE { @Override boolean verify( PhoneNumber number, CharSequence candidate, PhoneNumberUtil util, PhoneNumberMatcher matcher) { return util.isPossibleNumber(number); } }, /** * Phone numbers accepted are {@linkplain PhoneNumberUtil#isPossibleNumber(PhoneNumber) * possible} and {@linkplain PhoneNumberUtil#isValidNumber(PhoneNumber) valid}. Numbers written * in national format must have their national-prefix present if it is usually written for a * number of this type. */ VALID { @Override boolean verify( PhoneNumber number, CharSequence candidate, PhoneNumberUtil util, PhoneNumberMatcher matcher) { if (!util.isValidNumber(number) || !PhoneNumberMatcher.containsOnlyValidXChars(number, candidate.toString(), util)) { return false; } return PhoneNumberMatcher.isNationalPrefixPresentIfRequired(number, util); } }, /** * Phone numbers accepted are {@linkplain PhoneNumberUtil#isValidNumber(PhoneNumber) valid} and * are grouped in a possible way for this locale. For example, a US number written as * "65 02 53 00 00" and "650253 0000" are not accepted at this leniency level, whereas * "650 253 0000", "650 2530000" or "6502530000" are. * Numbers with more than one '/' symbol in the national significant number are also dropped at * this level. *

* Warning: This level might result in lower coverage especially for regions outside of country * code "+1". If you are not sure about which level to use, email the discussion group * [email protected]. */ STRICT_GROUPING { @Override boolean verify( PhoneNumber number, CharSequence candidate, PhoneNumberUtil util, PhoneNumberMatcher matcher) { String candidateString = candidate.toString(); if (!util.isValidNumber(number) || !PhoneNumberMatcher.containsOnlyValidXChars(number, candidateString, util) || PhoneNumberMatcher.containsMoreThanOneSlashInNationalNumber(number, candidateString) || !PhoneNumberMatcher.isNationalPrefixPresentIfRequired(number, util)) { return false; } return matcher.checkNumberGroupingIsValid( number, candidate, util, new PhoneNumberMatcher.NumberGroupingChecker() { @Override public boolean checkGroups(PhoneNumberUtil util, PhoneNumber number, StringBuilder normalizedCandidate, String[] expectedNumberGroups) { return PhoneNumberMatcher.allNumberGroupsRemainGrouped( util, number, normalizedCandidate, expectedNumberGroups); } }); } }, /** * Phone numbers accepted are {@linkplain PhoneNumberUtil#isValidNumber(PhoneNumber) valid} and * are grouped in the same way that we would have formatted it, or as a single block. For * example, a US number written as "650 2530000" is not accepted at this leniency level, whereas * "650 253 0000" or "6502530000" are. * Numbers with more than one '/' symbol are also dropped at this level. *

* Warning: This level might result in lower coverage especially for regions outside of country * code "+1". If you are not sure about which level to use, email the discussion group * [email protected]. */ EXACT_GROUPING { @Override boolean verify( PhoneNumber number, CharSequence candidate, PhoneNumberUtil util, PhoneNumberMatcher matcher) { String candidateString = candidate.toString(); if (!util.isValidNumber(number) || !PhoneNumberMatcher.containsOnlyValidXChars(number, candidateString, util) || PhoneNumberMatcher.containsMoreThanOneSlashInNationalNumber(number, candidateString) || !PhoneNumberMatcher.isNationalPrefixPresentIfRequired(number, util)) { return false; } return matcher.checkNumberGroupingIsValid( number, candidate, util, new PhoneNumberMatcher.NumberGroupingChecker() { @Override public boolean checkGroups(PhoneNumberUtil util, PhoneNumber number, StringBuilder normalizedCandidate, String[] expectedNumberGroups) { return PhoneNumberMatcher.allNumberGroupsAreExactlyPresent( util, number, normalizedCandidate, expectedNumberGroups); } }); } }; /** Returns true if {@code number} is a verified number according to this leniency. */ abstract boolean verify( PhoneNumber number, CharSequence candidate, PhoneNumberUtil util, PhoneNumberMatcher matcher); } // A source of metadata for different regions. private final MetadataSource metadataSource; // A mapping from a country calling code to the region codes which denote the region represented // by that country calling code. In the case of multiple regions sharing a calling code, such as // the NANPA regions, the one indicated with "isMainCountryForCode" in the metadata should be // first. private final Map> countryCallingCodeToRegionCodeMap; // An API for validation checking. private final MatcherApi matcherApi = RegexBasedMatcher.create(); // The set of regions that share country calling code 1. // There are roughly 26 regions. // We set the initial capacity of the HashSet to 35 to offer a load factor of roughly 0.75. private final Set nanpaRegions = new HashSet(35); // A cache for frequently used region-specific regular expressions. // The initial capacity is set to 100 as this seems to be an optimal value for Android, based on // performance measurements. private final RegexCache regexCache = new RegexCache(100); // The set of regions the library supports. // There are roughly 240 of them and we set the initial capacity of the HashSet to 320 to offer a // load factor of roughly 0.75. private final Set supportedRegions = new HashSet(320); // The set of country calling codes that map to the non-geo entity region ("001"). This set // currently contains < 12 elements so the default capacity of 16 (load factor=0.75) is fine. private final Set countryCodesForNonGeographicalRegion = new HashSet(); /** * This class implements a singleton, the constructor is only visible to facilitate testing. */ // @VisibleForTesting PhoneNumberUtil(MetadataSource metadataSource, Map> countryCallingCodeToRegionCodeMap) { this.metadataSource = metadataSource; this.countryCallingCodeToRegionCodeMap = countryCallingCodeToRegionCodeMap; for (Map.Entry> entry : countryCallingCodeToRegionCodeMap.entrySet()) { List regionCodes = entry.getValue(); // We can assume that if the country calling code maps to the non-geo entity region code then // that's the only region code it maps to. if (regionCodes.size() == 1 && REGION_CODE_FOR_NON_GEO_ENTITY.equals(regionCodes.get(0))) { // This is the subset of all country codes that map to the non-geo entity region code. countryCodesForNonGeographicalRegion.add(entry.getKey()); } else { // The supported regions set does not include the "001" non-geo entity region code. supportedRegions.addAll(regionCodes); } } // If the non-geo entity still got added to the set of supported regions it must be because // there are entries that list the non-geo entity alongside normal regions (which is wrong). // If we discover this, remove the non-geo entity from the set of supported regions and log. if (supportedRegions.remove(REGION_CODE_FOR_NON_GEO_ENTITY)) { logger.log(Level.WARNING, "invalid metadata (country calling code was mapped to the non-geo " + "entity as well as specific region(s))"); } nanpaRegions.addAll(countryCallingCodeToRegionCodeMap.get(NANPA_COUNTRY_CODE)); } /** * Attempts to extract a possible number from the string passed in. This currently strips all * leading characters that cannot be used to start a phone number. Characters that can be used to * start a phone number are defined in the VALID_START_CHAR_PATTERN. If none of these characters * are found in the number passed in, an empty string is returned. This function also attempts to * strip off any alternative extensions or endings if two or more are present, such as in the case * of: (530) 583-6985 x302/x2303. The second extension here makes this actually two phone numbers, * (530) 583-6985 x302 and (530) 583-6985 x2303. We remove the second extension so that the first * number is parsed correctly. * * @param number the string that might contain a phone number * @return the number, stripped of any non-phone-number prefix (such as "Tel:") or an empty * string if no character used to start phone numbers (such as + or any digit) is found in the * number */ static CharSequence extractPossibleNumber(CharSequence number) { Matcher m = VALID_START_CHAR_PATTERN.matcher(number); if (m.find()) { number = number.subSequence(m.start(), number.length()); // Remove trailing non-alpha non-numerical characters. Matcher trailingCharsMatcher = UNWANTED_END_CHAR_PATTERN.matcher(number); if (trailingCharsMatcher.find()) { number = number.subSequence(0, trailingCharsMatcher.start()); } // Check for extra numbers at the end. Matcher secondNumber = SECOND_NUMBER_START_PATTERN.matcher(number); if (secondNumber.find()) { number = number.subSequence(0, secondNumber.start()); } return number; } else { return ""; } } /** * Checks to see if the string of characters could possibly be a phone number at all. At the * moment, checks to see that the string begins with at least 2 digits, ignoring any punctuation * commonly found in phone numbers. * This method does not require the number to be normalized in advance - but does assume that * leading non-number symbols have been removed, such as by the method extractPossibleNumber. * * @param number string to be checked for viability as a phone number * @return true if the number could be a phone number of some sort, otherwise false */ // @VisibleForTesting static boolean isViablePhoneNumber(CharSequence number) { if (number.length() < MIN_LENGTH_FOR_NSN) { return false; } Matcher m = VALID_PHONE_NUMBER_PATTERN.matcher(number); return m.matches(); } /** * Normalizes a string of characters representing a phone number. This performs the following * conversions: * - Punctuation is stripped. * For ALPHA/VANITY numbers: * - Letters are converted to their numeric representation on a telephone keypad. The keypad * used here is the one defined in ITU Recommendation E.161. This is only done if there are 3 * or more letters in the number, to lessen the risk that such letters are typos. * For other numbers: * - Wide-ascii digits are converted to normal ASCII (European) digits. * - Arabic-Indic numerals are converted to European numerals. * - Spurious alpha characters are stripped. * * @param number a StringBuilder of characters representing a phone number that will be * normalized in place */ static StringBuilder normalize(StringBuilder number) { Matcher m = VALID_ALPHA_PHONE_PATTERN.matcher(number); if (m.matches()) { number.replace(0, number.length(), normalizeHelper(number, ALPHA_PHONE_MAPPINGS, true)); } else { number.replace(0, number.length(), normalizeDigitsOnly(number)); } return number; } /** * Normalizes a string of characters representing a phone number. This converts wide-ascii and * arabic-indic numerals to European numerals, and strips punctuation and alpha characters. * * @param number a string of characters representing a phone number * @return the normalized string version of the phone number */ public static String normalizeDigitsOnly(CharSequence number) { return normalizeDigits(number, false /* strip non-digits */).toString(); } static StringBuilder normalizeDigits(CharSequence number, boolean keepNonDigits) { StringBuilder normalizedDigits = new StringBuilder(number.length()); for (int i = 0; i < number.length(); i++) { char c = number.charAt(i); int digit = Character.digit(c, 10); if (digit != -1) { normalizedDigits.append(digit); } else if (keepNonDigits) { normalizedDigits.append(c); } } return normalizedDigits; } /** * Normalizes a string of characters representing a phone number. This strips all characters which * are not diallable on a mobile phone keypad (including all non-ASCII digits). * * @param number a string of characters representing a phone number * @return the normalized string version of the phone number */ public static String normalizeDiallableCharsOnly(CharSequence number) { return normalizeHelper(number, DIALLABLE_CHAR_MAPPINGS, true /* remove non matches */); } /** * Converts all alpha characters in a number to their respective digits on a keypad, but retains * existing formatting. */ public static String convertAlphaCharactersInNumber(CharSequence number) { return normalizeHelper(number, ALPHA_PHONE_MAPPINGS, false); } /** * Gets the length of the geographical area code from the * PhoneNumber object passed in, so that clients could use it * to split a national significant number into geographical area code and subscriber number. It * works in such a way that the resultant subscriber number should be diallable, at least on some * devices. An example of how this could be used: * *

{@code
   * PhoneNumberUtil phoneUtil = PhoneNumberUtil.getInstance();
   * PhoneNumber number = phoneUtil.parse("16502530000", "US");
   * String nationalSignificantNumber = phoneUtil.getNationalSignificantNumber(number);
   * String areaCode;
   * String subscriberNumber;
   *
   * int areaCodeLength = phoneUtil.getLengthOfGeographicalAreaCode(number);
   * if (areaCodeLength > 0) {
   *   areaCode = nationalSignificantNumber.substring(0, areaCodeLength);
   *   subscriberNumber = nationalSignificantNumber.substring(areaCodeLength);
   * } else {
   *   areaCode = "";
   *   subscriberNumber = nationalSignificantNumber;
   * }
   * }
* * N.B.: area code is a very ambiguous concept, so the I18N team generally recommends against * using it for most purposes, but recommends using the more general {@code national_number} * instead. Read the following carefully before deciding to use this method: *
    *
  • geographical area codes change over time, and this method honors those changes; * therefore, it doesn't guarantee the stability of the result it produces. *
  • subscriber numbers may not be diallable from all devices (notably mobile devices, which * typically requires the full national_number to be dialled in most regions). *
  • most non-geographical numbers have no area codes, including numbers from non-geographical * entities *
  • some geographical numbers have no area codes. *
* @param number the PhoneNumber object for which clients * want to know the length of the area code * @return the length of area code of the PhoneNumber object * passed in */ public int getLengthOfGeographicalAreaCode(PhoneNumber number) { PhoneMetadata metadata = getMetadataForRegion(getRegionCodeForNumber(number)); if (metadata == null) { return 0; } // If a country doesn't use a national prefix, and this number doesn't have an Italian leading // zero, we assume it is a closed dialling plan with no area codes. if (!metadata.hasNationalPrefix() && !number.isItalianLeadingZero()) { return 0; } PhoneNumberType type = getNumberType(number); int countryCallingCode = number.getCountryCode(); if (type == PhoneNumberType.MOBILE // Note this is a rough heuristic; it doesn't cover Indonesia well, for example, where area // codes are present for some mobile phones but not for others. We have no better way of // representing this in the metadata at this point. && GEO_MOBILE_COUNTRIES_WITHOUT_MOBILE_AREA_CODES.contains(countryCallingCode)) { return 0; } if (!isNumberGeographical(type, countryCallingCode)) { return 0; } return getLengthOfNationalDestinationCode(number); } /** * Gets the length of the national destination code (NDC) from the * PhoneNumber object passed in, so that clients could use it * to split a national significant number into NDC and subscriber number. The NDC of a phone * number is normally the first group of digit(s) right after the country calling code when the * number is formatted in the international format, if there is a subscriber number part that * follows. * * N.B.: similar to an area code, not all numbers have an NDC! * * An example of how this could be used: * *
{@code
   * PhoneNumberUtil phoneUtil = PhoneNumberUtil.getInstance();
   * PhoneNumber number = phoneUtil.parse("18002530000", "US");
   * String nationalSignificantNumber = phoneUtil.getNationalSignificantNumber(number);
   * String nationalDestinationCode;
   * String subscriberNumber;
   *
   * int nationalDestinationCodeLength = phoneUtil.getLengthOfNationalDestinationCode(number);
   * if (nationalDestinationCodeLength > 0) {
   *   nationalDestinationCode = nationalSignificantNumber.substring(0,
   *       nationalDestinationCodeLength);
   *   subscriberNumber = nationalSignificantNumber.substring(nationalDestinationCodeLength);
   * } else {
   *   nationalDestinationCode = "";
   *   subscriberNumber = nationalSignificantNumber;
   * }
   * }
* * Refer to the unittests to see the difference between this function and * {@link #getLengthOfGeographicalAreaCode}. * * @param number the PhoneNumber object for which clients * want to know the length of the NDC * @return the length of NDC of the PhoneNumber object * passed in, which could be zero */ public int getLengthOfNationalDestinationCode(PhoneNumber number) { PhoneNumber copiedProto; if (number.hasExtension()) { // We don't want to alter the proto given to us, but we don't want to include the extension // when we format it, so we copy it and clear the extension here. copiedProto = new PhoneNumber(); copiedProto.mergeFrom(number); copiedProto.clearExtension(); } else { copiedProto = number; } String nationalSignificantNumber = format(copiedProto, PhoneNumberUtil.PhoneNumberFormat.INTERNATIONAL); String[] numberGroups = NON_DIGITS_PATTERN.split(nationalSignificantNumber); // The pattern will start with "+COUNTRY_CODE " so the first group will always be the empty // string (before the + symbol) and the second group will be the country calling code. The third // group will be area code if it is not the last group. if (numberGroups.length <= 3) { return 0; } if (getNumberType(number) == PhoneNumberType.MOBILE) { // For example Argentinian mobile numbers, when formatted in the international format, are in // the form of +54 9 NDC XXXX.... As a result, we take the length of the third group (NDC) and // add the length of the second group (which is the mobile token), which also forms part of // the national significant number. This assumes that the mobile token is always formatted // separately from the rest of the phone number. String mobileToken = getCountryMobileToken(number.getCountryCode()); if (!mobileToken.equals("")) { return numberGroups[2].length() + numberGroups[3].length(); } } return numberGroups[2].length(); } /** * Returns the mobile token for the provided country calling code if it has one, otherwise * returns an empty string. A mobile token is a number inserted before the area code when dialing * a mobile number from that country from abroad. * * @param countryCallingCode the country calling code for which we want the mobile token * @return the mobile token, as a string, for the given country calling code */ public static String getCountryMobileToken(int countryCallingCode) { if (MOBILE_TOKEN_MAPPINGS.containsKey(countryCallingCode)) { return MOBILE_TOKEN_MAPPINGS.get(countryCallingCode); } return ""; } /** * Normalizes a string of characters representing a phone number by replacing all characters found * in the accompanying map with the values therein, and stripping all other characters if * removeNonMatches is true. * * @param number a string of characters representing a phone number * @param normalizationReplacements a mapping of characters to what they should be replaced by in * the normalized version of the phone number * @param removeNonMatches indicates whether characters that are not able to be replaced should * be stripped from the number. If this is false, they will be left unchanged in the number. * @return the normalized string version of the phone number */ private static String normalizeHelper(CharSequence number, Map normalizationReplacements, boolean removeNonMatches) { StringBuilder normalizedNumber = new StringBuilder(number.length()); for (int i = 0; i < number.length(); i++) { char character = number.charAt(i); Character newDigit = normalizationReplacements.get(Character.toUpperCase(character)); if (newDigit != null) { normalizedNumber.append(newDigit); } else if (!removeNonMatches) { normalizedNumber.append(character); } // If neither of the above are true, we remove this character. } return normalizedNumber.toString(); } /** * Sets or resets the PhoneNumberUtil singleton instance. If set to null, the next call to * {@code getInstance()} will load (and return) the default instance. */ // @VisibleForTesting static synchronized void setInstance(PhoneNumberUtil util) { instance = util; } /** * Returns all regions the library has metadata for. * * @return an unordered set of the two-letter region codes for every geographical region the * library supports */ public Set getSupportedRegions() { return Collections.unmodifiableSet(supportedRegions); } /** * Returns all global network calling codes the library has metadata for. * * @return an unordered set of the country calling codes for every non-geographical entity the * library supports */ public Set getSupportedGlobalNetworkCallingCodes() { return Collections.unmodifiableSet(countryCodesForNonGeographicalRegion); } /** * Returns all country calling codes the library has metadata for, covering both non-geographical * entities (global network calling codes) and those used for geographical entities. This could be * used to populate a drop-down box of country calling codes for a phone-number widget, for * instance. * * @return an unordered set of the country calling codes for every geographical and * non-geographical entity the library supports */ public Set getSupportedCallingCodes() { return Collections.unmodifiableSet(countryCallingCodeToRegionCodeMap.keySet()); } /** * Returns true if there is any possible number data set for a particular PhoneNumberDesc. */ private static boolean descHasPossibleNumberData(PhoneNumberDesc desc) { // If this is empty, it means numbers of this type inherit from the "general desc" -> the value // "-1" means that no numbers exist for this type. return desc.getPossibleLengthCount() != 1 || desc.getPossibleLength(0) != -1; } // Note: descHasData must account for any of MetadataFilter's excludableChildFields potentially // being absent from the metadata. It must check them all. For any changes in descHasData, ensure // that all the excludableChildFields are still being checked. If your change is safe simply // mention why during a review without needing to change MetadataFilter. /** * Returns true if there is any data set for a particular PhoneNumberDesc. */ private static boolean descHasData(PhoneNumberDesc desc) { // Checking most properties since we don't know what's present, since a custom build may have // stripped just one of them (e.g. liteBuild strips exampleNumber). We don't bother checking the // possibleLengthsLocalOnly, since if this is the only thing that's present we don't really // support the type at all: no type-specific methods will work with only this data. return desc.hasExampleNumber() || descHasPossibleNumberData(desc) || desc.hasNationalNumberPattern(); } /** * Returns the types we have metadata for based on the PhoneMetadata object passed in, which must * be non-null. */ private Set getSupportedTypesForMetadata(PhoneMetadata metadata) { Set types = new TreeSet(); for (PhoneNumberType type : PhoneNumberType.values()) { if (type == PhoneNumberType.FIXED_LINE_OR_MOBILE || type == PhoneNumberType.UNKNOWN) { // Never return FIXED_LINE_OR_MOBILE (it is a convenience type, and represents that a // particular number type can't be determined) or UNKNOWN (the non-type). continue; } if (descHasData(getNumberDescByType(metadata, type))) { types.add(type); } } return Collections.unmodifiableSet(types); } /** * Returns the types for a given region which the library has metadata for. Will not include * FIXED_LINE_OR_MOBILE (if numbers in this region could be classified as FIXED_LINE_OR_MOBILE, * both FIXED_LINE and MOBILE would be present) and UNKNOWN. * * No types will be returned for invalid or unknown region codes. */ public Set getSupportedTypesForRegion(String regionCode) { if (!isValidRegionCode(regionCode)) { logger.log(Level.WARNING, "Invalid or unknown region code provided: " + regionCode); return Collections.unmodifiableSet(new TreeSet()); } PhoneMetadata metadata = getMetadataForRegion(regionCode); return getSupportedTypesForMetadata(metadata); } /** * Returns the types for a country-code belonging to a non-geographical entity which the library * has metadata for. Will not include FIXED_LINE_OR_MOBILE (if numbers for this non-geographical * entity could be classified as FIXED_LINE_OR_MOBILE, both FIXED_LINE and MOBILE would be * present) and UNKNOWN. * * No types will be returned for country calling codes that do not map to a known non-geographical * entity. */ public Set getSupportedTypesForNonGeoEntity(int countryCallingCode) { PhoneMetadata metadata = getMetadataForNonGeographicalRegion(countryCallingCode); if (metadata == null) { logger.log(Level.WARNING, "Unknown country calling code for a non-geographical entity " + "provided: " + countryCallingCode); return Collections.unmodifiableSet(new TreeSet()); } return getSupportedTypesForMetadata(metadata); } /** * Gets a {@link PhoneNumberUtil} instance to carry out international phone number formatting, * parsing, or validation. The instance is loaded with all phone number metadata. * *

The {@link PhoneNumberUtil} is implemented as a singleton. Therefore, calling getInstance * multiple times will only result in one instance being created. * * @return a PhoneNumberUtil instance */ public static synchronized PhoneNumberUtil getInstance() { if (instance == null) { setInstance(createInstance(MetadataManager.DEFAULT_METADATA_LOADER)); } return instance; } /** * Create a new {@link PhoneNumberUtil} instance to carry out international phone number * formatting, parsing, or validation. The instance is loaded with all metadata by * using the metadataLoader specified. * *

This method should only be used in the rare case in which you want to manage your own * metadata loading. Calling this method multiple times is very expensive, as each time * a new instance is created from scratch. When in doubt, use {@link #getInstance}. * * @param metadataLoader customized metadata loader. This should not be null * @return a PhoneNumberUtil instance */ public static PhoneNumberUtil createInstance(MetadataLoader metadataLoader) { if (metadataLoader == null) { throw new IllegalArgumentException("metadataLoader could not be null."); } return createInstance(new MultiFileMetadataSourceImpl(metadataLoader)); } /** * Create a new {@link PhoneNumberUtil} instance to carry out international phone number * formatting, parsing, or validation. The instance is loaded with all metadata by * using the metadataSource specified. * *

This method should only be used in the rare case in which you want to manage your own * metadata loading. Calling this method multiple times is very expensive, as each time * a new instance is created from scratch. When in doubt, use {@link #getInstance}. * * @param metadataSource customized metadata source. This should not be null * @return a PhoneNumberUtil instance */ private static PhoneNumberUtil createInstance(MetadataSource metadataSource) { if (metadataSource == null) { throw new IllegalArgumentException("metadataSource could not be null."); } return new PhoneNumberUtil(metadataSource, CountryCodeToRegionCodeMap.getCountryCodeToRegionCodeMap()); } /** * Helper function to check if the national prefix formatting rule has the first group only, i.e., * does not start with the national prefix. */ static boolean formattingRuleHasFirstGroupOnly(String nationalPrefixFormattingRule) { return nationalPrefixFormattingRule.length() == 0 || FIRST_GROUP_ONLY_PREFIX_PATTERN.matcher(nationalPrefixFormattingRule).matches(); } /** * Tests whether a phone number has a geographical association. It checks if the number is * associated with a certain region in the country to which it belongs. Note that this doesn't * verify if the number is actually in use. */ public boolean isNumberGeographical(PhoneNumber phoneNumber) { return isNumberGeographical(getNumberType(phoneNumber), phoneNumber.getCountryCode()); } /** * Overload of isNumberGeographical(PhoneNumber), since calculating the phone number type is * expensive; if we have already done this, we don't want to do it again. */ public boolean isNumberGeographical(PhoneNumberType phoneNumberType, int countryCallingCode) { return phoneNumberType == PhoneNumberType.FIXED_LINE || phoneNumberType == PhoneNumberType.FIXED_LINE_OR_MOBILE || (GEO_MOBILE_COUNTRIES.contains(countryCallingCode) && phoneNumberType == PhoneNumberType.MOBILE); } /** * Helper function to check region code is not unknown or null. */ private boolean isValidRegionCode(String regionCode) { return regionCode != null && supportedRegions.contains(regionCode); } /** * Helper function to check the country calling code is valid. */ private boolean hasValidCountryCallingCode(int countryCallingCode) { return countryCallingCodeToRegionCodeMap.containsKey(countryCallingCode); } /** * Formats a phone number in the specified format using default rules. Note that this does not * promise to produce a phone number that the user can dial from where they are - although we do * format in either 'national' or 'international' format depending on what the client asks for, we * do not currently support a more abbreviated format, such as for users in the same "area" who * could potentially dial the number without area code. Note that if the phone number has a * country calling code of 0 or an otherwise invalid country calling code, we cannot work out * which formatting rules to apply so we return the national significant number with no formatting * applied. * * @param number the phone number to be formatted * @param numberFormat the format the phone number should be formatted into * @return the formatted phone number */ public String format(PhoneNumber number, PhoneNumberFormat numberFormat) { if (number.getNationalNumber() == 0 && number.hasRawInput()) { // Unparseable numbers that kept their raw input just use that. // This is the only case where a number can be formatted as E164 without a // leading '+' symbol (but the original number wasn't parseable anyway). // TODO: Consider removing the 'if' above so that unparseable // strings without raw input format to the empty string instead of "+00". String rawInput = number.getRawInput(); if (rawInput.length() > 0) { return rawInput; } } StringBuilder formattedNumber = new StringBuilder(20); format(number, numberFormat, formattedNumber); return formattedNumber.toString(); } /** * Same as {@link #format(PhoneNumber, PhoneNumberFormat)}, but accepts a mutable StringBuilder as * a parameter to decrease object creation when invoked many times. */ public void format(PhoneNumber number, PhoneNumberFormat numberFormat, StringBuilder formattedNumber) { // Clear the StringBuilder first. formattedNumber.setLength(0); int countryCallingCode = number.getCountryCode(); String nationalSignificantNumber = getNationalSignificantNumber(number); if (numberFormat == PhoneNumberFormat.E164) { // Early exit for E164 case (even if the country calling code is invalid) since no formatting // of the national number needs to be applied. Extensions are not formatted. formattedNumber.append(nationalSignificantNumber); prefixNumberWithCountryCallingCode(countryCallingCode, PhoneNumberFormat.E164, formattedNumber); return; } if (!hasValidCountryCallingCode(countryCallingCode)) { formattedNumber.append(nationalSignificantNumber); return; } // Note getRegionCodeForCountryCode() is used because formatting information for regions which // share a country calling code is contained by only one region for performance reasons. For // example, for NANPA regions it will be contained in the metadata for US. String regionCode = getRegionCodeForCountryCode(countryCallingCode); // Metadata cannot be null because the country calling code is valid (which means that the // region code cannot be ZZ and must be one of our supported region codes). PhoneMetadata metadata = getMetadataForRegionOrCallingCode(countryCallingCode, regionCode); formattedNumber.append(formatNsn(nationalSignificantNumber, metadata, numberFormat)); maybeAppendFormattedExtension(number, metadata, numberFormat, formattedNumber); prefixNumberWithCountryCallingCode(countryCallingCode, numberFormat, formattedNumber); } /** * Formats a phone number in the specified format using client-defined formatting rules. Note that * if the phone number has a country calling code of zero or an otherwise invalid country calling * code, we cannot work out things like whether there should be a national prefix applied, or how * to format extensions, so we return the national significant number with no formatting applied. * * @param number the phone number to be formatted * @param numberFormat the format the phone number should be formatted into * @param userDefinedFormats formatting rules specified by clients * @return the formatted phone number */ public String formatByPattern(PhoneNumber number, PhoneNumberFormat numberFormat, List userDefinedFormats) { int countryCallingCode = number.getCountryCode(); String nationalSignificantNumber = getNationalSignificantNumber(number); if (!hasValidCountryCallingCode(countryCallingCode)) { return nationalSignificantNumber; } // Note getRegionCodeForCountryCode() is used because formatting information for regions which // share a country calling code is contained by only one region for performance reasons. For // example, for NANPA regions it will be contained in the metadata for US. String regionCode = getRegionCodeForCountryCode(countryCallingCode); // Metadata cannot be null because the country calling code is valid. PhoneMetadata metadata = getMetadataForRegionOrCallingCode(countryCallingCode, regionCode); StringBuilder formattedNumber = new StringBuilder(20); NumberFormat formattingPattern = chooseFormattingPatternForNumber(userDefinedFormats, nationalSignificantNumber); if (formattingPattern == null) { // If no pattern above is matched, we format the number as a whole. formattedNumber.append(nationalSignificantNumber); } else { NumberFormat.Builder numFormatCopy = NumberFormat.newBuilder(); // Before we do a replacement of the national prefix pattern $NP with the national prefix, we // need to copy the rule so that subsequent replacements for different numbers have the // appropriate national prefix. numFormatCopy.mergeFrom(formattingPattern); String nationalPrefixFormattingRule = formattingPattern.getNationalPrefixFormattingRule(); if (nationalPrefixFormattingRule.length() > 0) { String nationalPrefix = metadata.getNationalPrefix(); if (nationalPrefix.length() > 0) { // Replace $NP with national prefix and $FG with the first group ($1). nationalPrefixFormattingRule = nationalPrefixFormattingRule.replace(NP_STRING, nationalPrefix); nationalPrefixFormattingRule = nationalPrefixFormattingRule.replace(FG_STRING, "$1"); numFormatCopy.setNationalPrefixFormattingRule(nationalPrefixFormattingRule); } else { // We don't want to have a rule for how to format the national prefix if there isn't one. numFormatCopy.clearNationalPrefixFormattingRule(); } } formattedNumber.append( formatNsnUsingPattern(nationalSignificantNumber, numFormatCopy.build(), numberFormat)); } maybeAppendFormattedExtension(number, metadata, numberFormat, formattedNumber); prefixNumberWithCountryCallingCode(countryCallingCode, numberFormat, formattedNumber); return formattedNumber.toString(); } /** * Formats a phone number in national format for dialing using the carrier as specified in the * {@code carrierCode}. The {@code carrierCode} will always be used regardless of whether the * phone number already has a preferred domestic carrier code stored. If {@code carrierCode} * contains an empty string, returns the number in national format without any carrier code. * * @param number the phone number to be formatted * @param carrierCode the carrier selection code to be used * @return the formatted phone number in national format for dialing using the carrier as * specified in the {@code carrierCode} */ public String formatNationalNumberWithCarrierCode(PhoneNumber number, CharSequence carrierCode) { int countryCallingCode = number.getCountryCode(); String nationalSignificantNumber = getNationalSignificantNumber(number); if (!hasValidCountryCallingCode(countryCallingCode)) { return nationalSignificantNumber; } // Note getRegionCodeForCountryCode() is used because formatting information for regions which // share a country calling code is contained by only one region for performance reasons. For // example, for NANPA regions it will be contained in the metadata for US. String regionCode = getRegionCodeForCountryCode(countryCallingCode); // Metadata cannot be null because the country calling code is valid. PhoneMetadata metadata = getMetadataForRegionOrCallingCode(countryCallingCode, regionCode); StringBuilder formattedNumber = new StringBuilder(20); formattedNumber.append(formatNsn(nationalSignificantNumber, metadata, PhoneNumberFormat.NATIONAL, carrierCode)); maybeAppendFormattedExtension(number, metadata, PhoneNumberFormat.NATIONAL, formattedNumber); prefixNumberWithCountryCallingCode(countryCallingCode, PhoneNumberFormat.NATIONAL, formattedNumber); return formattedNumber.toString(); } private PhoneMetadata getMetadataForRegionOrCallingCode( int countryCallingCode, String regionCode) { return REGION_CODE_FOR_NON_GEO_ENTITY.equals(regionCode) ? getMetadataForNonGeographicalRegion(countryCallingCode) : getMetadataForRegion(regionCode); } /** * Formats a phone number in national format for dialing using the carrier as specified in the * preferredDomesticCarrierCode field of the PhoneNumber object passed in. If that is missing, * use the {@code fallbackCarrierCode} passed in instead. If there is no * {@code preferredDomesticCarrierCode}, and the {@code fallbackCarrierCode} contains an empty * string, return the number in national format without any carrier code. * *

Use {@link #formatNationalNumberWithCarrierCode} instead if the carrier code passed in * should take precedence over the number's {@code preferredDomesticCarrierCode} when formatting. * * @param number the phone number to be formatted * @param fallbackCarrierCode the carrier selection code to be used, if none is found in the * phone number itself * @return the formatted phone number in national format for dialing using the number's * {@code preferredDomesticCarrierCode}, or the {@code fallbackCarrierCode} passed in if * none is found */ public String formatNationalNumberWithPreferredCarrierCode(PhoneNumber number, CharSequence fallbackCarrierCode) { return formatNationalNumberWithCarrierCode(number, // Historically, we set this to an empty string when parsing with raw input if none was // found in the input string. However, this doesn't result in a number we can dial. For this // reason, we treat the empty string the same as if it isn't set at all. number.getPreferredDomesticCarrierCode().length() > 0 ? number.getPreferredDomesticCarrierCode() : fallbackCarrierCode); } /** * Returns a number formatted in such a way that it can be dialed from a mobile phone in a * specific region. If the number cannot be reached from the region (e.g. some countries block * toll-free numbers from being called outside of the country), the method returns an empty * string. * * @param number the phone number to be formatted * @param regionCallingFrom the region where the call is being placed * @param withFormatting whether the number should be returned with formatting symbols, such as * spaces and dashes. * @return the formatted phone number */ public String formatNumberForMobileDialing(PhoneNumber number, String regionCallingFrom, boolean withFormatting) { int countryCallingCode = number.getCountryCode(); if (!hasValidCountryCallingCode(countryCallingCode)) { return number.hasRawInput() ? number.getRawInput() : ""; } String formattedNumber = ""; // Clear the extension, as that part cannot normally be dialed together with the main number. PhoneNumber numberNoExt = new PhoneNumber().mergeFrom(number).clearExtension(); String regionCode = getRegionCodeForCountryCode(countryCallingCode); PhoneNumberType numberType = getNumberType(numberNoExt); boolean isValidNumber = (numberType != PhoneNumberType.UNKNOWN); if (regionCallingFrom.equals(regionCode)) { boolean isFixedLineOrMobile = (numberType == PhoneNumberType.FIXED_LINE) || (numberType == PhoneNumberType.MOBILE) || (numberType == PhoneNumberType.FIXED_LINE_OR_MOBILE); // Carrier codes may be needed in some countries. We handle this here. if (regionCode.equals("CO") && numberType == PhoneNumberType.FIXED_LINE) { formattedNumber = formatNationalNumberWithCarrierCode(numberNoExt, COLOMBIA_MOBILE_TO_FIXED_LINE_PREFIX); } else if (regionCode.equals("BR") && isFixedLineOrMobile) { // Historically, we set this to an empty string when parsing with raw input if none was // found in the input string. However, this doesn't result in a number we can dial. For this // reason, we treat the empty string the same as if it isn't set at all. formattedNumber = numberNoExt.getPreferredDomesticCarrierCode().length() > 0 ? formattedNumber = formatNationalNumberWithPreferredCarrierCode(numberNoExt, "") // Brazilian fixed line and mobile numbers need to be dialed with a carrier code when // called within Brazil. Without that, most of the carriers won't connect the call. // Because of that, we return an empty string here. : ""; } else if (countryCallingCode == NANPA_COUNTRY_CODE) { // For NANPA countries, we output international format for numbers that can be dialed // internationally, since that always works, except for numbers which might potentially be // short numbers, which are always dialled in national format. PhoneMetadata regionMetadata = getMetadataForRegion(regionCallingFrom); if (canBeInternationallyDialled(numberNoExt) && testNumberLength(getNationalSignificantNumber(numberNoExt), regionMetadata) != ValidationResult.TOO_SHORT) { formattedNumber = format(numberNoExt, PhoneNumberFormat.INTERNATIONAL); } else { formattedNumber = format(numberNoExt, PhoneNumberFormat.NATIONAL); } } else { // For non-geographical countries, and Mexican, Chilean, and Uzbek fixed line and mobile // numbers, we output international format for numbers that can be dialed internationally as // that always works. if ((regionCode.equals(REGION_CODE_FOR_NON_GEO_ENTITY) // MX fixed line and mobile numbers should always be formatted in international format, // even when dialed within MX. For national format to work, a carrier code needs to be // used, and the correct carrier code depends on if the caller and callee are from the // same local area. It is trickier to get that to work correctly than using // international format, which is tested to work fine on all carriers. // CL fixed line numbers need the national prefix when dialing in the national format, // but don't have it when used for display. The reverse is true for mobile numbers. As // a result, we output them in the international format to make it work. // UZ mobile and fixed-line numbers have to be formatted in international format or // prefixed with special codes like 03, 04 (for fixed-line) and 05 (for mobile) for // dialling successfully from mobile devices. As we do not have complete information on // special codes and to be consistent with formatting across all phone types we return // the number in international format here. || ((regionCode.equals("MX") || regionCode.equals("CL") || regionCode.equals("UZ")) && isFixedLineOrMobile)) && canBeInternationallyDialled(numberNoExt)) { formattedNumber = format(numberNoExt, PhoneNumberFormat.INTERNATIONAL); } else { formattedNumber = format(numberNoExt, PhoneNumberFormat.NATIONAL); } } } else if (isValidNumber && canBeInternationallyDialled(numberNoExt)) { // We assume that short numbers are not diallable from outside their region, so if a number // is not a valid regular length phone number, we treat it as if it cannot be internationally // dialled. return withFormatting ? format(numberNoExt, PhoneNumberFormat.INTERNATIONAL) : format(numberNoExt, PhoneNumberFormat.E164); } return withFormatting ? formattedNumber : normalizeDiallableCharsOnly(formattedNumber); } /** * Formats a phone number for out-of-country dialing purposes. If no regionCallingFrom is * supplied, we format the number in its INTERNATIONAL format. If the country calling code is the * same as that of the region where the number is from, then NATIONAL formatting will be applied. * *

If the number itself has a country calling code of zero or an otherwise invalid country * calling code, then we return the number with no formatting applied. * *

Note this function takes care of the case for calling inside of NANPA and between Russia and * Kazakhstan (who share the same country calling code). In those cases, no international prefix * is used. For regions which have multiple international prefixes, the number in its * INTERNATIONAL format will be returned instead. * * @param number the phone number to be formatted * @param regionCallingFrom the region where the call is being placed * @return the formatted phone number */ public String formatOutOfCountryCallingNumber(PhoneNumber number, String regionCallingFrom) { if (!isValidRegionCode(regionCallingFrom)) { logger.log(Level.WARNING, "Trying to format number from invalid region " + regionCallingFrom + ". International formatting applied."); return format(number, PhoneNumberFormat.INTERNATIONAL); } int countryCallingCode = number.getCountryCode(); String nationalSignificantNumber = getNationalSignificantNumber(number); if (!hasValidCountryCallingCode(countryCallingCode)) { return nationalSignificantNumber; } if (countryCallingCode == NANPA_COUNTRY_CODE) { if (isNANPACountry(regionCallingFrom)) { // For NANPA regions, return the national format for these regions but prefix it with the // country calling code. return countryCallingCode + " " + format(number, PhoneNumberFormat.NATIONAL); } } else if (countryCallingCode == getCountryCodeForValidRegion(regionCallingFrom)) { // If regions share a country calling code, the country calling code need not be dialled. // This also applies when dialling within a region, so this if clause covers both these cases. // Technically this is the case for dialling from La Reunion to other overseas departments of // France (French Guiana, Martinique, Guadeloupe), but not vice versa - so we don't cover this // edge case for now and for those cases return the version including country calling code. // Details here: http://www.petitfute.com/voyage/225-info-pratiques-reunion return format(number, PhoneNumberFormat.NATIONAL); } // Metadata cannot be null because we checked 'isValidRegionCode()' above. PhoneMetadata metadataForRegionCallingFrom = getMetadataForRegion(regionCallingFrom); String internationalPrefix = metadataForRegionCallingFrom.getInternationalPrefix(); // In general, if there is a preferred international prefix, use that. Otherwise, for regions // that have multiple international prefixes, the international format of the number is // returned since we would not know which one to use. String internationalPrefixForFormatting = ""; if (metadataForRegionCallingFrom.hasPreferredInternationalPrefix()) { internationalPrefixForFormatting = metadataForRegionCallingFrom.getPreferredInternationalPrefix(); } else if (SINGLE_INTERNATIONAL_PREFIX.matcher(internationalPrefix).matches()) { internationalPrefixForFormatting = internationalPrefix; } String regionCode = getRegionCodeForCountryCode(countryCallingCode); // Metadata cannot be null because the country calling code is valid. PhoneMetadata metadataForRegion = getMetadataForRegionOrCallingCode(countryCallingCode, regionCode); String formattedNationalNumber = formatNsn(nationalSignificantNumber, metadataForRegion, PhoneNumberFormat.INTERNATIONAL); StringBuilder formattedNumber = new StringBuilder(formattedNationalNumber); maybeAppendFormattedExtension(number, metadataForRegion, PhoneNumberFormat.INTERNATIONAL, formattedNumber); if (internationalPrefixForFormatting.length() > 0) { formattedNumber.insert(0, " ").insert(0, countryCallingCode).insert(0, " ") .insert(0, internationalPrefixForFormatting); } else { prefixNumberWithCountryCallingCode(countryCallingCode, PhoneNumberFormat.INTERNATIONAL, formattedNumber); } return formattedNumber.toString(); } /** * Formats a phone number using the original phone number format that the number is parsed from. * The original format is embedded in the country_code_source field of the PhoneNumber object * passed in. If such information is missing, the number will be formatted into the NATIONAL * format by default. When we don't have a formatting pattern for the number, the method returns * the raw input when it is available. * * Note this method guarantees no digit will be inserted, removed or modified as a result of * formatting. * * @param number the phone number that needs to be formatted in its original number format * @param regionCallingFrom the region whose IDD needs to be prefixed if the original number * has one * @return the formatted phone number in its original number format */ public String formatInOriginalFormat(PhoneNumber number, String regionCallingFrom) { if (number.hasRawInput() && !hasFormattingPatternForNumber(number)) { // We check if we have the formatting pattern because without that, we might format the number // as a group without national prefix. return number.getRawInput(); } if (!number.hasCountryCodeSource()) { return format(number, PhoneNumberFormat.NATIONAL); } String formattedNumber; switch (number.getCountryCodeSource()) { case FROM_NUMBER_WITH_PLUS_SIGN: formattedNumber = format(number, PhoneNumberFormat.INTERNATIONAL); break; case FROM_NUMBER_WITH_IDD: formattedNumber = formatOutOfCountryCallingNumber(number, regionCallingFrom); break; case FROM_NUMBER_WITHOUT_PLUS_SIGN: formattedNumber = format(number, PhoneNumberFormat.INTERNATIONAL).substring(1); break; case FROM_DEFAULT_COUNTRY: // Fall-through to default case. default: String regionCode = getRegionCodeForCountryCode(number.getCountryCode()); // We strip non-digits from the NDD here, and from the raw input later, so that we can // compare them easily. String nationalPrefix = getNddPrefixForRegion(regionCode, true /* strip non-digits */); String nationalFormat = format(number, PhoneNumberFormat.NATIONAL); if (nationalPrefix == null || nationalPrefix.length() == 0) { // If the region doesn't have a national prefix at all, we can safely return the national // format without worrying about a national prefix being added. formattedNumber = nationalFormat; break; } // Otherwise, we check if the original number was entered with a national prefix. if (rawInputContainsNationalPrefix( number.getRawInput(), nationalPrefix, regionCode)) { // If so, we can safely return the national format. formattedNumber = nationalFormat; break; } // Metadata cannot be null here because getNddPrefixForRegion() (above) returns null if // there is no metadata for the region. PhoneMetadata metadata = getMetadataForRegion(regionCode); String nationalNumber = getNationalSignificantNumber(number); NumberFormat formatRule = chooseFormattingPatternForNumber(metadata.getNumberFormatList(), nationalNumber); // The format rule could still be null here if the national number was 0 and there was no // raw input (this should not be possible for numbers generated by the phonenumber library // as they would also not have a country calling code and we would have exited earlier). if (formatRule == null) { formattedNumber = nationalFormat; break; } // When the format we apply to this number doesn't contain national prefix, we can just // return the national format. // TODO: Refactor the code below with the code in // isNationalPrefixPresentIfRequired. String candidateNationalPrefixRule = formatRule.getNationalPrefixFormattingRule(); // We assume that the first-group symbol will never be _before_ the national prefix. int indexOfFirstGroup = candidateNationalPrefixRule.indexOf("$1"); if (indexOfFirstGroup <= 0) { formattedNumber = nationalFormat; break; } candidateNationalPrefixRule = candidateNationalPrefixRule.substring(0, indexOfFirstGroup); candidateNationalPrefixRule = normalizeDigitsOnly(candidateNationalPrefixRule); if (candidateNationalPrefixRule.length() == 0) { // National prefix not used when formatting this number. formattedNumber = nationalFormat; break; } // Otherwise, we need to remove the national prefix from our output. NumberFormat.Builder numFormatCopy = NumberFormat.newBuilder(); numFormatCopy.mergeFrom(formatRule); numFormatCopy.clearNationalPrefixFormattingRule(); List numberFormats = new ArrayList(1); numberFormats.add(numFormatCopy.build()); formattedNumber = formatByPattern(number, PhoneNumberFormat.NATIONAL, numberFormats); break; } String rawInput = number.getRawInput(); // If no digit is inserted/removed/modified as a result of our formatting, we return the // formatted phone number; otherwise we return the raw input the user entered. if (formattedNumber != null && rawInput.length() > 0) { String normalizedFormattedNumber = normalizeDiallableCharsOnly(formattedNumber); String normalizedRawInput = normalizeDiallableCharsOnly(rawInput); if (!normalizedFormattedNumber.equals(normalizedRawInput)) { formattedNumber = rawInput; } } return formattedNumber; } // Check if rawInput, which is assumed to be in the national format, has a national prefix. The // national prefix is assumed to be in digits-only form. private boolean rawInputContainsNationalPrefix(String rawInput, String nationalPrefix, String regionCode) { String normalizedNationalNumber = normalizeDigitsOnly(rawInput); if (normalizedNationalNumber.startsWith(nationalPrefix)) { try { // Some Japanese numbers (e.g. 00777123) might be mistaken to contain the national prefix // when written without it (e.g. 0777123) if we just do prefix matching. To tackle that, we // check the validity of the number if the assumed national prefix is removed (777123 won't // be valid in Japan). return isValidNumber( parse(normalizedNationalNumber.substring(nationalPrefix.length()), regionCode)); } catch (NumberParseException e) { return false; } } return false; } private boolean hasFormattingPatternForNumber(PhoneNumber number) { int countryCallingCode = number.getCountryCode(); String phoneNumberRegion = getRegionCodeForCountryCode(countryCallingCode); PhoneMetadata metadata = getMetadataForRegionOrCallingCode(countryCallingCode, phoneNumberRegion); if (metadata == null) { return false; } String nationalNumber = getNationalSignificantNumber(number); NumberFormat formatRule = chooseFormattingPatternForNumber(metadata.getNumberFormatList(), nationalNumber); return formatRule != null; } /** * Formats a phone number for out-of-country dialing purposes. * * Note that in this version, if the number was entered originally using alpha characters and * this version of the number is stored in raw_input, this representation of the number will be * used rather than the digit representation. Grouping information, as specified by characters * such as "-" and " ", will be retained. * *

Caveats:

*
    *
  • This will not produce good results if the country calling code is both present in the raw * input _and_ is the start of the national number. This is not a problem in the regions * which typically use alpha numbers. *
  • This will also not produce good results if the raw input has any grouping information * within the first three digits of the national number, and if the function needs to strip * preceding digits/words in the raw input before these digits. Normally people group the * first three digits together so this is not a huge problem - and will be fixed if it * proves to be so. *
* * @param number the phone number that needs to be formatted * @param regionCallingFrom the region where the call is being placed * @return the formatted phone number */ public String formatOutOfCountryKeepingAlphaChars(PhoneNumber number, String regionCallingFrom) { String rawInput = number.getRawInput(); // If there is no raw input, then we can't keep alpha characters because there aren't any. // In this case, we return formatOutOfCountryCallingNumber. if (rawInput.length() == 0) { return formatOutOfCountryCallingNumber(number, regionCallingFrom); } int countryCode = number.getCountryCode(); if (!hasValidCountryCallingCode(countryCode)) { return rawInput; } // Strip any prefix such as country calling code, IDD, that was present. We do this by comparing // the number in raw_input with the parsed number. // To do this, first we normalize punctuation. We retain number grouping symbols such as " " // only. rawInput = normalizeHelper(rawInput, ALL_PLUS_NUMBER_GROUPING_SYMBOLS, true); // Now we trim everything before the first three digits in the parsed number. We choose three // because all valid alpha numbers have 3 digits at the start - if it does not, then we don't // trim anything at all. Similarly, if the national number was less than three digits, we don't // trim anything at all. String nationalNumber = getNationalSignificantNumber(number); if (nationalNumber.length() > 3) { int firstNationalNumberDigit = rawInput.indexOf(nationalNumber.substring(0, 3)); if (firstNationalNumberDigit != -1) { rawInput = rawInput.substring(firstNationalNumberDigit); } } PhoneMetadata metadataForRegionCallingFrom = getMetadataForRegion(regionCallingFrom); if (countryCode == NANPA_COUNTRY_CODE) { if (isNANPACountry(regionCallingFrom)) { return countryCode + " " + rawInput; } } else if (metadataForRegionCallingFrom != null && countryCode == getCountryCodeForValidRegion(regionCallingFrom)) { NumberFormat formattingPattern = chooseFormattingPatternForNumber(metadataForRegionCallingFrom.getNumberFormatList(), nationalNumber); if (formattingPattern == null) { // If no pattern above is matched, we format the original input. return rawInput; } NumberFormat.Builder newFormat = NumberFormat.newBuilder(); newFormat.mergeFrom(formattingPattern); // The first group is the first group of digits that the user wrote together. newFormat.setPattern("(\\d+)(.*)"); // Here we just concatenate them back together after the national prefix has been fixed. newFormat.setFormat("$1$2"); // Now we format using this pattern instead of the default pattern, but with the national // prefix prefixed if necessary. // This will not work in the cases where the pattern (and not the leading digits) decide // whether a national prefix needs to be used, since we have overridden the pattern to match // anything, but that is not the case in the metadata to date. return formatNsnUsingPattern(rawInput, newFormat.build(), PhoneNumberFormat.NATIONAL); } String internationalPrefixForFormatting = ""; // If an unsupported region-calling-from is entered, or a country with multiple international // prefixes, the international format of the number is returned, unless there is a preferred // international prefix. if (metadataForRegionCallingFrom != null) { String internationalPrefix = metadataForRegionCallingFrom.getInternationalPrefix(); internationalPrefixForFormatting = SINGLE_INTERNATIONAL_PREFIX.matcher(internationalPrefix).matches() ? internationalPrefix : metadataForRegionCallingFrom.getPreferredInternationalPrefix(); } StringBuilder formattedNumber = new StringBuilder(rawInput); String regionCode = getRegionCodeForCountryCode(countryCode); // Metadata cannot be null because the country calling code is valid. PhoneMetadata metadataForRegion = getMetadataForRegionOrCallingCode(countryCode, regionCode); maybeAppendFormattedExtension(number, metadataForRegion, PhoneNumberFormat.INTERNATIONAL, formattedNumber); if (internationalPrefixForFormatting.length() > 0) { formattedNumber.insert(0, " ").insert(0, countryCode).insert(0, " ") .insert(0, internationalPrefixForFormatting); } else { // Invalid region entered as country-calling-from (so no metadata was found for it) or the // region chosen has multiple international dialling prefixes. if (!isValidRegionCode(regionCallingFrom)) { logger.log(Level.WARNING, "Trying to format number from invalid region " + regionCallingFrom + ". International formatting applied."); } prefixNumberWithCountryCallingCode(countryCode, PhoneNumberFormat.INTERNATIONAL, formattedNumber); } return formattedNumber.toString(); } /** * Gets the national significant number of a phone number. Note a national significant number * doesn't contain a national prefix or any formatting. * * @param number the phone number for which the national significant number is needed * @return the national significant number of the PhoneNumber object passed in */ public String getNationalSignificantNumber(PhoneNumber number) { // If leading zero(s) have been set, we prefix this now. Note this is not a national prefix. StringBuilder nationalNumber = new StringBuilder(); if (number.isItalianLeadingZero() && number.getNumberOfLeadingZeros() > 0) { char[] zeros = new char[number.getNumberOfLeadingZeros()]; Arrays.fill(zeros, '0'); nationalNumber.append(new String(zeros)); } nationalNumber.append(number.getNationalNumber()); return nationalNumber.toString(); } /** * A helper function that is used by format and formatByPattern. */ private void prefixNumberWithCountryCallingCode(int countryCallingCode, PhoneNumberFormat numberFormat, StringBuilder formattedNumber) { switch (numberFormat) { case E164: formattedNumber.insert(0, countryCallingCode).insert(0, PLUS_SIGN); return; case INTERNATIONAL: formattedNumber.insert(0, " ").insert(0, countryCallingCode).insert(0, PLUS_SIGN); return; case RFC3966: formattedNumber.insert(0, "-").insert(0, countryCallingCode).insert(0, PLUS_SIGN) .insert(0, RFC3966_PREFIX); return; case NATIONAL: default: return; } } // Simple wrapper of formatNsn for the common case of no carrier code. private String formatNsn(String number, PhoneMetadata metadata, PhoneNumberFormat numberFormat) { return formatNsn(number, metadata, numberFormat, null); } // Note in some regions, the national number can be written in two completely different ways // depending on whether it forms part of the NATIONAL format or INTERNATIONAL format. The // numberFormat parameter here is used to specify which format to use for those cases. If a // carrierCode is specified, this will be inserted into the formatted string to replace $CC. private String formatNsn(String number, PhoneMetadata metadata, PhoneNumberFormat numberFormat, CharSequence carrierCode) { List intlNumberFormats = metadata.getIntlNumberFormatList(); // When the intlNumberFormats exists, we use that to format national number for the // INTERNATIONAL format instead of using the numberDesc.numberFormats. List availableFormats = (intlNumberFormats.size() == 0 || numberFormat == PhoneNumberFormat.NATIONAL) ? metadata.getNumberFormatList() : metadata.getIntlNumberFormatList(); NumberFormat formattingPattern = chooseFormattingPatternForNumber(availableFormats, number); return (formattingPattern == null) ? number : formatNsnUsingPattern(number, formattingPattern, numberFormat, carrierCode); } NumberFormat chooseFormattingPatternForNumber(List availableFormats, String nationalNumber) { for (NumberFormat numFormat : availableFormats) { int size = numFormat.getLeadingDigitsPatternCount(); if (size == 0 || regexCache.getPatternForRegex( // We always use the last leading_digits_pattern, as it is the most detailed. numFormat.getLeadingDigitsPattern(size - 1)).matcher(nationalNumber).lookingAt()) { Matcher m = regexCache.getPatternForRegex(numFormat.getPattern()).matcher(nationalNumber); if (m.matches()) { return numFormat; } } } return null; } // Simple wrapper of formatNsnUsingPattern for the common case of no carrier code. String formatNsnUsingPattern(String nationalNumber, NumberFormat formattingPattern, PhoneNumberFormat numberFormat) { return formatNsnUsingPattern(nationalNumber, formattingPattern, numberFormat, null); } // Note that carrierCode is optional - if null or an empty string, no carrier code replacement // will take place. private String formatNsnUsingPattern(String nationalNumber, NumberFormat formattingPattern, PhoneNumberFormat numberFormat, CharSequence carrierCode) { String numberFormatRule = formattingPattern.getFormat(); Matcher m = regexCache.getPatternForRegex(formattingPattern.getPattern()).matcher(nationalNumber); String formattedNationalNumber = ""; if (numberFormat == PhoneNumberFormat.NATIONAL && carrierCode != null && carrierCode.length() > 0 && formattingPattern.getDomesticCarrierCodeFormattingRule().length() > 0) { // Replace the $CC in the formatting rule with the desired carrier code. String carrierCodeFormattingRule = formattingPattern.getDomesticCarrierCodeFormattingRule(); carrierCodeFormattingRule = carrierCodeFormattingRule.replace(CC_STRING, carrierCode); // Now replace the $FG in the formatting rule with the first group and the carrier code // combined in the appropriate way. numberFormatRule = FIRST_GROUP_PATTERN.matcher(numberFormatRule) .replaceFirst(carrierCodeFormattingRule); formattedNationalNumber = m.replaceAll(numberFormatRule); } else { // Use the national prefix formatting rule instead. String nationalPrefixFormattingRule = formattingPattern.getNationalPrefixFormattingRule(); if (numberFormat == PhoneNumberFormat.NATIONAL && nationalPrefixFormattingRule != null && nationalPrefixFormattingRule.length() > 0) { Matcher firstGroupMatcher = FIRST_GROUP_PATTERN.matcher(numberFormatRule); formattedNationalNumber = m.replaceAll(firstGroupMatcher.replaceFirst(nationalPrefixFormattingRule)); } else { formattedNationalNumber = m.replaceAll(numberFormatRule); } } if (numberFormat == PhoneNumberFormat.RFC3966) { // Strip any leading punctuation. Matcher matcher = SEPARATOR_PATTERN.matcher(formattedNationalNumber); if (matcher.lookingAt()) { formattedNationalNumber = matcher.replaceFirst(""); } // Replace the rest with a dash between each number group. formattedNationalNumber = matcher.reset(formattedNationalNumber).replaceAll("-"); } return formattedNationalNumber; } /** * Gets a valid number for the specified region. * * @param regionCode the region for which an example number is needed * @return a valid fixed-line number for the specified region. Returns null when the metadata * does not contain such information, or the region 001 is passed in. For 001 (representing * non-geographical numbers), call {@link #getExampleNumberForNonGeoEntity} instead. */ public PhoneNumber getExampleNumber(String regionCode) { return getExampleNumberForType(regionCode, PhoneNumberType.FIXED_LINE); } /** * Gets an invalid number for the specified region. This is useful for unit-testing purposes, * where you want to test what will happen with an invalid number. Note that the number that is * returned will always be able to be parsed and will have the correct country code. It may also * be a valid *short* number/code for this region. Validity checking such numbers is handled with * {@link com.google.i18n.phonenumbers.ShortNumberInfo}. * * @param regionCode the region for which an example number is needed * @return an invalid number for the specified region. Returns null when an unsupported region or * the region 001 (Earth) is passed in. */ public PhoneNumber getInvalidExampleNumber(String regionCode) { if (!isValidRegionCode(regionCode)) { logger.log(Level.WARNING, "Invalid or unknown region code provided: " + regionCode); return null; } // We start off with a valid fixed-line number since every country supports this. Alternatively // we could start with a different number type, since fixed-line numbers typically have a wide // breadth of valid number lengths and we may have to make it very short before we get an // invalid number. PhoneNumberDesc desc = getNumberDescByType(getMetadataForRegion(regionCode), PhoneNumberType.FIXED_LINE); if (!desc.hasExampleNumber()) { // This shouldn't happen; we have a test for this. return null; } String exampleNumber = desc.getExampleNumber(); // Try and make the number invalid. We do this by changing the length. We try reducing the // length of the number, since currently no region has a number that is the same length as // MIN_LENGTH_FOR_NSN. This is probably quicker than making the number longer, which is another // alternative. We could also use the possible number pattern to extract the possible lengths of // the number to make this faster, but this method is only for unit-testing so simplicity is // preferred to performance. We don't want to return a number that can't be parsed, so we check // the number is long enough. We try all possible lengths because phone number plans often have // overlapping prefixes so the number 123456 might be valid as a fixed-line number, and 12345 as // a mobile number. It would be faster to loop in a different order, but we prefer numbers that // look closer to real numbers (and it gives us a variety of different lengths for the resulting // phone numbers - otherwise they would all be MIN_LENGTH_FOR_NSN digits long.) for (int phoneNumberLength = exampleNumber.length() - 1; phoneNumberLength >= MIN_LENGTH_FOR_NSN; phoneNumberLength--) { String numberToTry = exampleNumber.substring(0, phoneNumberLength); try { PhoneNumber possiblyValidNumber = parse(numberToTry, regionCode); if (!isValidNumber(possiblyValidNumber)) { return possiblyValidNumber; } } catch (NumberParseException e) { // Shouldn't happen: we have already checked the length, we know example numbers have // only valid digits, and we know the region code is fine. } } // We have a test to check that this doesn't happen for any of our supported regions. return null; } /** * Gets a valid number for the specified region and number type. * * @param regionCode the region for which an example number is needed * @param type the type of number that is needed * @return a valid number for the specified region and type. Returns null when the metadata * does not contain such information or if an invalid region or region 001 was entered. * For 001 (representing non-geographical numbers), call * {@link #getExampleNumberForNonGeoEntity} instead. */ public PhoneNumber getExampleNumberForType(String regionCode, PhoneNumberType type) { // Check the region code is valid. if (!isValidRegionCode(regionCode)) { logger.log(Level.WARNING, "Invalid or unknown region code provided: " + regionCode); return null; } PhoneNumberDesc desc = getNumberDescByType(getMetadataForRegion(regionCode), type); try { if (desc.hasExampleNumber()) { return parse(desc.getExampleNumber(), regionCode); } } catch (NumberParseException e) { logger.log(Level.SEVERE, e.toString()); } return null; } /** * Gets a valid number for the specified number type (it may belong to any country). * * @param type the type of number that is needed * @return a valid number for the specified type. Returns null when the metadata * does not contain such information. This should only happen when no numbers of this type are * allocated anywhere in the world anymore. */ public PhoneNumber getExampleNumberForType(PhoneNumberType type) { for (String regionCode : getSupportedRegions()) { PhoneNumber exampleNumber = getExampleNumberForType(regionCode, type); if (exampleNumber != null) { return exampleNumber; } } // If there wasn't an example number for a region, try the non-geographical entities. for (int countryCallingCode : getSupportedGlobalNetworkCallingCodes()) { PhoneNumberDesc desc = getNumberDescByType( getMetadataForNonGeographicalRegion(countryCallingCode), type); try { if (desc.hasExampleNumber()) { return parse("+" + countryCallingCode + desc.getExampleNumber(), UNKNOWN_REGION); } } catch (NumberParseException e) { logger.log(Level.SEVERE, e.toString()); } } // There are no example numbers of this type for any country in the library. return null; } /** * Gets a valid number for the specified country calling code for a non-geographical entity. * * @param countryCallingCode the country calling code for a non-geographical entity * @return a valid number for the non-geographical entity. Returns null when the metadata * does not contain such information, or the country calling code passed in does not belong * to a non-geographical entity. */ public PhoneNumber getExampleNumberForNonGeoEntity(int countryCallingCode) { PhoneMetadata metadata = getMetadataForNonGeographicalRegion(countryCallingCode); if (metadata != null) { // For geographical entities, fixed-line data is always present. However, for non-geographical // entities, this is not the case, so we have to go through different types to find the // example number. We don't check fixed-line or personal number since they aren't used by // non-geographical entities (if this changes, a unit-test will catch this.) for (PhoneNumberDesc desc : Arrays.asList(metadata.getMobile(), metadata.getTollFree(), metadata.getSharedCost(), metadata.getVoip(), metadata.getVoicemail(), metadata.getUan(), metadata.getPremiumRate())) { try { if (desc != null && desc.hasExampleNumber()) { return parse("+" + countryCallingCode + desc.getExampleNumber(), UNKNOWN_REGION); } } catch (NumberParseException e) { logger.log(Level.SEVERE, e.toString()); } } } else { logger.log(Level.WARNING, "Invalid or unknown country calling code provided: " + countryCallingCode); } return null; } /** * Appends the formatted extension of a phone number to formattedNumber, if the phone number had * an extension specified. */ private void maybeAppendFormattedExtension(PhoneNumber number, PhoneMetadata metadata, PhoneNumberFormat numberFormat, StringBuilder formattedNumber) { if (number.hasExtension() && number.getExtension().length() > 0) { if (numberFormat == PhoneNumberFormat.RFC3966) { formattedNumber.append(RFC3966_EXTN_PREFIX).append(number.getExtension()); } else { if (metadata.hasPreferredExtnPrefix()) { formattedNumber.append(metadata.getPreferredExtnPrefix()).append(number.getExtension()); } else { formattedNumber.append(DEFAULT_EXTN_PREFIX).append(number.getExtension()); } } } } PhoneNumberDesc getNumberDescByType(PhoneMetadata metadata, PhoneNumberType type) { switch (type) { case PREMIUM_RATE: return metadata.getPremiumRate(); case TOLL_FREE: return metadata.getTollFree(); case MOBILE: return metadata.getMobile(); case FIXED_LINE: case FIXED_LINE_OR_MOBILE: return metadata.getFixedLine(); case SHARED_COST: return metadata.getSharedCost(); case VOIP: return metadata.getVoip(); case PERSONAL_NUMBER: return metadata.getPersonalNumber(); case PAGER: return metadata.getPager(); case UAN: return metadata.getUan(); case VOICEMAIL: return metadata.getVoicemail(); default: return metadata.getGeneralDesc(); } } /** * Gets the type of a valid phone number. * * @param number the phone number that we want to know the type * @return the type of the phone number, or UNKNOWN if it is invalid */ public PhoneNumberType getNumberType(PhoneNumber number) { String regionCode = getRegionCodeForNumber(number); PhoneMetadata metadata = getMetadataForRegionOrCallingCode(number.getCountryCode(), regionCode); if (metadata == null) { return PhoneNumberType.UNKNOWN; } String nationalSignificantNumber = getNationalSignificantNumber(number); return getNumberTypeHelper(nationalSignificantNumber, metadata); } private PhoneNumberType getNumberTypeHelper(String nationalNumber, PhoneMetadata metadata) { if (!isNumberMatchingDesc(nationalNumber, metadata.getGeneralDesc())) { return PhoneNumberType.UNKNOWN; } if (isNumberMatchingDesc(nationalNumber, metadata.getPremiumRate())) { return PhoneNumberType.PREMIUM_RATE; } if (isNumberMatchingDesc(nationalNumber, metadata.getTollFree())) { return PhoneNumberType.TOLL_FREE; } if (isNumberMatchingDesc(nationalNumber, metadata.getSharedCost())) { return PhoneNumberType.SHARED_COST; } if (isNumberMatchingDesc(nationalNumber, metadata.getVoip())) { return PhoneNumberType.VOIP; } if (isNumberMatchingDesc(nationalNumber, metadata.getPersonalNumber())) { return PhoneNumberType.PERSONAL_NUMBER; } if (isNumberMatchingDesc(nationalNumber, metadata.getPager())) { return PhoneNumberType.PAGER; } if (isNumberMatchingDesc(nationalNumber, metadata.getUan())) { return PhoneNumberType.UAN; } if (isNumberMatchingDesc(nationalNumber, metadata.getVoicemail())) { return PhoneNumberType.VOICEMAIL; } boolean isFixedLine = isNumberMatchingDesc(nationalNumber, metadata.getFixedLine()); if (isFixedLine) { if (metadata.getSameMobileAndFixedLinePattern()) { return PhoneNumberType.FIXED_LINE_OR_MOBILE; } else if (isNumberMatchingDesc(nationalNumber, metadata.getMobile())) { return PhoneNumberType.FIXED_LINE_OR_MOBILE; } return PhoneNumberType.FIXED_LINE; } // Otherwise, test to see if the number is mobile. Only do this if certain that the patterns for // mobile and fixed line aren't the same. if (!metadata.getSameMobileAndFixedLinePattern() && isNumberMatchingDesc(nationalNumber, metadata.getMobile())) { return PhoneNumberType.MOBILE; } return PhoneNumberType.UNKNOWN; } /** * Returns the metadata for the given region code or {@code null} if the region code is invalid * or unknown. */ PhoneMetadata getMetadataForRegion(String regionCode) { if (!isValidRegionCode(regionCode)) { return null; } return metadataSource.getMetadataForRegion(regionCode); } PhoneMetadata getMetadataForNonGeographicalRegion(int countryCallingCode) { if (!countryCallingCodeToRegionCodeMap.containsKey(countryCallingCode)) { return null; } return metadataSource.getMetadataForNonGeographicalRegion(countryCallingCode); } boolean isNumberMatchingDesc(String nationalNumber, PhoneNumberDesc numberDesc) { // Check if any possible number lengths are present; if so, we use them to avoid checking the // validation pattern if they don't match. If they are absent, this means they match the general // description, which we have already checked before checking a specific number type. int actualLength = nationalNumber.length(); List possibleLengths = numberDesc.getPossibleLengthList(); if (possibleLengths.size() > 0 && !possibleLengths.contains(actualLength)) { return false; } return matcherApi.matchNationalNumber(nationalNumber, numberDesc, false); } /** * Tests whether a phone number matches a valid pattern. Note this doesn't verify the number * is actually in use, which is impossible to tell by just looking at a number itself. It only * verifies whether the parsed, canonicalised number is valid: not whether a particular series of * digits entered by the user is diallable from the region provided when parsing. For example, the * number +41 (0) 78 927 2696 can be parsed into a number with country code "41" and national * significant number "789272696". This is valid, while the original string is not diallable. * * @param number the phone number that we want to validate * @return a boolean that indicates whether the number is of a valid pattern */ public boolean isValidNumber(PhoneNumber number) { String regionCode = getRegionCodeForNumber(number); return isValidNumberForRegion(number, regionCode); } /** * Tests whether a phone number is valid for a certain region. Note this doesn't verify the number * is actually in use, which is impossible to tell by just looking at a number itself. If the * country calling code is not the same as the country calling code for the region, this * immediately exits with false. After this, the specific number pattern rules for the region are * examined. This is useful for determining for example whether a particular number is valid for * Canada, rather than just a valid NANPA number. * Warning: In most cases, you want to use {@link #isValidNumber} instead. For example, this * method will mark numbers from British Crown dependencies such as the Isle of Man as invalid for * the region "GB" (United Kingdom), since it has its own region code, "IM", which may be * undesirable. * * @param number the phone number that we want to validate * @param regionCode the region that we want to validate the phone number for * @return a boolean that indicates whether the number is of a valid pattern */ public boolean isValidNumberForRegion(PhoneNumber number, String regionCode) { int countryCode = number.getCountryCode(); PhoneMetadata metadata = getMetadataForRegionOrCallingCode(countryCode, regionCode); if ((metadata == null) || (!REGION_CODE_FOR_NON_GEO_ENTITY.equals(regionCode) && countryCode != getCountryCodeForValidRegion(regionCode))) { // Either the region code was invalid, or the country calling code for this number does not // match that of the region code. return false; } String nationalSignificantNumber = getNationalSignificantNumber(number); return getNumberTypeHelper(nationalSignificantNumber, metadata) != PhoneNumberType.UNKNOWN; } /** * Returns the region where a phone number is from. This could be used for geocoding at the region * level. Only guarantees correct results for valid, full numbers (not short-codes, or invalid * numbers). * * @param number the phone number whose origin we want to know * @return the region where the phone number is from, or null if no region matches this calling * code */ public String getRegionCodeForNumber(PhoneNumber number) { int countryCode = number.getCountryCode(); List regions = countryCallingCodeToRegionCodeMap.get(countryCode); if (regions == null) { logger.log(Level.INFO, "Missing/invalid country_code (" + countryCode + ")"); return null; } if (regions.size() == 1) { return regions.get(0); } else { return getRegionCodeForNumberFromRegionList(number, regions); } } private String getRegionCodeForNumberFromRegionList(PhoneNumber number, List regionCodes) { String nationalNumber = getNationalSignificantNumber(number); for (String regionCode : regionCodes) { // If leadingDigits is present, use this. Otherwise, do full validation. // Metadata cannot be null because the region codes come from the country calling code map. PhoneMetadata metadata = getMetadataForRegion(regionCode); if (metadata.hasLeadingDigits()) { if (regexCache.getPatternForRegex(metadata.getLeadingDigits()) .matcher(nationalNumber).lookingAt()) { return regionCode; } } else if (getNumberTypeHelper(nationalNumber, metadata) != PhoneNumberType.UNKNOWN) { return regionCode; } } return null; } /** * Returns the region code that matches the specific country calling code. In the case of no * region code being found, ZZ will be returned. In the case of multiple regions, the one * designated in the metadata as the "main" region for this calling code will be returned. If the * countryCallingCode entered is valid but doesn't match a specific region (such as in the case of * non-geographical calling codes like 800) the value "001" will be returned (corresponding to * the value for World in the UN M.49 schema). */ public String getRegionCodeForCountryCode(int countryCallingCode) { List regionCodes = countryCallingCodeToRegionCodeMap.get(countryCallingCode); return regionCodes == null ? UNKNOWN_REGION : regionCodes.get(0); } /** * Returns a list with the region codes that match the specific country calling code. For * non-geographical country calling codes, the region code 001 is returned. Also, in the case * of no region code being found, an empty list is returned. */ public List getRegionCodesForCountryCode(int countryCallingCode) { List regionCodes = countryCallingCodeToRegionCodeMap.get(countryCallingCode); return Collections.unmodifiableList(regionCodes == null ? new ArrayList(0) : regionCodes); } /** * Returns the country calling code for a specific region. For example, this would be 1 for the * United States, and 64 for New Zealand. * * @param regionCode the region that we want to get the country calling code for * @return the country calling code for the region denoted by regionCode */ public int getCountryCodeForRegion(String regionCode) { if (!isValidRegionCode(regionCode)) { logger.log(Level.WARNING, "Invalid or missing region code (" + ((regionCode == null) ? "null" : regionCode) + ") provided."); return 0; } return getCountryCodeForValidRegion(regionCode); } /** * Returns the country calling code for a specific region. For example, this would be 1 for the * United States, and 64 for New Zealand. Assumes the region is already valid. * * @param regionCode the region that we want to get the country calling code for * @return the country calling code for the region denoted by regionCode * @throws IllegalArgumentException if the region is invalid */ private int getCountryCodeForValidRegion(String regionCode) { PhoneMetadata metadata = getMetadataForRegion(regionCode); if (metadata == null) { throw new IllegalArgumentException("Invalid region code: " + regionCode); } return metadata.getCountryCode(); } /** * Returns the national dialling prefix for a specific region. For example, this would be 1 for * the United States, and 0 for New Zealand. Set stripNonDigits to true to strip symbols like "~" * (which indicates a wait for a dialling tone) from the prefix returned. If no national prefix is * present, we return null. * *

Warning: Do not use this method for do-your-own formatting - for some regions, the * national dialling prefix is used only for certain types of numbers. Use the library's * formatting functions to prefix the national prefix when required. * * @param regionCode the region that we want to get the dialling prefix for * @param stripNonDigits true to strip non-digits from the national dialling prefix * @return the dialling prefix for the region denoted by regionCode */ public String getNddPrefixForRegion(String regionCode, boolean stripNonDigits) { PhoneMetadata metadata = getMetadataForRegion(regionCode); if (metadata == null) { logger.log(Level.WARNING, "Invalid or missing region code (" + ((regionCode == null) ? "null" : regionCode) + ") provided."); return null; } String nationalPrefix = metadata.getNationalPrefix(); // If no national prefix was found, we return null. if (nationalPrefix.length() == 0) { return null; } if (stripNonDigits) { // Note: if any other non-numeric symbols are ever used in national prefixes, these would have // to be removed here as well. nationalPrefix = nationalPrefix.replace("~", ""); } return nationalPrefix; } /** * Checks if this is a region under the North American Numbering Plan Administration (NANPA). * * @return true if regionCode is one of the regions under NANPA */ public boolean isNANPACountry(String regionCode) { return nanpaRegions.contains(regionCode); } /** * Checks if the number is a valid vanity (alpha) number such as 800 MICROSOFT. A valid vanity * number will start with at least 3 digits and will have three or more alpha characters. This * does not do region-specific checks - to work out if this number is actually valid for a region, * it should be parsed and methods such as {@link #isPossibleNumberWithReason} and * {@link #isValidNumber} should be used. * * @param number the number that needs to be checked * @return true if the number is a valid vanity number */ public boolean isAlphaNumber(CharSequence number) { if (!isViablePhoneNumber(number)) { // Number is too short, or doesn't match the basic phone number pattern. return false; } StringBuilder strippedNumber = new StringBuilder(number); maybeStripExtension(strippedNumber); return VALID_ALPHA_PHONE_PATTERN.matcher(strippedNumber).matches(); } /** * Convenience wrapper around {@link #isPossibleNumberWithReason}. Instead of returning the reason * for failure, this method returns true if the number is either a possible fully-qualified number * (containing the area code and country code), or if the number could be a possible local number * (with a country code, but missing an area code). Local numbers are considered possible if they * could be possibly dialled in this format: if the area code is needed for a call to connect, the * number is not considered possible without it. * * @param number the number that needs to be checked * @return true if the number is possible */ public boolean isPossibleNumber(PhoneNumber number) { ValidationResult result = isPossibleNumberWithReason(number); return result == ValidationResult.IS_POSSIBLE || result == ValidationResult.IS_POSSIBLE_LOCAL_ONLY; } /** * Convenience wrapper around {@link #isPossibleNumberForTypeWithReason}. Instead of returning the * reason for failure, this method returns true if the number is either a possible fully-qualified * number (containing the area code and country code), or if the number could be a possible local * number (with a country code, but missing an area code). Local numbers are considered possible * if they could be possibly dialled in this format: if the area code is needed for a call to * connect, the number is not considered possible without it. * * @param number the number that needs to be checked * @param type the type we are interested in * @return true if the number is possible for this particular type */ public boolean isPossibleNumberForType(PhoneNumber number, PhoneNumberType type) { ValidationResult result = isPossibleNumberForTypeWithReason(number, type); return result == ValidationResult.IS_POSSIBLE || result == ValidationResult.IS_POSSIBLE_LOCAL_ONLY; } /** * Helper method to check a number against possible lengths for this region, based on the metadata * being passed in, and determine whether it matches, or is too short or too long. */ private ValidationResult testNumberLength(CharSequence number, PhoneMetadata metadata) { return testNumberLength(number, metadata, PhoneNumberType.UNKNOWN); } /** * Helper method to check a number against possible lengths for this number type, and determine * whether it matches, or is too short or too long. */ private ValidationResult testNumberLength( CharSequence number, PhoneMetadata metadata, PhoneNumberType type) { PhoneNumberDesc descForType = getNumberDescByType(metadata, type); // There should always be "possibleLengths" set for every element. This is declared in the XML // schema which is verified by PhoneNumberMetadataSchemaTest. // For size efficiency, where a sub-description (e.g. fixed-line) has the same possibleLengths // as the parent, this is missing, so we fall back to the general desc (where no numbers of the // type exist at all, there is one possible length (-1) which is guaranteed not to match the // length of any real phone number). List possibleLengths = descForType.getPossibleLengthList().isEmpty() ? metadata.getGeneralDesc().getPossibleLengthList() : descForType.getPossibleLengthList(); List localLengths = descForType.getPossibleLengthLocalOnlyList(); if (type == PhoneNumberType.FIXED_LINE_OR_MOBILE) { if (!descHasPossibleNumberData(getNumberDescByType(metadata, PhoneNumberType.FIXED_LINE))) { // The rare case has been encountered where no fixedLine data is available (true for some // non-geographical entities), so we just check mobile. return testNumberLength(number, metadata, PhoneNumberType.MOBILE); } else { PhoneNumberDesc mobileDesc = getNumberDescByType(metadata, PhoneNumberType.MOBILE); if (descHasPossibleNumberData(mobileDesc)) { // Merge the mobile data in if there was any. We have to make a copy to do this. possibleLengths = new ArrayList(possibleLengths); // Note that when adding the possible lengths from mobile, we have to again check they // aren't empty since if they are this indicates they are the same as the general desc and // should be obtained from there. possibleLengths.addAll(mobileDesc.getPossibleLengthCount() == 0 ? metadata.getGeneralDesc().getPossibleLengthList() : mobileDesc.getPossibleLengthList()); // The current list is sorted; we need to merge in the new list and re-sort (duplicates // are okay). Sorting isn't so expensive because the lists are very small. Collections.sort(possibleLengths); if (localLengths.isEmpty()) { localLengths = mobileDesc.getPossibleLengthLocalOnlyList(); } else { localLengths = new ArrayList(localLengths); localLengths.addAll(mobileDesc.getPossibleLengthLocalOnlyList()); Collections.sort(localLengths); } } } } // If the type is not supported at all (indicated by the possible lengths containing -1 at this // point) we return invalid length. if (possibleLengths.get(0) == -1) { return ValidationResult.INVALID_LENGTH; } int actualLength = number.length(); // This is safe because there is never an overlap beween the possible lengths and the local-only // lengths; this is checked at build time. if (localLengths.contains(actualLength)) { return ValidationResult.IS_POSSIBLE_LOCAL_ONLY; } int minimumLength = possibleLengths.get(0); if (minimumLength == actualLength) { return ValidationResult.IS_POSSIBLE; } else if (minimumLength > actualLength) { return ValidationResult.TOO_SHORT; } else if (possibleLengths.get(possibleLengths.size() - 1) < actualLength) { return ValidationResult.TOO_LONG; } // We skip the first element; we've already checked it. return possibleLengths.subList(1, possibleLengths.size()).contains(actualLength) ? ValidationResult.IS_POSSIBLE : ValidationResult.INVALID_LENGTH; } /** * Check whether a phone number is a possible number. It provides a more lenient check than * {@link #isValidNumber} in the following sense: *

    *
  1. It only checks the length of phone numbers. In particular, it doesn't check starting * digits of the number. *
  2. It doesn't attempt to figure out the type of the number, but uses general rules which * applies to all types of phone numbers in a region. Therefore, it is much faster than * isValidNumber. *
  3. For some numbers (particularly fixed-line), many regions have the concept of area code, * which together with subscriber number constitute the national significant number. It is * sometimes okay to dial only the subscriber number when dialing in the same area. This * function will return IS_POSSIBLE_LOCAL_ONLY if the subscriber-number-only version is * passed in. On the other hand, because isValidNumber validates using information on both * starting digits (for fixed line numbers, that would most likely be area codes) and * length (obviously includes the length of area codes for fixed line numbers), it will * return false for the subscriber-number-only version. *
* @param number the number that needs to be checked * @return a ValidationResult object which indicates whether the number is possible */ public ValidationResult isPossibleNumberWithReason(PhoneNumber number) { return isPossibleNumberForTypeWithReason(number, PhoneNumberType.UNKNOWN); } /** * Check whether a phone number is a possible number of a particular type. For types that don't * exist in a particular region, this will return a result that isn't so useful; it is recommended * that you use {@link #getSupportedTypesForRegion} or {@link #getSupportedTypesForNonGeoEntity} * respectively before calling this method to determine whether you should call it for this number * at all. * * This provides a more lenient check than {@link #isValidNumber} in the following sense: * *
    *
  1. It only checks the length of phone numbers. In particular, it doesn't check starting * digits of the number. *
  2. For some numbers (particularly fixed-line), many regions have the concept of area code, * which together with subscriber number constitute the national significant number. It is * sometimes okay to dial only the subscriber number when dialing in the same area. This * function will return IS_POSSIBLE_LOCAL_ONLY if the subscriber-number-only version is * passed in. On the other hand, because isValidNumber validates using information on both * starting digits (for fixed line numbers, that would most likely be area codes) and * length (obviously includes the length of area codes for fixed line numbers), it will * return false for the subscriber-number-only version. *
* * @param number the number that needs to be checked * @param type the type we are interested in * @return a ValidationResult object which indicates whether the number is possible */ public ValidationResult isPossibleNumberForTypeWithReason( PhoneNumber number, PhoneNumberType type) { String nationalNumber = getNationalSignificantNumber(number); int countryCode = number.getCountryCode(); // Note: For regions that share a country calling code, like NANPA numbers, we just use the // rules from the default region (US in this case) since the getRegionCodeForNumber will not // work if the number is possible but not valid. There is in fact one country calling code (290) // where the possible number pattern differs between various regions (Saint Helena and Tristan // da Cuñha), but this is handled by putting all possible lengths for any country with this // country calling code in the metadata for the default region in this case. if (!hasValidCountryCallingCode(countryCode)) { return ValidationResult.INVALID_COUNTRY_CODE; } String regionCode = getRegionCodeForCountryCode(countryCode); // Metadata cannot be null because the country calling code is valid. PhoneMetadata metadata = getMetadataForRegionOrCallingCode(countryCode, regionCode); return testNumberLength(nationalNumber, metadata, type); } /** * Check whether a phone number is a possible number given a number in the form of a string, and * the region where the number could be dialed from. It provides a more lenient check than * {@link #isValidNumber}. See {@link #isPossibleNumber(PhoneNumber)} for details. * *

This method first parses the number, then invokes {@link #isPossibleNumber(PhoneNumber)} * with the resultant PhoneNumber object. * * @param number the number that needs to be checked * @param regionDialingFrom the region that we are expecting the number to be dialed from. * Note this is different from the region where the number belongs. For example, the number * +1 650 253 0000 is a number that belongs to US. When written in this form, it can be * dialed from any region. When it is written as 00 1 650 253 0000, it can be dialed from any * region which uses an international dialling prefix of 00. When it is written as * 650 253 0000, it can only be dialed from within the US, and when written as 253 0000, it * can only be dialed from within a smaller area in the US (Mountain View, CA, to be more * specific). * @return true if the number is possible */ public boolean isPossibleNumber(CharSequence number, String regionDialingFrom) { try { return isPossibleNumber(parse(number, regionDialingFrom)); } catch (NumberParseException e) { return false; } } /** * Attempts to extract a valid number from a phone number that is too long to be valid, and resets * the PhoneNumber object passed in to that valid version. If no valid number could be extracted, * the PhoneNumber object passed in will not be modified. * @param number a PhoneNumber object which contains a number that is too long to be valid * @return true if a valid phone number can be successfully extracted */ public boolean truncateTooLongNumber(PhoneNumber number) { if (isValidNumber(number)) { return true; } PhoneNumber numberCopy = new PhoneNumber(); numberCopy.mergeFrom(number); long nationalNumber = number.getNationalNumber(); do { nationalNumber /= 10; numberCopy.setNationalNumber(nationalNumber); if (isPossibleNumberWithReason(numberCopy) == ValidationResult.TOO_SHORT || nationalNumber == 0) { return false; } } while (!isValidNumber(numberCopy)); number.setNationalNumber(nationalNumber); return true; } /** * Gets an {@link com.google.i18n.phonenumbers.AsYouTypeFormatter} for the specific region. * * @param regionCode the region where the phone number is being entered * @return an {@link com.google.i18n.phonenumbers.AsYouTypeFormatter} object, which can be used * to format phone numbers in the specific region "as you type" */ public AsYouTypeFormatter getAsYouTypeFormatter(String regionCode) { return new AsYouTypeFormatter(regionCode); } // Extracts country calling code from fullNumber, returns it and places the remaining number in // nationalNumber. It assumes that the leading plus sign or IDD has already been removed. Returns // 0 if fullNumber doesn't start with a valid country calling code, and leaves nationalNumber // unmodified. int extractCountryCode(StringBuilder fullNumber, StringBuilder nationalNumber) { if ((fullNumber.length() == 0) || (fullNumber.charAt(0) == '0')) { // Country codes do not begin with a '0'. return 0; } int potentialCountryCode; int numberLength = fullNumber.length(); for (int i = 1; i <= MAX_LENGTH_COUNTRY_CODE && i <= numberLength; i++) { potentialCountryCode = Integer.parseInt(fullNumber.substring(0, i)); if (countryCallingCodeToRegionCodeMap.containsKey(potentialCountryCode)) { nationalNumber.append(fullNumber.substring(i)); return potentialCountryCode; } } return 0; } /** * Tries to extract a country calling code from a number. This method will return zero if no * country calling code is considered to be present. Country calling codes are extracted in the * following ways: *

    *
  • by stripping the international dialing prefix of the region the person is dialing from, * if this is present in the number, and looking at the next digits *
  • by stripping the '+' sign if present and then looking at the next digits *
  • by comparing the start of the number and the country calling code of the default region. * If the number is not considered possible for the numbering plan of the default region * initially, but starts with the country calling code of this region, validation will be * reattempted after stripping this country calling code. If this number is considered a * possible number, then the first digits will be considered the country calling code and * removed as such. *
* It will throw a NumberParseException if the number starts with a '+' but the country calling * code supplied after this does not match that of any known region. * * @param number non-normalized telephone number that we wish to extract a country calling * code from - may begin with '+' * @param defaultRegionMetadata metadata about the region this number may be from * @param nationalNumber a string buffer to store the national significant number in, in the case * that a country calling code was extracted. The number is appended to any existing contents. * If no country calling code was extracted, this will be left unchanged. * @param keepRawInput true if the country_code_source and preferred_carrier_code fields of * phoneNumber should be populated. * @param phoneNumber the PhoneNumber object where the country_code and country_code_source need * to be populated. Note the country_code is always populated, whereas country_code_source is * only populated when keepCountryCodeSource is true. * @return the country calling code extracted or 0 if none could be extracted */ // @VisibleForTesting int maybeExtractCountryCode(CharSequence number, PhoneMetadata defaultRegionMetadata, StringBuilder nationalNumber, boolean keepRawInput, PhoneNumber phoneNumber) throws NumberParseException { if (number.length() == 0) { return 0; } StringBuilder fullNumber = new StringBuilder(number); // Set the default prefix to be something that will never match. String possibleCountryIddPrefix = "NonMatch"; if (defaultRegionMetadata != null) { possibleCountryIddPrefix = defaultRegionMetadata.getInternationalPrefix(); } CountryCodeSource countryCodeSource = maybeStripInternationalPrefixAndNormalize(fullNumber, possibleCountryIddPrefix); if (keepRawInput) { phoneNumber.setCountryCodeSource(countryCodeSource); } if (countryCodeSource != CountryCodeSource.FROM_DEFAULT_COUNTRY) { if (fullNumber.length() <= MIN_LENGTH_FOR_NSN) { throw new NumberParseException(NumberParseException.ErrorType.TOO_SHORT_AFTER_IDD, "Phone number had an IDD, but after this was not " + "long enough to be a viable phone number."); } int potentialCountryCode = extractCountryCode(fullNumber, nationalNumber); if (potentialCountryCode != 0) { phoneNumber.setCountryCode(potentialCountryCode); return potentialCountryCode; } // If this fails, they must be using a strange country calling code that we don't recognize, // or that doesn't exist. throw new NumberParseException(NumberParseException.ErrorType.INVALID_COUNTRY_CODE, "Country calling code supplied was not recognised."); } else if (defaultRegionMetadata != null) { // Check to see if the number starts with the country calling code for the default region. If // so, we remove the country calling code, and do some checks on the validity of the number // before and after. int defaultCountryCode = defaultRegionMetadata.getCountryCode(); String defaultCountryCodeString = String.valueOf(defaultCountryCode); String normalizedNumber = fullNumber.toString(); if (normalizedNumber.startsWith(defaultCountryCodeString)) { StringBuilder potentialNationalNumber = new StringBuilder(normalizedNumber.substring(defaultCountryCodeString.length())); PhoneNumberDesc generalDesc = defaultRegionMetadata.getGeneralDesc(); maybeStripNationalPrefixAndCarrierCode( potentialNationalNumber, defaultRegionMetadata, null /* Don't need the carrier code */); // If the number was not valid before but is valid now, or if it was too long before, we // consider the number with the country calling code stripped to be a better result and // keep that instead. if ((!matcherApi.matchNationalNumber(fullNumber, generalDesc, false) && matcherApi.matchNationalNumber(potentialNationalNumber, generalDesc, false)) || testNumberLength(fullNumber, defaultRegionMetadata) == ValidationResult.TOO_LONG) { nationalNumber.append(potentialNationalNumber); if (keepRawInput) { phoneNumber.setCountryCodeSource(CountryCodeSource.FROM_NUMBER_WITHOUT_PLUS_SIGN); } phoneNumber.setCountryCode(defaultCountryCode); return defaultCountryCode; } } } // No country calling code present. phoneNumber.setCountryCode(0); return 0; } /** * Strips the IDD from the start of the number if present. Helper function used by * maybeStripInternationalPrefixAndNormalize. */ private boolean parsePrefixAsIdd(Pattern iddPattern, StringBuilder number) { Matcher m = iddPattern.matcher(number); if (m.lookingAt()) { int matchEnd = m.end(); // Only strip this if the first digit after the match is not a 0, since country calling codes // cannot begin with 0. Matcher digitMatcher = CAPTURING_DIGIT_PATTERN.matcher(number.substring(matchEnd)); if (digitMatcher.find()) { String normalizedGroup = normalizeDigitsOnly(digitMatcher.group(1)); if (normalizedGroup.equals("0")) { return false; } } number.delete(0, matchEnd); return true; } return false; } /** * Strips any international prefix (such as +, 00, 011) present in the number provided, normalizes * the resulting number, and indicates if an international prefix was present. * * @param number the non-normalized telephone number that we wish to strip any international * dialing prefix from * @param possibleIddPrefix the international direct dialing prefix from the region we * think this number may be dialed in * @return the corresponding CountryCodeSource if an international dialing prefix could be * removed from the number, otherwise CountryCodeSource.FROM_DEFAULT_COUNTRY if the number did * not seem to be in international format */ // @VisibleForTesting CountryCodeSource maybeStripInternationalPrefixAndNormalize( StringBuilder number, String possibleIddPrefix) { if (number.length() == 0) { return CountryCodeSource.FROM_DEFAULT_COUNTRY; } // Check to see if the number begins with one or more plus signs. Matcher m = PLUS_CHARS_PATTERN.matcher(number); if (m.lookingAt()) { number.delete(0, m.end()); // Can now normalize the rest of the number since we've consumed the "+" sign at the start. normalize(number); return CountryCodeSource.FROM_NUMBER_WITH_PLUS_SIGN; } // Attempt to parse the first digits as an international prefix. Pattern iddPattern = regexCache.getPatternForRegex(possibleIddPrefix); normalize(number); return parsePrefixAsIdd(iddPattern, number) ? CountryCodeSource.FROM_NUMBER_WITH_IDD : CountryCodeSource.FROM_DEFAULT_COUNTRY; } /** * Strips any national prefix (such as 0, 1) present in the number provided. * * @param number the normalized telephone number that we wish to strip any national * dialing prefix from * @param metadata the metadata for the region that we think this number is from * @param carrierCode a place to insert the carrier code if one is extracted * @return true if a national prefix or carrier code (or both) could be extracted */ // @VisibleForTesting boolean maybeStripNationalPrefixAndCarrierCode( StringBuilder number, PhoneMetadata metadata, StringBuilder carrierCode) { int numberLength = number.length(); String possibleNationalPrefix = metadata.getNationalPrefixForParsing(); if (numberLength == 0 || possibleNationalPrefix.length() == 0) { // Early return for numbers of zero length. return false; } // Attempt to parse the first digits as a national prefix. Matcher prefixMatcher = regexCache.getPatternForRegex(possibleNationalPrefix).matcher(number); if (prefixMatcher.lookingAt()) { PhoneNumberDesc generalDesc = metadata.getGeneralDesc(); // Check if the original number is viable. boolean isViableOriginalNumber = matcherApi.matchNationalNumber(number, generalDesc, false); // prefixMatcher.group(numOfGroups) == null implies nothing was captured by the capturing // groups in possibleNationalPrefix; therefore, no transformation is necessary, and we just // remove the national prefix. int numOfGroups = prefixMatcher.groupCount(); String transformRule = metadata.getNationalPrefixTransformRule(); if (transformRule == null || transformRule.length() == 0 || prefixMatcher.group(numOfGroups) == null) { // If the original number was viable, and the resultant number is not, we return. if (isViableOriginalNumber && !matcherApi.matchNationalNumber( number.substring(prefixMatcher.end()), generalDesc, false)) { return false; } if (carrierCode != null && numOfGroups > 0 && prefixMatcher.group(numOfGroups) != null) { carrierCode.append(prefixMatcher.group(1)); } number.delete(0, prefixMatcher.end()); return true; } else { // Check that the resultant number is still viable. If not, return. Check this by copying // the string buffer and making the transformation on the copy first. StringBuilder transformedNumber = new StringBuilder(number); transformedNumber.replace(0, numberLength, prefixMatcher.replaceFirst(transformRule)); if (isViableOriginalNumber && !matcherApi.matchNationalNumber(transformedNumber.toString(), generalDesc, false)) { return false; } if (carrierCode != null && numOfGroups > 1) { carrierCode.append(prefixMatcher.group(1)); } number.replace(0, number.length(), transformedNumber.toString()); return true; } } return false; } /** * Strips any extension (as in, the part of the number dialled after the call is connected, * usually indicated with extn, ext, x or similar) from the end of the number, and returns it. * * @param number the non-normalized telephone number that we wish to strip the extension from * @return the phone extension */ // @VisibleForTesting String maybeStripExtension(StringBuilder number) { Matcher m = EXTN_PATTERN.matcher(number); // If we find a potential extension, and the number preceding this is a viable number, we assume // it is an extension. if (m.find() && isViablePhoneNumber(number.substring(0, m.start()))) { // The numbers are captured into groups in the regular expression. for (int i = 1, length = m.groupCount(); i <= length; i++) { if (m.group(i) != null) { // We go through the capturing groups until we find one that captured some digits. If none // did, then we will return the empty string. String extension = m.group(i); number.delete(m.start(), number.length()); return extension; } } } return ""; } /** * Checks to see that the region code used is valid, or if it is not valid, that the number to * parse starts with a + symbol so that we can attempt to infer the region from the number. * Returns false if it cannot use the region provided and the region cannot be inferred. */ private boolean checkRegionForParsing(CharSequence numberToParse, String defaultRegion) { if (!isValidRegionCode(defaultRegion)) { // If the number is null or empty, we can't infer the region. if ((numberToParse == null) || (numberToParse.length() == 0) || !PLUS_CHARS_PATTERN.matcher(numberToParse).lookingAt()) { return false; } } return true; } /** * Parses a string and returns it as a phone number in proto buffer format. The method is quite * lenient and looks for a number in the input text (raw input) and does not check whether the * string is definitely only a phone number. To do this, it ignores punctuation and white-space, * as well as any text before the number (e.g. a leading "Tel: ") and trims the non-number bits. * It will accept a number in any format (E164, national, international etc), assuming it can be * interpreted with the defaultRegion supplied. It also attempts to convert any alpha characters * into digits if it thinks this is a vanity number of the type "1800 MICROSOFT". * *

This method will throw a {@link com.google.i18n.phonenumbers.NumberParseException} if the * number is not considered to be a possible number. Note that validation of whether the number * is actually a valid number for a particular region is not performed. This can be done * separately with {@link #isValidNumber}. * *

Note this method canonicalizes the phone number such that different representations can be * easily compared, no matter what form it was originally entered in (e.g. national, * international). If you want to record context about the number being parsed, such as the raw * input that was entered, how the country code was derived etc. then call {@link * #parseAndKeepRawInput} instead. * * @param numberToParse number that we are attempting to parse. This can contain formatting such * as +, ( and -, as well as a phone number extension. It can also be provided in RFC3966 * format. * @param defaultRegion region that we are expecting the number to be from. This is only used if * the number being parsed is not written in international format. The country_code for the * number in this case would be stored as that of the default region supplied. If the number * is guaranteed to start with a '+' followed by the country calling code, then RegionCode.ZZ * or null can be supplied. * @return a phone number proto buffer filled with the parsed number * @throws NumberParseException if the string is not considered to be a viable phone number (e.g. * too few or too many digits) or if no default region was supplied and the number is not in * international format (does not start with +) */ public PhoneNumber parse(CharSequence numberToParse, String defaultRegion) throws NumberParseException { PhoneNumber phoneNumber = new PhoneNumber(); parse(numberToParse, defaultRegion, phoneNumber); return phoneNumber; } /** * Same as {@link #parse(CharSequence, String)}, but accepts mutable PhoneNumber as a * parameter to decrease object creation when invoked many times. */ public void parse(CharSequence numberToParse, String defaultRegion, PhoneNumber phoneNumber) throws NumberParseException { parseHelper(numberToParse, defaultRegion, false, true, phoneNumber); } /** * Parses a string and returns it in proto buffer format. This method differs from {@link #parse} * in that it always populates the raw_input field of the protocol buffer with numberToParse as * well as the country_code_source field. * * @param numberToParse number that we are attempting to parse. This can contain formatting such * as +, ( and -, as well as a phone number extension. * @param defaultRegion region that we are expecting the number to be from. This is only used if * the number being parsed is not written in international format. The country calling code * for the number in this case would be stored as that of the default region supplied. * @return a phone number proto buffer filled with the parsed number * @throws NumberParseException if the string is not considered to be a viable phone number or if * no default region was supplied */ public PhoneNumber parseAndKeepRawInput(CharSequence numberToParse, String defaultRegion) throws NumberParseException { PhoneNumber phoneNumber = new PhoneNumber(); parseAndKeepRawInput(numberToParse, defaultRegion, phoneNumber); return phoneNumber; } /** * Same as{@link #parseAndKeepRawInput(CharSequence, String)}, but accepts a mutable * PhoneNumber as a parameter to decrease object creation when invoked many times. */ public void parseAndKeepRawInput(CharSequence numberToParse, String defaultRegion, PhoneNumber phoneNumber) throws NumberParseException { parseHelper(numberToParse, defaultRegion, true, true, phoneNumber); } /** * Returns an iterable over all {@link PhoneNumberMatch PhoneNumberMatches} in {@code text}. This * is a shortcut for {@link #findNumbers(CharSequence, String, Leniency, long) * getMatcher(text, defaultRegion, Leniency.VALID, Long.MAX_VALUE)}. * * @param text the text to search for phone numbers, null for no text * @param defaultRegion region that we are expecting the number to be from. This is only used if * the number being parsed is not written in international format. The country_code for the * number in this case would be stored as that of the default region supplied. May be null if * only international numbers are expected. */ public Iterable findNumbers(CharSequence text, String defaultRegion) { return findNumbers(text, defaultRegion, Leniency.VALID, Long.MAX_VALUE); } /** * Returns an iterable over all {@link PhoneNumberMatch PhoneNumberMatches} in {@code text}. * * @param text the text to search for phone numbers, null for no text * @param defaultRegion region that we are expecting the number to be from. This is only used if * the number being parsed is not written in international format. The country_code for the * number in this case would be stored as that of the default region supplied. May be null if * only international numbers are expected. * @param leniency the leniency to use when evaluating candidate phone numbers * @param maxTries the maximum number of invalid numbers to try before giving up on the text. * This is to cover degenerate cases where the text has a lot of false positives in it. Must * be {@code >= 0}. */ public Iterable findNumbers( final CharSequence text, final String defaultRegion, final Leniency leniency, final long maxTries) { return new Iterable() { @Override public Iterator iterator() { return new PhoneNumberMatcher( PhoneNumberUtil.this, text, defaultRegion, leniency, maxTries); } }; } /** * A helper function to set the values related to leading zeros in a PhoneNumber. */ static void setItalianLeadingZerosForPhoneNumber(CharSequence nationalNumber, PhoneNumber phoneNumber) { if (nationalNumber.length() > 1 && nationalNumber.charAt(0) == '0') { phoneNumber.setItalianLeadingZero(true); int numberOfLeadingZeros = 1; // Note that if the national number is all "0"s, the last "0" is not counted as a leading // zero. while (numberOfLeadingZeros < nationalNumber.length() - 1 && nationalNumber.charAt(numberOfLeadingZeros) == '0') { numberOfLeadingZeros++; } if (numberOfLeadingZeros != 1) { phoneNumber.setNumberOfLeadingZeros(numberOfLeadingZeros); } } } /** * Parses a string and fills up the phoneNumber. This method is the same as the public * parse() method, with the exception that it allows the default region to be null, for use by * isNumberMatch(). checkRegion should be set to false if it is permitted for the default region * to be null or unknown ("ZZ"). * * Note if any new field is added to this method that should always be filled in, even when * keepRawInput is false, it should also be handled in the copyCoreFieldsOnly() method. */ private void parseHelper(CharSequence numberToParse, String defaultRegion, boolean keepRawInput, boolean checkRegion, PhoneNumber phoneNumber) throws NumberParseException { if (numberToParse == null) { throw new NumberParseException(NumberParseException.ErrorType.NOT_A_NUMBER, "The phone number supplied was null."); } else if (numberToParse.length() > MAX_INPUT_STRING_LENGTH) { throw new NumberParseException(NumberParseException.ErrorType.TOO_LONG, "The string supplied was too long to parse."); } StringBuilder nationalNumber = new StringBuilder(); String numberBeingParsed = numberToParse.toString(); buildNationalNumberForParsing(numberBeingParsed, nationalNumber); if (!isViablePhoneNumber(nationalNumber)) { throw new NumberParseException(NumberParseException.ErrorType.NOT_A_NUMBER, "The string supplied did not seem to be a phone number."); } // Check the region supplied is valid, or that the extracted number starts with some sort of + // sign so the number's region can be determined. if (checkRegion && !checkRegionForParsing(nationalNumber, defaultRegion)) { throw new NumberParseException(NumberParseException.ErrorType.INVALID_COUNTRY_CODE, "Missing or invalid default region."); } if (keepRawInput) { phoneNumber.setRawInput(numberBeingParsed); } // Attempt to parse extension first, since it doesn't require region-specific data and we want // to have the non-normalised number here. String extension = maybeStripExtension(nationalNumber); if (extension.length() > 0) { phoneNumber.setExtension(extension); } PhoneMetadata regionMetadata = getMetadataForRegion(defaultRegion); // Check to see if the number is given in international format so we know whether this number is // from the default region or not. StringBuilder normalizedNationalNumber = new StringBuilder(); int countryCode = 0; try { // TODO: This method should really just take in the string buffer that has already // been created, and just remove the prefix, rather than taking in a string and then // outputting a string buffer. countryCode = maybeExtractCountryCode(nationalNumber, regionMetadata, normalizedNationalNumber, keepRawInput, phoneNumber); } catch (NumberParseException e) { Matcher matcher = PLUS_CHARS_PATTERN.matcher(nationalNumber); if (e.getErrorType() == NumberParseException.ErrorType.INVALID_COUNTRY_CODE && matcher.lookingAt()) { // Strip the plus-char, and try again. countryCode = maybeExtractCountryCode(nationalNumber.substring(matcher.end()), regionMetadata, normalizedNationalNumber, keepRawInput, phoneNumber); if (countryCode == 0) { throw new NumberParseException(NumberParseException.ErrorType.INVALID_COUNTRY_CODE, "Could not interpret numbers after plus-sign."); } } else { throw new NumberParseException(e.getErrorType(), e.getMessage()); } } if (countryCode != 0) { String phoneNumberRegion = getRegionCodeForCountryCode(countryCode); if (!phoneNumberRegion.equals(defaultRegion)) { // Metadata cannot be null because the country calling code is valid. regionMetadata = getMetadataForRegionOrCallingCode(countryCode, phoneNumberRegion); } } else { // If no extracted country calling code, use the region supplied instead. The national number // is just the normalized version of the number we were given to parse. normalizedNationalNumber.append(normalize(nationalNumber)); if (defaultRegion != null) { countryCode = regionMetadata.getCountryCode(); phoneNumber.setCountryCode(countryCode); } else if (keepRawInput) { phoneNumber.clearCountryCodeSource(); } } if (normalizedNationalNumber.length() < MIN_LENGTH_FOR_NSN) { throw new NumberParseException(NumberParseException.ErrorType.TOO_SHORT_NSN, "The string supplied is too short to be a phone number."); } if (regionMetadata != null) { StringBuilder carrierCode = new StringBuilder(); StringBuilder potentialNationalNumber = new StringBuilder(normalizedNationalNumber); maybeStripNationalPrefixAndCarrierCode(potentialNationalNumber, regionMetadata, carrierCode); // We require that the NSN remaining after stripping the national prefix and carrier code be // long enough to be a possible length for the region. Otherwise, we don't do the stripping, // since the original number could be a valid short number. ValidationResult validationResult = testNumberLength(potentialNationalNumber, regionMetadata); if (validationResult != ValidationResult.TOO_SHORT && validationResult != ValidationResult.IS_POSSIBLE_LOCAL_ONLY && validationResult != ValidationResult.INVALID_LENGTH) { normalizedNationalNumber = potentialNationalNumber; if (keepRawInput && carrierCode.length() > 0) { phoneNumber.setPreferredDomesticCarrierCode(carrierCode.toString()); } } } int lengthOfNationalNumber = normalizedNationalNumber.length(); if (lengthOfNationalNumber < MIN_LENGTH_FOR_NSN) { throw new NumberParseException(NumberParseException.ErrorType.TOO_SHORT_NSN, "The string supplied is too short to be a phone number."); } if (lengthOfNationalNumber > MAX_LENGTH_FOR_NSN) { throw new NumberParseException(NumberParseException.ErrorType.TOO_LONG, "The string supplied is too long to be a phone number."); } setItalianLeadingZerosForPhoneNumber(normalizedNationalNumber, phoneNumber); phoneNumber.setNationalNumber(Long.parseLong(normalizedNationalNumber.toString())); } /** * Converts numberToParse to a form that we can parse and write it to nationalNumber if it is * written in RFC3966; otherwise extract a possible number out of it and write to nationalNumber. */ private void buildNationalNumberForParsing(String numberToParse, StringBuilder nationalNumber) { int indexOfPhoneContext = numberToParse.indexOf(RFC3966_PHONE_CONTEXT); if (indexOfPhoneContext >= 0) { int phoneContextStart = indexOfPhoneContext + RFC3966_PHONE_CONTEXT.length(); // If the phone context contains a phone number prefix, we need to capture it, whereas domains // will be ignored. if (phoneContextStart < (numberToParse.length() - 1) && numberToParse.charAt(phoneContextStart) == PLUS_SIGN) { // Additional parameters might follow the phone context. If so, we will remove them here // because the parameters after phone context are not important for parsing the // phone number. int phoneContextEnd = numberToParse.indexOf(';', phoneContextStart); if (phoneContextEnd > 0) { nationalNumber.append(numberToParse.substring(phoneContextStart, phoneContextEnd)); } else { nationalNumber.append(numberToParse.substring(phoneContextStart)); } } // Now append everything between the "tel:" prefix and the phone-context. This should include // the national number, an optional extension or isdn-subaddress component. Note we also // handle the case when "tel:" is missing, as we have seen in some of the phone number inputs. // In that case, we append everything from the beginning. int indexOfRfc3966Prefix = numberToParse.indexOf(RFC3966_PREFIX); int indexOfNationalNumber = (indexOfRfc3966Prefix >= 0) ? indexOfRfc3966Prefix + RFC3966_PREFIX.length() : 0; nationalNumber.append(numberToParse.substring(indexOfNationalNumber, indexOfPhoneContext)); } else { // Extract a possible number from the string passed in (this strips leading characters that // could not be the start of a phone number.) nationalNumber.append(extractPossibleNumber(numberToParse)); } // Delete the isdn-subaddress and everything after it if it is present. Note extension won't // appear at the same time with isdn-subaddress according to paragraph 5.3 of the RFC3966 spec, int indexOfIsdn = nationalNumber.indexOf(RFC3966_ISDN_SUBADDRESS); if (indexOfIsdn > 0) { nationalNumber.delete(indexOfIsdn, nationalNumber.length()); } // If both phone context and isdn-subaddress are absent but other parameters are present, the // parameters are left in nationalNumber. This is because we are concerned about deleting // content from a potential number string when there is no strong evidence that the number is // actually written in RFC3966. } /** * Returns a new phone number containing only the fields needed to uniquely identify a phone * number, rather than any fields that capture the context in which the phone number was created. * These fields correspond to those set in parse() rather than parseAndKeepRawInput(). */ private static PhoneNumber copyCoreFieldsOnly(PhoneNumber phoneNumberIn) { PhoneNumber phoneNumber = new PhoneNumber(); phoneNumber.setCountryCode(phoneNumberIn.getCountryCode()); phoneNumber.setNationalNumber(phoneNumberIn.getNationalNumber()); if (phoneNumberIn.getExtension().length() > 0) { phoneNumber.setExtension(phoneNumberIn.getExtension()); } if (phoneNumberIn.isItalianLeadingZero()) { phoneNumber.setItalianLeadingZero(true); // This field is only relevant if there are leading zeros at all. phoneNumber.setNumberOfLeadingZeros(phoneNumberIn.getNumberOfLeadingZeros()); } return phoneNumber; } /** * Takes two phone numbers and compares them for equality. * *

Returns EXACT_MATCH if the country_code, NSN, presence of a leading zero for Italian numbers * and any extension present are the same. * Returns NSN_MATCH if either or both has no region specified, and the NSNs and extensions are * the same. * Returns SHORT_NSN_MATCH if either or both has no region specified, or the region specified is * the same, and one NSN could be a shorter version of the other number. This includes the case * where one has an extension specified, and the other does not. * Returns NO_MATCH otherwise. * For example, the numbers +1 345 657 1234 and 657 1234 are a SHORT_NSN_MATCH. * The numbers +1 345 657 1234 and 345 657 are a NO_MATCH. * * @param firstNumberIn first number to compare * @param secondNumberIn second number to compare * * @return NO_MATCH, SHORT_NSN_MATCH, NSN_MATCH or EXACT_MATCH depending on the level of equality * of the two numbers, described in the method definition. */ public MatchType isNumberMatch(PhoneNumber firstNumberIn, PhoneNumber secondNumberIn) { // We only care about the fields that uniquely define a number, so we copy these across // explicitly. PhoneNumber firstNumber = copyCoreFieldsOnly(firstNumberIn); PhoneNumber secondNumber = copyCoreFieldsOnly(secondNumberIn); // Early exit if both had extensions and these are different. if (firstNumber.hasExtension() && secondNumber.hasExtension() && !firstNumber.getExtension().equals(secondNumber.getExtension())) { return MatchType.NO_MATCH; } int firstNumberCountryCode = firstNumber.getCountryCode(); int secondNumberCountryCode = secondNumber.getCountryCode(); // Both had country_code specified. if (firstNumberCountryCode != 0 && secondNumberCountryCode != 0) { if (firstNumber.exactlySameAs(secondNumber)) { return MatchType.EXACT_MATCH; } else if (firstNumberCountryCode == secondNumberCountryCode && isNationalNumberSuffixOfTheOther(firstNumber, secondNumber)) { // A SHORT_NSN_MATCH occurs if there is a difference because of the presence or absence of // an 'Italian leading zero', the presence or absence of an extension, or one NSN being a // shorter variant of the other. return MatchType.SHORT_NSN_MATCH; } // This is not a match. return MatchType.NO_MATCH; } // Checks cases where one or both country_code fields were not specified. To make equality // checks easier, we first set the country_code fields to be equal. firstNumber.setCountryCode(secondNumberCountryCode); // If all else was the same, then this is an NSN_MATCH. if (firstNumber.exactlySameAs(secondNumber)) { return MatchType.NSN_MATCH; } if (isNationalNumberSuffixOfTheOther(firstNumber, secondNumber)) { return MatchType.SHORT_NSN_MATCH; } return MatchType.NO_MATCH; } // Returns true when one national number is the suffix of the other or both are the same. private boolean isNationalNumberSuffixOfTheOther(PhoneNumber firstNumber, PhoneNumber secondNumber) { String firstNumberNationalNumber = String.valueOf(firstNumber.getNationalNumber()); String secondNumberNationalNumber = String.valueOf(secondNumber.getNationalNumber()); // Note that endsWith returns true if the numbers are equal. return firstNumberNationalNumber.endsWith(secondNumberNationalNumber) || secondNumberNationalNumber.endsWith(firstNumberNationalNumber); } /** * Takes two phone numbers as strings and compares them for equality. This is a convenience * wrapper for {@link #isNumberMatch(PhoneNumber, PhoneNumber)}. No default region is known. * * @param firstNumber first number to compare. Can contain formatting, and can have country * calling code specified with + at the start. * @param secondNumber second number to compare. Can contain formatting, and can have country * calling code specified with + at the start. * @return NOT_A_NUMBER, NO_MATCH, SHORT_NSN_MATCH, NSN_MATCH, EXACT_MATCH. See * {@link #isNumberMatch(PhoneNumber, PhoneNumber)} for more details. */ public MatchType isNumberMatch(CharSequence firstNumber, CharSequence secondNumber) { try { PhoneNumber firstNumberAsProto = parse(firstNumber, UNKNOWN_REGION); return isNumberMatch(firstNumberAsProto, secondNumber); } catch (NumberParseException e) { if (e.getErrorType() == NumberParseException.ErrorType.INVALID_COUNTRY_CODE) { try { PhoneNumber secondNumberAsProto = parse(secondNumber, UNKNOWN_REGION); return isNumberMatch(secondNumberAsProto, firstNumber); } catch (NumberParseException e2) { if (e2.getErrorType() == NumberParseException.ErrorType.INVALID_COUNTRY_CODE) { try { PhoneNumber firstNumberProto = new PhoneNumber(); PhoneNumber secondNumberProto = new PhoneNumber(); parseHelper(firstNumber, null, false, false, firstNumberProto); parseHelper(secondNumber, null, false, false, secondNumberProto); return isNumberMatch(firstNumberProto, secondNumberProto); } catch (NumberParseException e3) { // Fall through and return MatchType.NOT_A_NUMBER. } } } } } // One or more of the phone numbers we are trying to match is not a viable phone number. return MatchType.NOT_A_NUMBER; } /** * Takes two phone numbers and compares them for equality. This is a convenience wrapper for * {@link #isNumberMatch(PhoneNumber, PhoneNumber)}. No default region is known. * * @param firstNumber first number to compare in proto buffer format * @param secondNumber second number to compare. Can contain formatting, and can have country * calling code specified with + at the start. * @return NOT_A_NUMBER, NO_MATCH, SHORT_NSN_MATCH, NSN_MATCH, EXACT_MATCH. See * {@link #isNumberMatch(PhoneNumber, PhoneNumber)} for more details. */ public MatchType isNumberMatch(PhoneNumber firstNumber, CharSequence secondNumber) { // First see if the second number has an implicit country calling code, by attempting to parse // it. try { PhoneNumber secondNumberAsProto = parse(secondNumber, UNKNOWN_REGION); return isNumberMatch(firstNumber, secondNumberAsProto); } catch (NumberParseException e) { if (e.getErrorType() == NumberParseException.ErrorType.INVALID_COUNTRY_CODE) { // The second number has no country calling code. EXACT_MATCH is no longer possible. // We parse it as if the region was the same as that for the first number, and if // EXACT_MATCH is returned, we replace this with NSN_MATCH. String firstNumberRegion = getRegionCodeForCountryCode(firstNumber.getCountryCode()); try { if (!firstNumberRegion.equals(UNKNOWN_REGION)) { PhoneNumber secondNumberWithFirstNumberRegion = parse(secondNumber, firstNumberRegion); MatchType match = isNumberMatch(firstNumber, secondNumberWithFirstNumberRegion); if (match == MatchType.EXACT_MATCH) { return MatchType.NSN_MATCH; } return match; } else { // If the first number didn't have a valid country calling code, then we parse the // second number without one as well. PhoneNumber secondNumberProto = new PhoneNumber(); parseHelper(secondNumber, null, false, false, secondNumberProto); return isNumberMatch(firstNumber, secondNumberProto); } } catch (NumberParseException e2) { // Fall-through to return NOT_A_NUMBER. } } } // One or more of the phone numbers we are trying to match is not a viable phone number. return MatchType.NOT_A_NUMBER; } /** * Returns true if the number can be dialled from outside the region, or unknown. If the number * can only be dialled from within the region, returns false. Does not check the number is a valid * number. Note that, at the moment, this method does not handle short numbers (which are * currently all presumed to not be diallable from outside their country). * * @param number the phone-number for which we want to know whether it is diallable from * outside the region */ public boolean canBeInternationallyDialled(PhoneNumber number) { PhoneMetadata metadata = getMetadataForRegion(getRegionCodeForNumber(number)); if (metadata == null) { // Note numbers belonging to non-geographical entities (e.g. +800 numbers) are always // internationally diallable, and will be caught here. return true; } String nationalSignificantNumber = getNationalSignificantNumber(number); return !isNumberMatchingDesc(nationalSignificantNumber, metadata.getNoInternationalDialling()); } /** * Returns true if the supplied region supports mobile number portability. Returns false for * invalid, unknown or regions that don't support mobile number portability. * * @param regionCode the region for which we want to know whether it supports mobile number * portability or not */ public boolean isMobileNumberPortableRegion(String regionCode) { PhoneMetadata metadata = getMetadataForRegion(regionCode); if (metadata == null) { logger.log(Level.WARNING, "Invalid or unknown region code provided: " + regionCode); return false; } return metadata.getMobileNumberPortableRegion(); } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy