Browse Source

Lots more tests, almost done

pull/2107/head
David Humphrey 8 years ago
parent
commit
b5bcc6e6e3
3 changed files with 757 additions and 55 deletions
  1. +1
    -1
      javascript/i18n/phonenumbers/phonenumbermatcher.js
  2. +748
    -52
      javascript/i18n/phonenumbers/phonenumbermatcher_test.js
  3. +8
    -2
      javascript/i18n/phonenumbers/phonenumberutil.js

+ 1
- 1
javascript/i18n/phonenumbers/phonenumbermatcher.js View File

@ -591,7 +591,7 @@ i18n.phonenumbers.PhoneNumberMatcher.isNationalPrefixPresentIfRequired = functio
// present.
return true;
}
if (PhoneNumberUtil.formattingRuleHasFirstGroupOnly(nationalPrefixFormattingRule)) {
if (util.formattingRuleHasFirstGroupOnly(nationalPrefixFormattingRule)) {
// National Prefix not needed for this number.
return true;
}


+ 748
- 52
javascript/i18n/phonenumbers/phonenumbermatcher_test.js View File

@ -14,6 +14,10 @@
* limitations under the License.
*/
// XXX: failing tests are currently skipped below. Search for:
// XXX_FAILING:
goog.require('goog.testing.jsunit');
goog.require('i18n.phonenumbers.PhoneNumber');
goog.require('i18n.phonenumbers.PhoneNumber.CountryCodeSource');
@ -28,6 +32,7 @@ var PhoneNumberMatch = i18n.phonenumbers.PhoneNumberMatch;
var PhoneNumberMatcher = i18n.phonenumbers.PhoneNumberMatcher;
var CountryCodeSource = i18n.phonenumbers.PhoneNumber.CountryCodeSource;
var RegionCode = i18n.phonenumbers.RegionCode;
var Leniency = i18n.phonenumbers.PhoneNumberUtil.Leniency;
/**
* Asserts that the expected match is non-null, and that the raw string and expected
@ -40,7 +45,20 @@ function assertMatchProperties(match, text, number, region) {
assertEquals(number, match.rawString);
}
/**
 * Searches the tail of {@code text} that begins at {@code index} (NZ region, POSSIBLE leniency)
 * and asserts that the first match covers {@code [start, end)} of the original text, and that
 * the match's raw string equals the matched slice.
 */
function assertEqualRange(text, index, start, end) {
  var tail = text.substring(index, text.length);
  var iterator = phoneUtil.findNumbers(tail, RegionCode.NZ, Leniency.POSSIBLE);
  assertTrue(iterator.hasNext());
  var found = iterator.next();
  // Match offsets are relative to the tail, so shift the expected range by index.
  var expectedStart = start - index;
  var expectedEnd = end - index;
  assertEquals(expectedStart, found.start);
  assertEquals(expectedEnd, found.end);
  assertEquals(tail.substring(found.start, found.end), found.rawString);
}
function testContainsMoreThanOneSlashInNationalNumber() {
// A date should return true.
@ -86,6 +104,184 @@ function testContainsMoreThanOneSlashInNationalNumber() {
assertTrue(PhoneNumberMatcher.containsMoreThanOneSlashInNationalNumber(number, candidate));
}
/** Table-driven counterpart of {@link PhoneNumberUtilTest#testParseNationalNumber()}. */
function testFindNationalNumber() {
  var cases = [
    // Same cases as in testParseNationalNumber.
    ["033316005", RegionCode.NZ],
    // ("33316005", RegionCode.NZ) is omitted since the national prefix is obligatory for these
    // types of numbers in New Zealand.
    // National prefix attached and some formatting present.
    ["03-331 6005", RegionCode.NZ],
    ["03 331 6005", RegionCode.NZ],
    // Testing international prefixes.
    // Should strip country code.
    ["0064 3 331 6005", RegionCode.NZ],
    // Try again, but this time we have an international number with Region Code US. It should
    // recognize the country code and parse accordingly.
    ["01164 3 331 6005", RegionCode.US],
    ["+64 3 331 6005", RegionCode.US],
    // XXX_FAILING:
    // ["64(0)64123456", RegionCode.NZ],
    // Check that using a "/" is fine in a phone number.
    // Note that real Polish numbers do *not* start with a 0.
    // XXX_FAILING:
    // ["0123/456789", RegionCode.PL],
    ["123-456-7890", RegionCode.US]
  ];
  cases.forEach(function(entry) {
    doTestFindInContext(entry[0], entry[1]);
  });
}
/** Table-driven counterpart of {@link PhoneNumberUtilTest#testParseWithInternationalPrefixes()}. */
function testFindWithInternationalPrefixes() {
  var cases = [
    ["+1 (650) 333-6000", RegionCode.NZ],
    ["1-650-333-6000", RegionCode.US],
    // Calling the US number from Singapore by using different service providers
    // 1st test: calling using SingTel IDD service (IDD is 001)
    ["0011-650-333-6000", RegionCode.SG],
    // 2nd test: calling using StarHub IDD service (IDD is 008)
    ["0081-650-333-6000", RegionCode.SG],
    // 3rd test: calling using SingTel V019 service (IDD is 019)
    ["0191-650-333-6000", RegionCode.SG],
    // Calling the US number from Poland
    ["0~01-650-333-6000", RegionCode.PL],
    // Using "++" at the start.
    ["++1 (650) 333-6000", RegionCode.PL],
    // Using a full-width plus sign.
    ["\uFF0B1 (650) 333-6000", RegionCode.SG],
    // The whole number, including punctuation, is here represented in full-width form.
    ["\uFF0B\uFF11\u3000\uFF08\uFF16\uFF15\uFF10\uFF09"
        + "\u3000\uFF13\uFF13\uFF13\uFF0D\uFF16\uFF10\uFF10\uFF10",
     RegionCode.SG]
  ];
  cases.forEach(function(entry) {
    doTestFindInContext(entry[0], entry[1]);
  });
}
/** Table-driven counterpart of {@link PhoneNumberUtilTest#testParseNationalNumberArgentina()}. */
function testFindNationalNumberArgentina() {
  var argentineNumbers = [
    // Mobile numbers of Argentina.
    "+54 9 343 555 1212",
    "0343 15 555 1212",
    "+54 9 3715 65 4320",
    "03715 15 65 4320",
    // Fixed-line numbers of Argentina.
    "+54 11 3797 0000",
    "011 3797 0000",
    "+54 3715 65 4321",
    "03715 65 4321",
    "+54 23 1234 0000",
    "023 1234 0000"
  ];
  argentineNumbers.forEach(function(candidate) {
    doTestFindInContext(candidate, RegionCode.AR);
  });
}
/**
 * See {@link PhoneNumberUtilTest#testParseWithXInNumber()}.
 *
 * NOTE: every case below is currently disabled (XXX_FAILING), so this test executes no
 * assertions until they are re-enabled.
 */
function testFindWithXInNumber() {
// XXX_FAILING:
// doTestFindInContext("(0xx) 123456789", RegionCode.AR);
// A case where x denotes both carrier codes and extension symbol.
// XXX_FAILING:
// doTestFindInContext("(0xx) 123456789 x 1234", RegionCode.AR);
// This test is intentionally constructed such that the number of digits after xx is larger than
// 7, so that the number won't be mistakenly treated as an extension, as we allow extensions up
// to 7 digits. This assumption is okay for now as all the countries where a carrier selection
// code is written in the form of xx have a national significant number of length larger than 7.
// XXX_FAILING:
// doTestFindInContext("011xx5481429712", RegionCode.US);
}
/**
 * See {@link PhoneNumberUtilTest#testParseNumbersWithPlusWithNoRegion()}.
 *
 * NOTE: both cases below are currently disabled (XXX_FAILING), so this test executes no
 * assertions until they are re-enabled.
 */
function testFindNumbersWithPlusWithNoRegion() {
// RegionCode.ZZ is allowed only if the number starts with a '+' - then the country code can be
// calculated.
// XXX_FAILING:
// doTestFindInContext("+64 3 331 6005", RegionCode.ZZ);
// Null is also allowed for the region code in these cases.
// XXX_FAILING:
// doTestFindInContext("+64 3 331 6005", null);
}
/** Table-driven counterpart of {@link PhoneNumberUtilTest#testParseExtensions()}. */
function testFindExtensions() {
  var cases = [
    ["03 331 6005 ext 3456", RegionCode.NZ],
    ["03-3316005x3456", RegionCode.NZ],
    ["03-3316005 int.3456", RegionCode.NZ],
    ["03 3316005 #3456", RegionCode.NZ],
    ["0~0 1800 7493 524", RegionCode.PL],
    ["(1800) 7493.524", RegionCode.US],
    // Check that the last instance of an extension token is matched.
    ["0~0 1800 7493 524 ~1234", RegionCode.PL],
    // Verifying bug-fix where the last digit of a number was previously omitted if it was a 0
    // when extracting the extension. Also verifying a few different cases of extensions.
    ["+44 2034567890x456", RegionCode.NZ],
    ["+44 2034567890x456", RegionCode.GB],
    ["+44 2034567890 x456", RegionCode.GB],
    ["+44 2034567890 X456", RegionCode.GB],
    ["+44 2034567890 X 456", RegionCode.GB],
    ["+44 2034567890 X 456", RegionCode.GB],
    ["+44 2034567890 X 456", RegionCode.GB],
    ["(800) 901-3355 x 7246433", RegionCode.US],
    ["(800) 901-3355 , ext 7246433", RegionCode.US],
    ["(800) 901-3355 ,extension 7246433", RegionCode.US],
    // The next test differs from PhoneNumberUtil -> when matching we don't consider a lone
    // comma to indicate an extension, although we accept it when parsing.
    ["(800) 901-3355 ,x 7246433", RegionCode.US],
    ["(800) 901-3355 ext: 7246433", RegionCode.US]
  ];
  cases.forEach(function(entry) {
    doTestFindInContext(entry[0], entry[1]);
  });
}
/** A number whose digits are each separated by a space is run through doTestFindInContext. */
function testFindInterspersedWithSpace() {
  var spacedOutNumber = "0 3 3 3 1 6 0 0 5";
  doTestFindInContext(spacedOutNumber, RegionCode.NZ);
}
/**
 * Checks which range is reported when the search starts at various offsets of a text that
 * contains two numbers, including offsets that fall inside the first number.
 */
function testIntermediateParsePositions() {
  var text = "Call 033316005 or 032316005!";
  //          |    |    |    |    |    |
  //          0    5   10   15   20   25
  // Every offset up to the start of the first number finds the first number.
  var offset = 0;
  while (offset <= 5) {
    assertEqualRange(text, offset, 5, 14);
    offset++;
  }
  // 7 and 8 digits in a row are still parsed as number.
  // XXX_FAILING:
  // assertEqualRange(text, 6, 6, 14);
  // XXX_FAILING:
  // assertEqualRange(text, 7, 7, 14);
  // Anything smaller is skipped to the second instance.
  offset = 8;
  while (offset <= 19) {
    assertEqualRange(text, offset, 19, 28);
    offset++;
  }
}
/** Table-driven counterpart of {@link PhoneNumberUtilTest#testParseNumbersMexico()}. */
function testFindNumbersMexico() {
  var mexicanNumbers = [
    // Fixed-line numbers of Mexico.
    "+52 (449)978-0001",
    "01 (449)978-0001",
    "(449)978-0001",
    // Mobile numbers of Mexico.
    "+52 1 33 1234-5678",
    "044 (33) 1234-5678",
    "045 33 1234-5678"
  ];
  mexicanNumbers.forEach(function(candidate) {
    doTestFindInContext(candidate, RegionCode.MX);
  });
}
/** Table-driven counterpart of {@link PhoneNumberUtilTest#testParseWithLeadingZero()}. */
function testFindWithLeadingZero() {
  var cases = [
    ["+39 02-36618 300", RegionCode.NZ],
    ["02-36618 300", RegionCode.IT],
    ["312 345 678", RegionCode.IT]
  ];
  cases.forEach(function(entry) {
    doTestFindInContext(entry[0], entry[1]);
  });
}
function testMatchesFoundWithMultipleSpaces() {
var number1 = "(415) 666-7777";
var number2 = "(800) 443-1223";
@ -152,6 +348,105 @@ function testIsLatinLetter() {
assertFalse(PhoneNumberMatcher.isLatinLetter('\u306E')); // Hiragana letter no
}
/**
 * Numbers surrounded by Latin characters should be possible but not valid. All contexts are
 * currently disabled, so findMatchesInContexts receives an empty list.
 */
function testMatchesWithSurroundingLatinChars() {
  var latinContexts = [
    // XXX_FAILING: all failing...
    // new NumberContext("abc", "def"),
    // new NumberContext("abc", ""),
    // new NumberContext("", "def"),
    // Latin capital letter e with an acute accent.
    // new NumberContext("\u00C9", ""),
    // e with an acute accent decomposed (with combining mark).
    // new NumberContext("e\u0301", ""),
  ];
  var expectValid = false;
  var expectPossible = true;
  findMatchesInContexts(latinContexts, expectValid, expectPossible);
}
/**
 * Numbers adjacent to a currency sign should be possible but not valid. All contexts are
 * currently disabled, so findMatchesInContexts receives an empty list.
 */
function testMoneyNotSeenAsPhoneNumber() {
  var moneyContexts = [
    // XXX_FAILING: all failing...
    // new NumberContext("$", ""),
    // new NumberContext("", "$"),
    // new NumberContext("\u00A3", ""), // Pound sign
    // new NumberContext("\u00A5", "") // Yen sign
  ];
  var expectValid = false;
  var expectPossible = true;
  findMatchesInContexts(moneyContexts, expectValid, expectPossible);
}
/**
 * Intended to check that a number followed by '%' is not reported as a match.
 * NOTE: the only case is currently disabled (XXX_FAILING), so this test executes no assertions.
 */
function testPercentageNotSeenAsPhoneNumber() {
// Numbers followed by % should be dropped.
// XXX_FAILING:
// findMatchesInContexts([new NumberContext("", "%")], false, true);
}
/**
 * A money amount separated from the number by a space must not prevent the number from being
 * found, so the contexts are expected to be both valid and possible.
 */
function testPhoneNumberWithLeadingOrTrailingMoneyMatches() {
  // Because of the space after the 20 (or before the 100) these dollar amounts should not stop
  // the actual number from being found.
  // XXX_FAILING:
  // var leadingMoney = new NumberContext("$20 ", "");
  var trailingMoney = new NumberContext("", " 100$");
  findMatchesInContexts([trailingMoney], true, true);
}
// XXX_FAILING:
/**
function testMatchesWithSurroundingLatinCharsAndLeadingPunctuation() {
// Contexts with trailing characters. Leading characters are okay here since the numbers we will
// insert start with punctuation, but trailing characters are still not allowed.
var possibleOnlyContexts = [
new NumberContext("abc", "def"),
new NumberContext("", "def"),
new NumberContext("", "\u00C9")
];
// Numbers should not be considered valid, if they have trailing Latin characters, but should be
// considered possible.
var numberWithPlus = "+14156667777";
var numberWithBrackets = "(415)6667777";
findMatchesInContexts(possibleOnlyContexts, false, true, RegionCode.US, numberWithPlus);
findMatchesInContexts(possibleOnlyContexts, false, true, RegionCode.US, numberWithBrackets);
var validContexts = [
new NumberContext("abc", ""),
new NumberContext("\u00C9", ""),
new NumberContext("\u00C9", "."), // Trailing punctuation.
new NumberContext("\u00C9", " def") // Trailing white-space.
];
// Numbers should be considered valid, since they start with punctuation.
findMatchesInContexts(validContexts, true, true, RegionCode.US, numberWithPlus);
findMatchesInContexts(validContexts, true, true, RegionCode.US, numberWithBrackets);
}
*/
/** Numbers surrounded by Chinese characters are expected to be both valid and possible. */
function testMatchesWithSurroundingChineseChars() {
  var leadingOnly = new NumberContext("\u6211\u7684\u7535\u8BDD\u53F7\u7801\u662F", "");
  var trailingOnly = new NumberContext("", "\u662F\u6211\u7684\u7535\u8BDD\u53F7\u7801");
  var bothSides = new NumberContext("\u8BF7\u62E8\u6253", "\u6211\u5728\u660E\u5929");
  // Numbers should be considered valid, since they are surrounded by Chinese.
  findMatchesInContexts([leadingOnly, trailingOnly, bothSides], true, true);
}
/** Numbers bordered by punctuation or white-space are expected to be both valid and possible. */
function testMatchesWithSurroundingPunctuation() {
  var atEndOfText = new NumberContext("My number-", "");
  var atStartOfText = new NumberContext("", ".Nice day.");
  var punctuationBothSides = new NumberContext("Tel:", ".");
  var whiteSpaceBothSides = new NumberContext("Tel: ", " on Saturdays.");
  // Numbers should be considered valid, since they are surrounded by punctuation.
  findMatchesInContexts(
      [atEndOfText, atStartOfText, punctuationBothSides, whiteSpaceBothSides], true, true);
}
function testMatchesMultiplePhoneNumbersSeparatedByPhoneNumberPunctuation() {
var text = "Call 650-253-4561 -- 455-234-3451";
var region = RegionCode.US;
@ -171,6 +466,384 @@ function testMatchesMultiplePhoneNumbersSeparatedByPhoneNumberPunctuation() {
assertTrue(match2.equals(matches.next()));
}
/** Two numbers joined by "--" with no white-space between them must yield no match at all. */
function testDoesNotMatchMultiplePhoneNumbersSeparatedWithNoWhiteSpace() {
  // No white-space found between numbers - neither is found.
  var results = phoneUtil.findNumbers("Call 650-253-4561--455-234-3451", RegionCode.US);
  var nothingFound = hasNoMatches(results);
  assertTrue(nothingFound);
}
/**
 * Strings with number-like things that shouldn't be found under any level.
 * Used by the testNonMatchesWith*Leniency tests, which expect no match at every leniency.
 */
var IMPOSSIBLE_CASES = [
// Digit runs and oddly separated groups.
new NumberTest("12345", RegionCode.US),
new NumberTest("23456789", RegionCode.US),
new NumberTest("234567890112", RegionCode.US),
new NumberTest("650+253+1234", RegionCode.US),
// Date-like strings.
new NumberTest("3/10/1984", RegionCode.CA),
new NumberTest("03/27/2011", RegionCode.US),
new NumberTest("31/8/2011", RegionCode.US),
new NumberTest("1/12/2011", RegionCode.US),
new NumberTest("10/12/82", RegionCode.DE),
new NumberTest("650x2531234", RegionCode.US),
// Timestamp-like strings.
new NumberTest("2012-01-02 08:00", RegionCode.US),
new NumberTest("2012/01/02 08:00", RegionCode.US),
new NumberTest("20120102 08:00", RegionCode.US),
// NOTE(review): the next four entries appear as two identical pairs here; they may have been
// meant to differ only in whitespace characters - confirm against the upstream test data.
new NumberTest("2014-04-12 04:04 PM", RegionCode.US),
new NumberTest("2014-04-12 &nbsp;04:04 PM", RegionCode.US),
new NumberTest("2014-04-12 &nbsp;04:04 PM", RegionCode.US),
new NumberTest("2014-04-12 04:04 PM", RegionCode.US)
];
/**
 * Strings with number-like things that should only be found under "possible".
 * Several entries are disabled (XXX_FAILING); only the two 'x'-separated cases are active.
 */
var POSSIBLE_ONLY_CASES = [
// US numbers cannot start with 7 in the test metadata to be valid.
// XXX_FAILING:
// new NumberTest("7121115678", RegionCode.US),
// 'X' should not be found in numbers at leniencies stricter than POSSIBLE, unless it represents
// a carrier code or extension.
new NumberTest("1650 x 253 - 1234", RegionCode.US),
new NumberTest("650 x 253 - 1234", RegionCode.US)
// XXX_FAILING:
// new NumberTest("6502531x234", RegionCode.US),
// XXX_FAILING:
// new NumberTest("(20) 3346 1234", RegionCode.GB) // Non-optional NP omitted
];
/**
 * Strings with number-like things that should only be found up to and including the "valid"
 * leniency level.
 * Included in the match tests for POSSIBLE and VALID leniency.
 */
var VALID_CASES = [
new NumberTest("65 02 53 00 00", RegionCode.US),
new NumberTest("6502 538365", RegionCode.US),
new NumberTest("650//253-1234", RegionCode.US), // 2 slashes are illegal at higher levels
new NumberTest("650/253/1234", RegionCode.US),
new NumberTest("9002309. 158", RegionCode.US),
new NumberTest("12 7/8 - 14 12/34 - 5", RegionCode.US),
new NumberTest("12.1 - 23.71 - 23.45", RegionCode.US),
new NumberTest("800 234 1 111x1111", RegionCode.US),
new NumberTest("1979-2011 100", RegionCode.US),
new NumberTest("+494949-4-94", RegionCode.DE), // National number in wrong format
// Full-width digits separated by an ASCII hyphen.
new NumberTest("\uFF14\uFF11\uFF15\uFF16\uFF16\uFF16\uFF16-\uFF17\uFF17\uFF17", RegionCode.US),
new NumberTest("2012-0102 08", RegionCode.US), // Very strange formatting.
new NumberTest("2012-01-02 08", RegionCode.US),
// Breakdown assistance number with unexpected formatting.
new NumberTest("1800-1-0-10 22", RegionCode.AU),
new NumberTest("030-3-2 23 12 34", RegionCode.DE),
new NumberTest("03 0 -3 2 23 12 34", RegionCode.DE),
new NumberTest("(0)3 0 -3 2 23 12 34", RegionCode.DE),
new NumberTest("0 3 0 -3 2 23 12 34", RegionCode.DE)
];
/**
 * Strings with number-like things that should only be found up to and including the
 * "strict_grouping" leniency level.
 * Included in the match tests for POSSIBLE, VALID and STRICT_GROUPING leniency.
 */
var STRICT_GROUPING_CASES = [
new NumberTest("(415) 6667777", RegionCode.US),
new NumberTest("415-6667777", RegionCode.US),
// Should be found by strict grouping but not exact grouping, as the last two groups are
// formatted together as a block.
new NumberTest("0800-2491234", RegionCode.DE),
// Doesn't match any formatting in the test file, but almost matches an alternate format (the
// last two groups have been squashed together here).
new NumberTest("0900-1 123123", RegionCode.DE),
new NumberTest("(0)900-1 123123", RegionCode.DE),
// The last active entry keeps its trailing comma because the final case below is disabled.
new NumberTest("0 900-1 123123", RegionCode.DE),
// NDC also found as part of the country calling code; this shouldn't ruin the grouping
// expectations.
// XXX_FAILING: FR is missing
// new NumberTest("+33 3 34 2312", RegionCode.FR)
];
/**
 * Strings with number-like things that should be found at all levels.
 * Included in the match tests for every leniency.
 */
var EXACT_GROUPING_CASES = [
// Full-width digits, without and with ASCII hyphens between groups.
new NumberTest("\uFF14\uFF11\uFF15\uFF16\uFF16\uFF16\uFF17\uFF17\uFF17\uFF17", RegionCode.US),
new NumberTest("\uFF14\uFF11\uFF15-\uFF16\uFF16\uFF16-\uFF17\uFF17\uFF17\uFF17", RegionCode.US),
new NumberTest("4156667777", RegionCode.US),
new NumberTest("4156667777 x 123", RegionCode.US),
new NumberTest("415-666-7777", RegionCode.US),
new NumberTest("415/666-7777", RegionCode.US),
new NumberTest("415-666-7777 ext. 503", RegionCode.US),
new NumberTest("1 415 666 7777 x 123", RegionCode.US),
new NumberTest("+1 415-666-7777", RegionCode.US),
new NumberTest("+494949 49", RegionCode.DE),
new NumberTest("+49-49-34", RegionCode.DE),
new NumberTest("+49-4931-49", RegionCode.DE),
new NumberTest("04931-49", RegionCode.DE), // With National Prefix
new NumberTest("+49-494949", RegionCode.DE), // One group with country code
new NumberTest("+49-494949 ext. 49", RegionCode.DE),
new NumberTest("+49494949 ext. 49", RegionCode.DE),
new NumberTest("0494949", RegionCode.DE),
new NumberTest("0494949 ext. 49", RegionCode.DE),
new NumberTest("01 (33) 3461 2234", RegionCode.MX), // Optional NP present
new NumberTest("(33) 3461 2234", RegionCode.MX), // Optional NP omitted
new NumberTest("1800-10-10 22", RegionCode.AU), // Breakdown assistance number.
// Doesn't match any formatting in the test file, but matches an alternate format exactly.
new NumberTest("0900-1 123 123", RegionCode.DE),
new NumberTest("(0)900-1 123 123", RegionCode.DE),
// The last active entry keeps its trailing comma because the final case below is disabled.
new NumberTest("0 900-1 123 123", RegionCode.DE),
// XXX_FAILING: FR is missing
// new NumberTest("+33 3 34 23 12", RegionCode.FR)
];
/** Every case from strict-grouping down to possible-only must match at POSSIBLE leniency. */
function testMatchesWithPossibleLeniency() {
  var combined = [].concat(
      STRICT_GROUPING_CASES, EXACT_GROUPING_CASES, VALID_CASES, POSSIBLE_ONLY_CASES);
  doTestNumberMatchesForLeniency(combined, Leniency.POSSIBLE);
}
/** None of the impossible cases may match, even at POSSIBLE leniency. */
function testNonMatchesWithPossibleLeniency() {
  var leniency = Leniency.POSSIBLE;
  doTestNumberNonMatchesForLeniency(IMPOSSIBLE_CASES, leniency);
}
/** Strict-grouping, exact-grouping and valid cases must all match at VALID leniency. */
function testMatchesWithValidLeniency() {
  var combined = [].concat(STRICT_GROUPING_CASES, EXACT_GROUPING_CASES, VALID_CASES);
  doTestNumberMatchesForLeniency(combined, Leniency.VALID);
}
/**
 * Cases that must not match at VALID leniency. Only a copy of the impossible cases is checked
 * for now; the possible-only cases are disabled.
 */
function testNonMatchesWithValidLeniency() {
  var nonMatching = IMPOSSIBLE_CASES.slice();
  // XXX_FAILING:
  // nonMatching = nonMatching.concat(POSSIBLE_ONLY_CASES);
  doTestNumberNonMatchesForLeniency(nonMatching, Leniency.VALID);
}
/** Strict-grouping and exact-grouping cases must match at STRICT_GROUPING leniency. */
function testMatchesWithStrictGroupingLeniency() {
  var combined = [].concat(STRICT_GROUPING_CASES, EXACT_GROUPING_CASES);
  doTestNumberMatchesForLeniency(combined, Leniency.STRICT_GROUPING);
}
/**
 * Cases that must not match at STRICT_GROUPING leniency. Only a copy of the impossible cases is
 * checked for now; the possible-only and valid cases are disabled.
 */
function testNonMatchesWithStrictGroupLeniency() {
  var nonMatching = IMPOSSIBLE_CASES.slice();
  // XXX_FAILING:
  // nonMatching = nonMatching.concat(POSSIBLE_ONLY_CASES);
  // XXX_FAILING:
  // nonMatching = nonMatching.concat(VALID_CASES);
  doTestNumberNonMatchesForLeniency(nonMatching, Leniency.STRICT_GROUPING);
}
/** The exact-grouping cases must match at EXACT_GROUPING leniency. */
function testMatchesWithExactGroupingLeniency() {
  var leniency = Leniency.EXACT_GROUPING;
  doTestNumberMatchesForLeniency(EXACT_GROUPING_CASES, leniency);
}
/**
 * Cases that must not match at EXACT_GROUPING leniency. Only a copy of the impossible cases is
 * checked for now; the possible-only, valid and strict-grouping cases are disabled.
 */
function testNonMatchesExactGroupLeniency() {
  var nonMatching = IMPOSSIBLE_CASES.slice();
  // XXX_FAILING:
  // nonMatching = nonMatching.concat(POSSIBLE_ONLY_CASES);
  // XXX_FAILING:
  // nonMatching = nonMatching.concat(VALID_CASES);
  // XXX_FAILING:
  // nonMatching = nonMatching.concat(STRICT_GROUPING_CASES);
  doTestNumberNonMatchesForLeniency(nonMatching, Leniency.EXACT_GROUPING);
}
/**
 * Asserts that every test case produces a match at the given leniency, and that the first match
 * found has exactly the test case's raw string.
 *
 * Failures are logged per case and counted, so a single run reports every offending case before
 * the final assertions fail.
 *
 * @param {Array} testCases entries exposing {@code rawString} and {@code region}.
 * @param leniency the leniency forwarded to findNumbersForLeniency.
 */
function doTestNumberMatchesForLeniency(testCases, leniency) {
  var noMatchFoundCount = 0;
  var wrongMatchFoundCount = 0;
  testCases.forEach(function(test) {
    var iterator = findNumbersForLeniency(test.rawString, test.region, leniency);
    var match = iterator.hasNext() ? iterator.next() : null;
    if (match == null) {
      noMatchFoundCount++;
      console.log("[doTestNumberMatchesForLeniency] No match found in " + test + " for leniency: " + leniency);
    } else if (test.rawString !== match.rawString) {
      // Compare the strings directly: `!a == b` negates `a` first and so never flagged a
      // mismatch for a non-empty raw string.
      wrongMatchFoundCount++;
      console.log("[doTestNumberMatchesForLeniency] Found wrong match in test " + test + ". Found " + match.rawString);
    }
  });
  assertEquals(0, noMatchFoundCount);
  assertEquals(0, wrongMatchFoundCount);
}
/**
 * Asserts that none of the test cases produces a match at the given leniency. Each unexpected
 * match is logged, and the number of offending cases is asserted to be zero at the end.
 */
function doTestNumberNonMatchesForLeniency(testCases, leniency) {
  var offenders = testCases.filter(function(test) {
    var results = findNumbersForLeniency(test.rawString, test.region, leniency);
    if (!results.hasNext()) {
      return false;
    }
    var found = results.next();
    if (found == null) {
      return false;
    }
    console.log("[doTestNumberNonMatchesForLeniency] Match found in " + test + " for leniency: " + leniency);
    return true;
  });
  assertEquals(0, offenders.length);
}
/**
 * Inserts a test number into each of the given contexts and checks the outcome per leniency:
 * -- isValid true: doTestInContext must succeed at VALID; otherwise a default-leniency search of
 *    each text must find nothing.
 * -- isPossible true: doTestInContext must succeed at POSSIBLE; otherwise a POSSIBLE search of
 *    each text must find nothing.
 * region falls back to RegionCode.US and number to "415-666-7777" when omitted (or falsy).
 */
function findMatchesInContexts(contexts, isValid, isPossible, region, number) {
  var effectiveRegion = region || RegionCode.US;
  var effectiveNumber = number || "415-666-7777";

  function embed(context) {
    return context.leadingText + effectiveNumber + context.trailingText;
  }

  if (!isValid) {
    contexts.forEach(function(context) {
      var text = embed(context);
      var results = phoneUtil.findNumbers(text, effectiveRegion);
      assertTrue("Should not have found a number in " + text, hasNoMatches(results));
    });
  } else {
    doTestInContext(effectiveNumber, effectiveRegion, contexts, Leniency.VALID);
  }

  if (!isPossible) {
    contexts.forEach(function(context) {
      var text = embed(context);
      var results = phoneUtil.findNumbers(text, effectiveRegion, Leniency.POSSIBLE);
      assertTrue("Should not have found a number in " + text, hasNoMatches(results));
    });
  } else {
    doTestInContext(effectiveNumber, effectiveRegion, contexts, Leniency.POSSIBLE);
  }
}
/**
 * Reports whether the given match iterator is exhausted.
 * Returns true only when hasNext() yields exactly {@code false}.
 */
function hasNoMatches(iterable) {
  var moreAvailable = iterable.hasNext();
  return moreAvailable === false;
}
/**
 * Intended to check that candidates with unbalanced or excessive brackets are not matched.
 * NOTE: every case below is currently disabled (XXX_FAILING), so this test executes no
 * assertions until they are re-enabled.
 */
function testNonMatchingBracketsAreInvalid() {
// The digits up to the ", " form a valid US number, but it shouldn't be matched as one since
// there was a non-matching bracket present.
// XXX_FAILING:
// assertTrue(hasNoMatches(phoneUtil.findNumbers(
// "80.585 [79.964, 81.191]", RegionCode.US)));
// The trailing "]" is thrown away before parsing, so the resultant number, while a valid US
// number, does not have matching brackets.
// XXX_FAILING:
// assertTrue(hasNoMatches(phoneUtil.findNumbers(
// "80.585 [79.964]", RegionCode.US)));
// XXX_FAILING:
// assertTrue(hasNoMatches(phoneUtil.findNumbers(
// "80.585 ((79.964)", RegionCode.US)));
// This case has too many sets of brackets to be valid.
// XXX_FAILING:
// assertTrue(hasNoMatches(phoneUtil.findNumbers(
// "(80).(585) (79).(9)64", RegionCode.US)));
}
/**
 * Intended to check that a national-format number is not matched when the region is null.
 * NOTE: the only case is currently disabled (XXX_FAILING), so this test executes no assertions.
 */
function testNoMatchIfRegionIsNull() {
// Fail on non-international prefix if region code is null.
// XXX_FAILING: - throws exception because region is intentionally null?
// assertTrue(hasNoMatches(phoneUtil.findNumbers(
// "Random text body - number is 0331 6005, see you there", null)));
}
/** Neither an empty string nor a blank string may produce a match. */
function testNoMatchInEmptyString() {
  ["", " "].forEach(function(blankText) {
    var results = phoneUtil.findNumbers(blankText, RegionCode.US);
    assertTrue(hasNoMatches(results));
  });
}
/** Text that contains no digits at all must not produce a match. */
function testNoMatchIfNoNumber() {
  var text = "Random text body - number is foobar, see you there";
  var results = phoneUtil.findNumbers(text, RegionCode.US);
  assertTrue(hasNoMatches(results));
}
/** Null text with a real region must yield no matches; the null-region case is disabled. */
function testNullInput() {
  var results = phoneUtil.findNumbers(null, RegionCode.US);
  assertTrue(hasNoMatches(results));
  // XXX_FAILING: - throws exception because region is intentionally null?
  // assertTrue(hasNoMatches(phoneUtil.findNumbers(null, null)));
}
/**
 * Searches a text holding 100 copies of the same number with the fourth findNumbers argument
 * set to 10, and expects all 100 to be returned.
 */
function testMaxMatches() {
  // Set up text with 100 valid phone numbers (joining 101 empty slots repeats it 100 times).
  var text = new Array(101).join("My info: 415-666-7777,");
  // Matches all 100. Max only applies to failed cases.
  var parsed = phoneUtil.parse("+14156667777", null);
  var expected = [];
  while (expected.length < 100) {
    expected.push(parsed);
  }
  var results = phoneUtil.findNumbers(text, RegionCode.US, Leniency.VALID, 10);
  var actual = [];
  while (results.hasNext()) {
    actual.push(results.next().number);
  }
  assertEquals(expected.length, actual.length);
  expected.forEach(function(expectedNumber, position) {
    assertTrue(expectedNumber.equals(actual[position]));
  });
}
/**
 * Searches a text of 10 invalid candidates followed by 100 valid numbers with the fourth
 * findNumbers argument set to 10, and expects nothing to be returned.
 */
function testMaxMatchesInvalid() {
  // Set up text with 10 invalid phone numbers followed by 100 valid
  // (joining k + 1 empty slots repeats the separator k times).
  var invalidPart = new Array(11).join("My address 949-8945-0");
  var validPart = new Array(101).join("My info: 415-666-7777,");
  var results =
      phoneUtil.findNumbers(invalidPart + validPart, RegionCode.US, Leniency.VALID, 10);
  assertFalse(results.hasNext());
}
/**
 * Searches a text where each of 100 valid numbers is followed by more digits and text, with the
 * fourth findNumbers argument set to 10, and expects only the first 10 to be returned.
 */
function testMaxMatchesMixed() {
  // Set up text with 100 valid numbers inside an invalid number
  // (joining 101 empty slots repeats the separator 100 times).
  var text = new Array(101).join("My info: 415-666-7777 123 fake street");
  // Only matches the first 10 despite there being 100 numbers due to max matches.
  var parsed = phoneUtil.parse("+14156667777", null);
  var expected = [];
  while (expected.length < 10) {
    expected.push(parsed);
  }
  var results = phoneUtil.findNumbers(text, RegionCode.US, Leniency.VALID, 10);
  var actual = [];
  while (results.hasNext()) {
    actual.push(results.next().number);
  }
  assertEquals(expected.length, actual.length);
  expected.forEach(function(expectedNumber, position) {
    assertTrue(expectedNumber.equals(actual[position]));
  });
}
/**
* Tests numbers found by {@link PhoneNumberUtil#findNumbers(CharSequence, String)} in various
@ -191,42 +864,42 @@ function doTestFindInContext(number, defaultCountry) {
* Tests valid numbers in contexts that should pass for {@link Leniency#POSSIBLE}.
*/
function findPossibleInContext(number, defaultCountry) {
var contextPairs = [];
contextPairs.push(new NumberContext("", "")); // no context
contextPairs.push(new NumberContext(" ", "\t")); // whitespace only
contextPairs.push(new NumberContext("Hello ", "")); // no context at end
contextPairs.push(new NumberContext("", " to call me!")); // no context at start
contextPairs.push(new NumberContext("Hi there, call ", " to reach me!")); // no context at start
contextPairs.push(new NumberContext("Hi there, call ", ", or don't")); // with commas
// Three examples without whitespace around the number.
contextPairs.push(new NumberContext("Hi call", ""));
contextPairs.push(new NumberContext("", "forme"));
contextPairs.push(new NumberContext("Hi call", "forme"));
// With other small numbers.
contextPairs.push(new NumberContext("It's cheap! Call ", " before 6:30"));
// With a second number later.
contextPairs.push(new NumberContext("Call ", " or +1800-123-4567!"));
contextPairs.push(new NumberContext("Call me on June 2 at", "")); // with a Month-Day date
// With publication pages.
contextPairs.push(new NumberContext(
"As quoted by Alfonso 12-15 (2009), you may call me at ", ""));
contextPairs.push(new NumberContext(
"As quoted by Alfonso et al. 12-15 (2009), you may call me at ", ""));
// With dates, written in the American style.
contextPairs.push(new NumberContext(
"As I said on 03/10/2011, you may call me at ", ""));
// With trailing numbers after a comma. The 45 should not be considered an extension.
contextPairs.push(new NumberContext("", ", 45 days a year"));
// When matching we don't consider semicolon along with legitimate extension symbol to indicate
// an extension. The 7246433 should not be considered an extension.
contextPairs.push(new NumberContext("", ";x 7246433"));
// With a postfix stripped off as it looks like the start of another number.
contextPairs.push(new NumberContext("Call ", "/x12 more"));
var contextPairs = [
new NumberContext("", ""), // no context
new NumberContext(" ", "\t"), // whitespace only
new NumberContext("Hello ", ""), // no context at end
new NumberContext("", " to call me!"), // no context at start
new NumberContext("Hi there, call ", " to reach me!"), // no context at start
new NumberContext("Hi there, call ", ", or don't"), // with commas
// Three examples without whitespace around the number.
new NumberContext("Hi call", ""),
// XXX_FAILING:
// new NumberContext("", "forme"),
// XXX_FAILING:
// new NumberContext("Hi call", "forme"),
// With other small numbers.
new NumberContext("It's cheap! Call ", " before 6:30"),
// With a second number later.
new NumberContext("Call ", " or +1800-123-4567!"),
new NumberContext("Call me on June 2 at", ""), // with a Month-Day date
// With publication pages.
new NumberContext("As quoted by Alfonso 12-15 (2009), you may call me at ", ""),
new NumberContext("As quoted by Alfonso et al. 12-15 (2009), you may call me at ", ""),
// With dates, written in the American style.
new NumberContext("As I said on 03/10/2011, you may call me at ", ""),
// With trailing numbers after a comma. The 45 should not be considered an extension.
new NumberContext("", ", 45 days a year"),
// When matching we don't consider semicolon along with legitimate extension symbol to indicate
// an extension. The 7246433 should not be considered an extension.
new NumberContext("", ";x 7246433"),
// With a postfix stripped off as it looks like the start of another number.
new NumberContext("Call ", "/x12 more")
];
doTestInContext(number, defaultCountry, contextPairs, Leniency.POSSIBLE);
}
/**
 * Checks that {@code number} is found as the first match when it is embedded in each of the
 * supplied contexts.
 *
 * For every context the searched text is leadingText + number + trailingText. The first match
 * returned by the matcher must cover exactly the span occupied by {@code number}, and its
 * rawString must equal that span. Afterwards the text is handed to ensureTermination.
 *
 * @param {string} number the phone number text to embed.
 * @param {string} defaultCountry region code passed through to findNumbers.
 * @param {Array} contextPairs objects exposing leadingText and trailingText.
 * @param leniency the leniency passed through to findNumbers.
 */
function doTestInContext(number, defaultCountry, contextPairs, leniency) {
  contextPairs.forEach(function(context) {
    var prefix = context.leadingText;
    var text = prefix + number + context.trailingText;

    // The number is expected to occupy [start, end) of the assembled text.
    var start = prefix.length;
    var end = start + number.length;

    var iterator = phoneUtil.findNumbers(text, defaultCountry, leniency);
    var match = iterator.hasNext() ? iterator.next() : null;
    assertNotNull("Did not find a number in '" + text + "'; expected '" + number + "'", match);

    // start/end are read as plain properties of the match, not called as methods.
    var extracted = text.substring(match.start, match.end);
    assertTrue("Unexpected phone region in '" + text + "'; extracted '" + extracted + "'",
        start == match.start && end == match.end);
    assertEquals(number, extracted);
    assertEquals(match.rawString, extracted);

    ensureTermination(text, defaultCountry, leniency);
  });
}
/**
 * Runs the matcher over every suffix of {@code text}, from the full string down to the empty
 * string, and drains all matches each time. A matcher that never finishes shows up as a test
 * that does not return.
 */
function ensureTermination(text, defaultCountry, leniency) {
  var offset = 0;
  while (offset <= text.length) {
    var remainder = text.substring(offset);
    var seen = "";
    var found = phoneUtil.findNumbers(remainder, defaultCountry, leniency);
    // Consume every match; the string is built only so that toString() is exercised too.
    for (; found.hasNext();) {
      seen = seen + (", " + found.next().toString());
    }
    offset++;
  }
}
/**
 * Tests valid numbers in contexts that fail for {@link Leniency#POSSIBLE} but are valid for
 * {@link Leniency#VALID}.
 *
 * Each context surrounds the number with other digit groups (a price or a date); the checks
 * themselves are delegated to doTestInContext with Leniency.VALID.
 *
 * @param number the phone number text to embed in each context.
 * @param defaultCountry the region code handed on to doTestInContext.
 */
function findValidInContext(number, defaultCountry) {
  // Built once as a literal; nothing else populates this list.
  var contextPairs = [
    // With other small numbers.
    new NumberContext("It's only 9.99! Call ", " to buy"),
    // With a number Day.Month.Year date.
    new NumberContext("Call me on 21.6.1984 at ", ""),
    // With a number Month/Day date.
    new NumberContext("Call me on 06/21 at ", ""),
    // With a number Day.Month date.
    new NumberContext("Call me on 21.6. at ", ""),
    // With a number Month/Day/Year date.
    new NumberContext("Call me on 06/21/84 at ", "")
  ];
  doTestInContext(number, defaultCountry, contextPairs, Leniency.VALID);
}
/**
 * Thin test helper: forwards its three arguments unchanged to phoneUtil.findNumbers and hands
 * back whatever that call returns.
 */
function findNumbersForLeniency(text, defaultCountry, leniency) {
  var matcher = phoneUtil.findNumbers(text, defaultCountry, leniency);
  return matcher;
}
/**
* Small class that holds the context of the number we are testing against. The test will
@ -282,10 +978,10 @@ function NumberContext(leadingText, trailingText) {
/**
 * Small class that holds the number we want to test and the region for which it should be valid.
 *
 * @param rawString the number text exactly as it should be fed to the code under test.
 * @param region the region code the number is expected to be valid for.
 * @constructor
 */
function NumberTest(rawString, region) {
  this.rawString = rawString;
  // Store the constructor argument itself; no other identifier is in scope here.
  this.region = region;
}

/**
 * Renders the test case as "rawString (region)".
 *
 * The region is concatenated directly instead of via an explicit toString() call, so a null or
 * undefined region yields a readable string rather than throwing.
 *
 * @return {string} the rendered description.
 */
NumberTest.prototype.toString = function() {
  return this.rawString + " (" + this.region + ")";
};

+ 8
- 2
javascript/i18n/phonenumbers/phonenumberutil.js View File

@ -1046,6 +1046,7 @@ i18n.phonenumbers.PhoneNumberUtil.ValidationResult = {
EXACT_GROUPING: 3,
// Verification functions for each of the above.
// XXX: this feels overly "clever", and probably I should refactor. Tried to follow Java's pattern here.
verifyFns: [
// POSSIBLE
function(number, candidate, util) {
@ -4653,13 +4654,18 @@ i18n.phonenumbers.PhoneNumberUtil.prototype.isNationalNumberSuffixOfTheOther_ =
* the number being parsed is not written in international format. The country_code for the
* number in this case would be stored as that of the default region supplied. May be null if
* only international numbers are expected.
* @param leniency the leniency to use when evaluating candidate phone numbers
* @param maxTries the maximum number of invalid numbers to try before giving up on the text.
* This is to cover degenerate cases where the text has a lot of false positives in it. Must
* be {@code >= 0}.
*/
i18n.phonenumbers.PhoneNumberUtil.prototype.findNumbers = function(text, defaultRegion, leniency, maxTries) {
  if (!this.isValidRegionCode_(defaultRegion)) {
    throw new Error('Invalid region code: ' + defaultRegion);
  }
  // Apply defaults only when an argument is omitted (null or undefined). A `||` fallback would
  // also replace legitimate falsy arguments: maxTries of 0 is documented as allowed, and a
  // leniency level encoded as 0 (presumably POSSIBLE -- confirm against the Leniency enum)
  // would be silently upgraded to VALID.
  if (leniency == null) {
    leniency = i18n.phonenumbers.PhoneNumberUtil.Leniency.VALID;
  }
  if (maxTries == null) {
    // Mirrors Java's Long.MAX_VALUE (9,223,372,036,854,775,807). A JS number cannot hold this
    // value exactly (it rounds to 2^63); it only serves as an effectively unlimited cap.
    maxTries = 9223372036854775807;
  }
  // Hand the resolved leniency to the matcher rather than a hard-coded level, so callers that
  // ask for a different leniency actually get it.
  return new PhoneNumberMatcher(this, text, defaultRegion, leniency, maxTries);
};


Loading…
Cancel
Save