2018-06-25 16:30:11 +02:00
|
|
|
// Copyright (C) 2017 Mathias Bynens. All rights reserved.
|
2017-07-14 17:37:24 +02:00
|
|
|
// This code is governed by the BSD license found in the LICENSE file.
|
|
|
|
/*---
|
|
|
|
description: |
|
|
|
|
Collection of functions used to assert the correctness of RegExp objects.
|
2022-05-06 13:44:47 +02:00
|
|
|
defines: [buildString, testPropertyEscapes, testPropertyOfStrings, testExtendedCharacterClass, matchValidator]
|
2017-07-14 17:37:24 +02:00
|
|
|
---*/
|
|
|
|
|
2021-05-29 01:47:36 +02:00
|
|
|
function buildString(args) {
|
|
|
|
// Use member expressions rather than destructuring `args` for improved
|
|
|
|
// compatibility with engines that only implement assignment patterns
|
|
|
|
// partially or not at all.
|
|
|
|
const loneCodePoints = args.loneCodePoints;
|
|
|
|
const ranges = args.ranges;
|
2017-04-13 17:22:49 +02:00
|
|
|
const CHUNK_SIZE = 10000;
|
2018-08-17 16:48:42 +02:00
|
|
|
let result = Reflect.apply(String.fromCodePoint, null, loneCodePoints);
|
|
|
|
for (let i = 0; i < ranges.length; i++) {
|
|
|
|
const range = ranges[i];
|
|
|
|
const start = range[0];
|
|
|
|
const end = range[1];
|
2017-04-13 17:22:49 +02:00
|
|
|
const codePoints = [];
|
|
|
|
for (let length = 0, codePoint = start; codePoint <= end; codePoint++) {
|
|
|
|
codePoints[length++] = codePoint;
|
|
|
|
if (length === CHUNK_SIZE) {
|
2018-08-17 16:48:42 +02:00
|
|
|
result += Reflect.apply(String.fromCodePoint, null, codePoints);
|
2017-04-13 17:22:49 +02:00
|
|
|
codePoints.length = length = 0;
|
|
|
|
}
|
|
|
|
}
|
2018-08-17 16:48:42 +02:00
|
|
|
result += Reflect.apply(String.fromCodePoint, null, codePoints);
|
2017-04-13 17:22:49 +02:00
|
|
|
}
|
|
|
|
return result;
|
|
|
|
}
|
|
|
|
|
2021-12-27 12:04:14 +01:00
|
|
|
function printCodePoint(codePoint) {
|
|
|
|
const hex = codePoint
|
|
|
|
.toString(16)
|
|
|
|
.toUpperCase()
|
|
|
|
.padStart(6, "0");
|
|
|
|
return `U+${hex}`;
|
|
|
|
}
|
|
|
|
|
|
|
|
function printStringCodePoints(string) {
|
|
|
|
const buf = [];
|
|
|
|
for (const symbol of string) {
|
|
|
|
const formatted = printCodePoint(symbol.codePointAt(0));
|
|
|
|
buf.push(formatted);
|
|
|
|
}
|
|
|
|
return buf.join(' ');
|
|
|
|
}
|
|
|
|
|
|
|
|
function testPropertyEscapes(regExp, string, expression) {
|
|
|
|
if (!regExp.test(string)) {
|
2017-04-13 17:22:49 +02:00
|
|
|
for (const symbol of string) {
|
2022-05-04 12:55:48 +02:00
|
|
|
const hex = printCodePoint(symbol.codePointAt(0));
|
2017-04-13 17:22:49 +02:00
|
|
|
assert(
|
2021-12-27 12:04:14 +01:00
|
|
|
regExp.test(symbol),
|
2017-04-13 17:22:49 +02:00
|
|
|
`\`${ expression }\` should match U+${ hex } (\`${ symbol }\`)`
|
|
|
|
);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2018-03-18 04:48:31 +01:00
|
|
|
|
2021-12-27 12:04:14 +01:00
|
|
|
function testPropertyOfStrings(args) {
|
|
|
|
// Use member expressions rather than destructuring `args` for improved
|
|
|
|
// compatibility with engines that only implement assignment patterns
|
|
|
|
// partially or not at all.
|
|
|
|
const regExp = args.regExp;
|
|
|
|
const expression = args.expression;
|
|
|
|
const matchStrings = args.matchStrings;
|
|
|
|
const nonMatchStrings = args.nonMatchStrings;
|
|
|
|
const allStrings = matchStrings.join('');
|
|
|
|
if (!regExp.test(allStrings)) {
|
|
|
|
for (const string of matchStrings) {
|
|
|
|
assert(
|
|
|
|
regExp.test(string),
|
|
|
|
`\`${ expression }\` should match ${ string } (U+${ printStringCodePoints(string) })`
|
|
|
|
);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
const allNonMatchStrings = nonMatchStrings.join('');
|
|
|
|
if (regExp.test(allNonMatchStrings)) {
|
|
|
|
for (const string of nonMatchStrings) {
|
|
|
|
assert(
|
|
|
|
!regExp.test(string),
|
|
|
|
`\`${ expression }\` should not match ${ string } (U+${ printStringCodePoints(string) })`
|
|
|
|
);
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2022-05-06 13:12:55 +02:00
|
|
|
// The exact same logic can be used to test extended character classes
|
|
|
|
// as enabled through the RegExp `v` flag. This is useful to test not
|
|
|
|
// just standalone properties of strings, but also string literals, and
|
|
|
|
// set operations.
|
|
|
|
const testExtendedCharacterClass = testPropertyOfStrings;
|
|
|
|
|
2021-12-27 12:04:14 +01:00
|
|
|
// Returns a function that validates a RegExp match result.
|
2018-03-18 04:48:31 +01:00
|
|
|
//
|
|
|
|
// Example:
|
|
|
|
//
|
|
|
|
// var validate = matchValidator(['b'], 1, 'abc');
|
|
|
|
// validate(/b/.exec('abc'));
|
|
|
|
//
|
|
|
|
function matchValidator(expectedEntries, expectedIndex, expectedInput) {
|
|
|
|
return function(match) {
|
|
|
|
assert.compareArray(match, expectedEntries, 'Match entries');
|
|
|
|
assert.sameValue(match.index, expectedIndex, 'Match index');
|
|
|
|
assert.sameValue(match.input, expectedInput, 'Match input');
|
|
|
|
}
|
|
|
|
}
|