/*
 * Mirror of https://github.com/thangisme/notes.git
 * Synced 2024-11-01 00:37:33 -04:00
 * 45 lines, 1.6 KiB, JavaScript
 */
/**
 * Used to compose unicode character classes.
 *
 * Every `rs*` value is regex *source text* (escapes are kept as literal
 * backslash sequences) so the pieces can be concatenated before compiling.
 * The `*Range` values are the interior of a character class, without brackets.
 */
var rsAstralRange = '\\ud800-\\udfff',          // all UTF-16 surrogate code units
    rsComboMarksRange = '\\u0300-\\u036f',      // combining diacritical marks
    rsComboHalfMarksRange = '\\ufe20-\\ufe2f',  // combining half marks
    rsComboSymbolsRange = '\\u20d0-\\u20ff',    // combining marks for symbols
    rsComboRange = rsComboMarksRange + rsComboHalfMarksRange + rsComboSymbolsRange,
    rsVarRange = '\\ufe0e\\ufe0f';              // variation selectors 15 and 16

/** Used to compose unicode capture groups. */
var rsAstral = '[' + rsAstralRange + ']',
    rsCombo = '[' + rsComboRange + ']',
    // U+1F3FB..U+1F3FF written as a surrogate pair (emoji skin-tone modifiers).
    rsFitz = '\\ud83c[\\udffb-\\udfff]',
    rsModifier = '(?:' + rsCombo + '|' + rsFitz + ')',
    rsNonAstral = '[^' + rsAstralRange + ']',
    // Two consecutive regional indicators (U+1F1E6..U+1F1FF), i.e. one flag.
    rsRegional = '(?:\\ud83c[\\udde6-\\uddff]){2}',
    rsSurrPair = '[\\ud800-\\udbff][\\udc00-\\udfff]',
    rsZWJ = '\\u200d';

/** Used to compose unicode regexes. */
var rsOptMod = rsModifier + '?',
    rsOptVar = '[' + rsVarRange + ']?',
    // Zero or more "ZWJ + symbol" continuations, each with its own optional
    // variation selector and modifier.
    rsOptJoin = '(?:' + rsZWJ + '(?:' + [rsNonAstral, rsRegional, rsSurrPair].join('|') + ')' + rsOptVar + rsOptMod + ')*',
    rsSeq = rsOptVar + rsOptMod + rsOptJoin,
    // Alternatives are tried in order; a lone surrogate (`rsAstral`) is the last resort.
    rsSymbol = '(?:' + [rsNonAstral + rsCombo + '?', rsCombo, rsRegional, rsSurrPair, rsAstral].join('|') + ')';

/**
 * Used to match [string symbols](https://mathiasbynens.be/notes/javascript-unicode).
 *
 * Compiled with the `g` flag, so `test`/`exec` advance `lastIndex` statefully.
 */
var reUnicode = RegExp(rsFitz + '(?=' + rsFitz + ')|' + rsSymbol + rsSeq, 'g');
|
||
|
|
||
|
/**
 * Gets the size of a Unicode `string`.
 *
 * The size is the number of successive `reUnicode` matches found in `string`.
 *
 * @private
 * @param {string} string The string to inspect.
 * @returns {number} Returns the string size.
 */
function unicodeSize(string) {
  // Rewind the regex first: `test` resumes from `lastIndex`, so a stale
  // position would make the scan start partway through `string`.
  reUnicode.lastIndex = 0;

  var result = 0;
  // Each successful `test` moves `lastIndex` past one match; the failing call
  // that ends the loop resets `lastIndex` to 0 again.
  while (reUnicode.test(string)) {
    ++result;
  }
  return result;
}
|
||
|
|
||
|
// Expose `unicodeSize` as the single value exported by this CommonJS module.
module.exports = unicodeSize;
|