218 lines
		
	
	
		
			7.0 KiB
		
	
	
	
		
			JavaScript
		
	
	
	
		
		
			
		
	
	
			218 lines
		
	
	
		
			7.0 KiB
		
	
	
	
		
			JavaScript
		
	
	
	
| 
								 | 
							
								"use strict";
							 | 
						|||
| 
								 | 
							
								Object.defineProperty(exports, "__esModule", { value: true });
							 | 
						|||
| 
								 | 
							
								exports.splitGraphemes = exports.GraphemeBreaker = exports.graphemeBreakAtIndex = exports.codePointToClass = exports.BREAK_ALLOWED = exports.BREAK_NOT_ALLOWED = exports.UnicodeTrie = exports.fromCodePoint = exports.toCodePoints = exports.classes = void 0;
							 | 
						|||
| 
								 | 
							
								var grapheme_break_trie_1 = require("./grapheme-break-trie");
							 | 
						|||
| 
								 | 
							
								var utrie_1 = require("utrie");
							 | 
						|||
| 
								 | 
							
								// Numeric ids for the grapheme break classes. The break rules in this
								// file compare these ids against the per-code-point values looked up
								// through codePointToClass.
								// --- generic classes ---
								var Other = 0;
								var Prepend = 1;
								// --- line terminators and controls ---
								var CR = 2;
								var LF = 3;
								var Control = 4;
								// --- combining / flag / spacing classes ---
								var Extend = 5;
								var Regional_Indicator = 6;
								var SpacingMark = 7;
								// --- Hangul syllable parts ---
								var L = 8;
								var V = 9;
								var T = 10;
								var LV = 11;
								var LVT = 12;
								// --- emoji sequence classes ---
								var ZWJ = 13;
								var Extended_Pictographic = 14;
								// NOTE(review): both Regional_Indicator (6) and RI (15) are declared, and
								// the flag-sequence rule in _graphemeBreakAtIndex tests RI only. Confirm
								// which id the trie data emits for regional indicator code points.
								var RI = 15;
							 | 
						|||
| 
								 | 
							
								exports.classes = {
							 | 
						|||
| 
								 | 
							
								    Other: Other,
							 | 
						|||
| 
								 | 
							
								    Prepend: Prepend,
							 | 
						|||
| 
								 | 
							
								    CR: CR,
							 | 
						|||
| 
								 | 
							
								    LF: LF,
							 | 
						|||
| 
								 | 
							
								    Control: Control,
							 | 
						|||
| 
								 | 
							
								    Extend: Extend,
							 | 
						|||
| 
								 | 
							
								    Regional_Indicator: Regional_Indicator,
							 | 
						|||
| 
								 | 
							
								    SpacingMark: SpacingMark,
							 | 
						|||
| 
								 | 
							
								    L: L,
							 | 
						|||
| 
								 | 
							
								    V: V,
							 | 
						|||
| 
								 | 
							
								    T: T,
							 | 
						|||
| 
								 | 
							
								    LV: LV,
							 | 
						|||
| 
								 | 
							
								    LVT: LVT,
							 | 
						|||
| 
								 | 
							
								    ZWJ: ZWJ,
							 | 
						|||
| 
								 | 
							
								    Extended_Pictographic: Extended_Pictographic,
							 | 
						|||
| 
								 | 
							
								    RI: RI,
							 | 
						|||
| 
								 | 
							
								};
							 | 
						|||
| 
								 | 
							
								/**
								 * Converts a string into an array of numeric code points.
								 *
								 * A high surrogate (0xD800-0xDBFF) followed by a low surrogate is merged
								 * into one supplementary code point. Every other code unit, including an
								 * unpaired surrogate, is emitted unchanged.
								 *
								 * @param {string} str - Text to decode.
								 * @returns {number[]} Code points in source order.
								 */
								var toCodePoints = function (str) {
								    var result = [];
								    var total = str.length;
								    var pos = 0;
								    while (pos < total) {
								        var unit = str.charCodeAt(pos);
								        pos += 1;
								        var isLeadSurrogate = unit >= 0xd800 && unit <= 0xdbff;
								        // Not a lead surrogate, or nothing follows it: emit as-is.
								        if (!isLeadSurrogate || pos >= total) {
								            result.push(unit);
								            continue;
								        }
								        var trail = str.charCodeAt(pos);
								        // Lead surrogate without a matching trail: emit the lead alone and
								        // let the next iteration re-read the following unit.
								        if ((trail & 0xfc00) !== 0xdc00) {
								            result.push(unit);
								            continue;
								        }
								        result.push(((unit & 0x3ff) << 10) + (trail & 0x3ff) + 0x10000);
								        pos += 1;
								    }
								    return result;
								};
							 | 
						|||
| 
								 | 
							
								exports.toCodePoints = toCodePoints;
							 | 
						|||
| 
								 | 
							
								/**
								 * Builds a string from the code points passed as arguments.
								 *
								 * Delegates to String.fromCodePoint when the runtime provides it.
								 * Otherwise the code points are encoded to UTF-16 code units by hand and
								 * flushed through String.fromCharCode in batches.
								 *
								 * @param {...number} codePoints - Code points to encode (variadic).
								 * @returns {string} The encoded string; '' when called with no arguments.
								 */
								var fromCodePoint = function () {
								    var codePoints = Array.prototype.slice.call(arguments);
								    if (String.fromCodePoint) {
								        return String.fromCodePoint.apply(String, codePoints);
								    }
								    var total = codePoints.length;
								    if (!total) {
								        return '';
								    }
								    var pending = [];
								    var output = '';
								    for (var position = 0; position < total; position++) {
								        var cp = codePoints[position];
								        if (cp <= 0xffff) {
								            pending.push(cp);
								        }
								        else {
								            // Supplementary plane: split into a surrogate pair.
								            var offset = cp - 0x10000;
								            pending.push((offset >> 10) + 0xd800, (offset % 0x400) + 0xdc00);
								        }
								        // Flush on the last code point or once the batch exceeds 0x4000
								        // units, so a single apply() call never receives more than that.
								        var isLast = position + 1 === total;
								        if (isLast || pending.length > 0x4000) {
								            output += String.fromCharCode.apply(String, pending);
								            pending.length = 0;
								        }
								    }
								    return output;
								};
							 | 
						|||
| 
								 | 
							
								exports.fromCodePoint = fromCodePoint;
							 | 
						|||
| 
								 | 
							
								exports.UnicodeTrie = utrie_1.createTrieFromBase64(grapheme_break_trie_1.base64, grapheme_break_trie_1.byteLength);
							 | 
						|||
| 
								 | 
							
								exports.BREAK_NOT_ALLOWED = '×';
							 | 
						|||
| 
								 | 
							
								exports.BREAK_ALLOWED = '÷';
							 | 
						|||
| 
								 | 
							
								/**
								 * Looks up the break-class value stored in exports.UnicodeTrie for a code point.
								 *
								 * @param {number} codePoint - Code point to classify.
								 * @returns {*} Whatever the trie's get() returns for that code point.
								 */
								var codePointToClass = function (codePoint) {
								    var trie = exports.UnicodeTrie;
								    return trie.get(codePoint);
								};
							 | 
						|||
| 
								 | 
							
								exports.codePointToClass = codePointToClass;
							 | 
						|||
| 
								 | 
							
								/**
								 * Decides whether a grapheme cluster boundary may fall between the
								 * elements at positions index - 1 and index, based only on their
								 * break classes (plus some lookback for the emoji and flag rules).
								 *
								 * @param {number[]} _codePoints - Unused; kept for the call signature.
								 * @param {number[]} classTypes - Break class of each code point.
								 * @param {number} index - Position of the element right after the candidate boundary.
								 * @returns {string} exports.BREAK_NOT_ALLOWED or exports.BREAK_ALLOWED.
								 */
								var _graphemeBreakAtIndex = function (_codePoints, classTypes, index) {
								    var before = classTypes[index - 1];
								    var after = classTypes[index];
								    var isHardBreak = function (cls) {
								        return cls === CR || cls === LF || cls === Control;
								    };
								    // GB3: keep CR LF together.
								    if (before === CR && after === LF) {
								        return exports.BREAK_NOT_ALLOWED;
								    }
								    // GB4 / GB5: otherwise always break after and before CR, LF, Control.
								    if (isHardBreak(before) || isHardBreak(after)) {
								        return exports.BREAK_ALLOWED;
								    }
								    // GB6: L x (L | V | LV | LVT) - Hangul syllable sequences.
								    if (before === L && (after === L || after === V || after === LV || after === LVT)) {
								        return exports.BREAK_NOT_ALLOWED;
								    }
								    // GB7: (LV | V) x (V | T)
								    if ((before === LV || before === V) && (after === V || after === T)) {
								        return exports.BREAK_NOT_ALLOWED;
								    }
								    // GB8: (LVT | T) x T
								    if ((before === LVT || before === T) && after === T) {
								        return exports.BREAK_NOT_ALLOWED;
								    }
								    // GB9 / GB9a / GB9b: no break before Extend, ZWJ or SpacingMark,
								    // nor after Prepend.
								    if (after === ZWJ || after === Extend || after === SpacingMark || before === Prepend) {
								        return exports.BREAK_NOT_ALLOWED;
								    }
								    // GB11: Extended_Pictographic Extend* ZWJ x Extended_Pictographic.
								    if (before === ZWJ && after === Extended_Pictographic) {
								        var cursor = index - 2;
								        // Skip any run of Extend sitting between the pictograph and the ZWJ.
								        while (classTypes[cursor] === Extend) {
								            cursor--;
								        }
								        if (classTypes[cursor] === Extended_Pictographic) {
								            return exports.BREAK_NOT_ALLOWED;
								        }
								    }
								    // GB12 / GB13: do not split a pair of RI symbols. Count the RIs that
								    // precede `before`; an even count means `before` opens a new pair.
								    if (before === RI && after === RI) {
								        var precedingRI = 0;
								        for (var k = index - 2; classTypes[k] === RI; k--) {
								            precedingRI++;
								        }
								        if (precedingRI % 2 === 0) {
								            return exports.BREAK_NOT_ALLOWED;
								        }
								    }
								    // Everything else: break allowed.
								    return exports.BREAK_ALLOWED;
								};
							 | 
						|||
| 
								 | 
							
								/**
								 * Reports whether a grapheme boundary is allowed before position `index`
								 * of a code point array.
								 *
								 * @param {number[]} codePoints - Code points of the text.
								 * @param {number} index - Candidate boundary position.
								 * @returns {string} exports.BREAK_ALLOWED or exports.BREAK_NOT_ALLOWED.
								 */
								var graphemeBreakAtIndex = function (codePoints, index) {
								    // GB1 / GB2: the start of text and anything at or past the end
								    // always allow a break.
								    var atTextEdge = index === 0 || index >= codePoints.length;
								    if (atTextEdge) {
								        return exports.BREAK_ALLOWED;
								    }
								    // Classify every code point, then defer to the rule engine.
								    return _graphemeBreakAtIndex(codePoints, codePoints.map(exports.codePointToClass), index);
								};
							 | 
						|||
| 
								 | 
							
								exports.graphemeBreakAtIndex = graphemeBreakAtIndex;
							 | 
						|||
| 
								 | 
							
								/**
								 * Creates an iterator-like object that yields the grapheme clusters of
								 * `str` one at a time.
								 *
								 * The string is decoded to code points and classified once up front; each
								 * next() call then scans forward to the next allowed boundary.
								 *
								 * @param {string} str - Text to segment.
								 * @returns {{next: function(): {value: (string|null), done: boolean}}}
								 *   Object whose next() returns { value: cluster, done: false } for each
								 *   cluster and { done: true, value: null } once the text is exhausted.
								 */
								var GraphemeBreaker = function (str) {
								    var codePoints = exports.toCodePoints(str);
								    var length = codePoints.length;
								    var index = 0;
								    var lastEnd = 0;
								    var classTypes = codePoints.map(exports.codePointToClass);
								    return {
								        next: function () {
								            if (index >= length) {
								                return { done: true, value: null };
								            }
								            // Advance at least one code point, then keep going while the
								            // rules forbid a break and input remains. The guard above
								            // guarantees index < length on entry, so do/while is safe.
								            var graphemeBreak;
								            do {
								                index += 1;
								                graphemeBreak = _graphemeBreakAtIndex(codePoints, classTypes, index);
								            } while (index < length && graphemeBreak === exports.BREAK_NOT_ALLOWED);
								            // The loop only exits on an allowed break or at the end of the
								            // text, so a cluster is always available here. The former
								            // fallthrough return and the empty loop after it were unreachable.
								            var value = exports.fromCodePoint.apply(null, codePoints.slice(lastEnd, index));
								            lastEnd = index;
								            return { value: value, done: false };
								        },
								    };
								};
							 | 
						|||
| 
								 | 
							
								exports.GraphemeBreaker = GraphemeBreaker;
							 | 
						|||
| 
								 | 
							
								/**
								 * Splits a string into an array of grapheme clusters by draining a
								 * GraphemeBreaker.
								 *
								 * @param {string} str - Text to segment.
								 * @returns {string[]} Clusters in order; falsy values from the breaker are skipped.
								 */
								var splitGraphemes = function (str) {
								    var graphemes = [];
								    var breaker = exports.GraphemeBreaker(str);
								    for (var step = breaker.next(); !step.done; step = breaker.next()) {
								        if (step.value) {
								            graphemes.push(step.value.slice());
								        }
								    }
								    return graphemes;
								};
							 | 
						|||
| 
								 | 
							
								exports.splitGraphemes = splitGraphemes;
							 | 
						|||
| 
								 | 
							
								//# sourceMappingURL=GraphemeBreak.js.map
							 |