218 lines
		
	
	
		
			7.0 KiB
		
	
	
	
		
			JavaScript
		
	
	
	
		
		
			
		
	
	
			218 lines
		
	
	
		
			7.0 KiB
		
	
	
	
		
			JavaScript
		
	
	
	
|  | "use strict"; | |||
|  | Object.defineProperty(exports, "__esModule", { value: true }); | |||
|  | exports.splitGraphemes = exports.GraphemeBreaker = exports.graphemeBreakAtIndex = exports.codePointToClass = exports.BREAK_ALLOWED = exports.BREAK_NOT_ALLOWED = exports.UnicodeTrie = exports.fromCodePoint = exports.toCodePoints = exports.classes = void 0; | |||
|  | var grapheme_break_trie_1 = require("./grapheme-break-trie"); | |||
|  | var utrie_1 = require("utrie"); | |||
|  | var Other = 0; | |||
|  | var Prepend = 1; | |||
|  | var CR = 2; | |||
|  | var LF = 3; | |||
|  | var Control = 4; | |||
|  | var Extend = 5; | |||
|  | var Regional_Indicator = 6; | |||
|  | var SpacingMark = 7; | |||
|  | var L = 8; | |||
|  | var V = 9; | |||
|  | var T = 10; | |||
|  | var LV = 11; | |||
|  | var LVT = 12; | |||
|  | var ZWJ = 13; | |||
|  | var Extended_Pictographic = 14; | |||
|  | var RI = 15; | |||
|  | exports.classes = { | |||
|  |     Other: Other, | |||
|  |     Prepend: Prepend, | |||
|  |     CR: CR, | |||
|  |     LF: LF, | |||
|  |     Control: Control, | |||
|  |     Extend: Extend, | |||
|  |     Regional_Indicator: Regional_Indicator, | |||
|  |     SpacingMark: SpacingMark, | |||
|  |     L: L, | |||
|  |     V: V, | |||
|  |     T: T, | |||
|  |     LV: LV, | |||
|  |     LVT: LVT, | |||
|  |     ZWJ: ZWJ, | |||
|  |     Extended_Pictographic: Extended_Pictographic, | |||
|  |     RI: RI, | |||
|  | }; | |||
/**
 * Decodes a string into an array of Unicode code points.
 *
 * A high surrogate immediately followed by a low surrogate is combined into
 * one supplementary code point. Any other UTF-16 code unit, including an
 * unpaired surrogate, is emitted unchanged.
 *
 * @param {string} str - Text to decode.
 * @returns {number[]} Code points in string order.
 */
var toCodePoints = function (str) {
    var decoded = [];
    var total = str.length;
    for (var pos = 0; pos < total; pos++) {
        var unit = str.charCodeAt(pos);
        var isHighSurrogate = unit >= 0xd800 && unit <= 0xdbff;
        if (isHighSurrogate && pos + 1 < total) {
            var trail = str.charCodeAt(pos + 1);
            if ((trail & 0xfc00) === 0xdc00) {
                // Valid pair: merge both halves and consume the low surrogate too.
                decoded.push(((unit & 0x3ff) << 10) + (trail & 0x3ff) + 0x10000);
                pos++;
                continue;
            }
        }
        // BMP character or unpaired surrogate: keep the code unit as is.
        decoded.push(unit);
    }
    return decoded;
};
|  | exports.toCodePoints = toCodePoints; | |||
/**
 * Builds a string from the code points passed as individual arguments.
 *
 * Delegates to the native `String.fromCodePoint` when the runtime has it.
 * Otherwise each code point is encoded to UTF-16 by hand and the string is
 * assembled in chunks via `String.fromCharCode`.
 *
 * @param {...number} codePoints - Code points to encode.
 * @returns {string} The encoded string ('' when called without arguments).
 */
var fromCodePoint = function () {
    var codePoints = [];
    var argIndex = 0;
    while (argIndex < arguments.length) {
        codePoints[argIndex] = arguments[argIndex];
        argIndex++;
    }
    if (String.fromCodePoint) {
        return String.fromCodePoint.apply(String, codePoints);
    }
    var total = codePoints.length;
    if (!total) {
        return '';
    }
    var pending = [];
    var output = '';
    for (var position = 0; position < total; position++) {
        var codePoint = codePoints[position];
        if (codePoint <= 0xffff) {
            pending.push(codePoint);
        }
        else {
            // Supplementary plane: split into a high/low surrogate pair.
            codePoint -= 0x10000;
            pending.push((codePoint >> 10) + 0xd800, (codePoint % 0x400) + 0xdc00);
        }
        // Flush on the last code point, or once the buffer grows large, so the
        // argument list handed to fromCharCode stays bounded.
        var isLast = position + 1 === total;
        if (isLast || pending.length > 0x4000) {
            output += String.fromCharCode.apply(String, pending);
            pending.length = 0;
        }
    }
    return output;
};
|  | exports.fromCodePoint = fromCodePoint; | |||
|  | exports.UnicodeTrie = utrie_1.createTrieFromBase64(grapheme_break_trie_1.base64, grapheme_break_trie_1.byteLength); | |||
|  | exports.BREAK_NOT_ALLOWED = '×'; | |||
|  | exports.BREAK_ALLOWED = '÷'; | |||
|  | var codePointToClass = function (codePoint) { return exports.UnicodeTrie.get(codePoint); }; | |||
|  | exports.codePointToClass = codePointToClass; | |||
/**
 * Decides whether a grapheme cluster boundary is allowed immediately before
 * position `index`, i.e. between `classTypes[index - 1]` and
 * `classTypes[index]`.
 *
 * The rules are evaluated in order and the first match wins.
 *
 * @param {number[]} _codePoints - Unused; kept for signature compatibility.
 * @param {number[]} classTypes - Break class of every code point.
 * @param {number} index - Position of the candidate boundary.
 * @returns {string} `exports.BREAK_NOT_ALLOWED` or `exports.BREAK_ALLOWED`.
 */
var _graphemeBreakAtIndex = function (_codePoints, classTypes, index) {
    var scanIndex = index - 2;
    var earlier = classTypes[scanIndex];
    var left = classTypes[index - 1];
    var right = classTypes[index];
    // GB3: do not break between a CR and LF.
    if (left === CR && right === LF) {
        return exports.BREAK_NOT_ALLOWED;
    }
    // GB4 / GB5: otherwise, break after and before controls.
    var leftIsControl = left === CR || left === LF || left === Control;
    var rightIsControl = right === CR || right === LF || right === Control;
    if (leftIsControl || rightIsControl) {
        return exports.BREAK_ALLOWED;
    }
    // GB6 - GB8: do not break Hangul syllable sequences.
    switch (left) {
        case L: // GB6
            if (right === L || right === V || right === LV || right === LVT) {
                return exports.BREAK_NOT_ALLOWED;
            }
            break;
        case LV: // GB7
        case V:
            if (right === V || right === T) {
                return exports.BREAK_NOT_ALLOWED;
            }
            break;
        case LVT: // GB8
        case T:
            if (right === T) {
                return exports.BREAK_NOT_ALLOWED;
            }
            break;
    }
    // GB9 / GB9a: do not break before extending characters, ZWJ or SpacingMarks.
    if (right === ZWJ || right === Extend || right === SpacingMark) {
        return exports.BREAK_NOT_ALLOWED;
    }
    // GB9b: do not break after Prepend characters.
    if (left === Prepend) {
        return exports.BREAK_NOT_ALLOWED;
    }
    // GB11: do not break within emoji modifier sequences or emoji zwj sequences.
    if (left === ZWJ && right === Extended_Pictographic) {
        // Skip any Extend classes sitting between the pictograph and the ZWJ.
        while (earlier === Extend) {
            scanIndex -= 1;
            earlier = classTypes[scanIndex];
        }
        if (earlier === Extended_Pictographic) {
            return exports.BREAK_NOT_ALLOWED;
        }
    }
    // GB12 / GB13: do not break within emoji flag sequences. Regional
    // indicators pair up from the start of their run, so the two sides stay
    // together only when an even number of RIs precedes the left one.
    if (left === RI && right === RI) {
        var precedingRI = 0;
        for (; earlier === RI; earlier = classTypes[--scanIndex]) {
            precedingRI++;
        }
        if (precedingRI % 2 === 0) {
            return exports.BREAK_NOT_ALLOWED;
        }
    }
    // Otherwise a break is allowed.
    return exports.BREAK_ALLOWED;
};
/**
 * Reports whether a grapheme cluster break is allowed before position
 * `index` of a code point sequence.
 *
 * @param {number[]} codePoints - The text as code points.
 * @param {number} index - Candidate boundary position.
 * @returns {string} `exports.BREAK_ALLOWED` or `exports.BREAK_NOT_ALLOWED`.
 */
var graphemeBreakAtIndex = function (codePoints, index) {
    // GB1 / GB2: always break at the start and at (or past) the end of text.
    var atTextEdge = index === 0 || index >= codePoints.length;
    if (atTextEdge) {
        return exports.BREAK_ALLOWED;
    }
    // Classify every code point, then apply the pairwise rules at `index`.
    var breakClasses = codePoints.map(exports.codePointToClass);
    return _graphemeBreakAtIndex(codePoints, breakClasses, index);
};
|  | exports.graphemeBreakAtIndex = graphemeBreakAtIndex; | |||
/**
 * Creates a pull-style iterator over the grapheme clusters of `str`.
 *
 * The string is decoded to code points and classified once up front. Each
 * call to `next()` then advances to the next allowed break and returns the
 * text between the previous break and that one.
 *
 * @param {string} str - Text to segment.
 * @returns {{next: function(): {value: (string|null), done: boolean}}}
 *     An object whose `next()` yields `{ value: cluster, done: false }` per
 *     cluster and `{ value: null, done: true }` once the text is exhausted.
 */
var GraphemeBreaker = function (str) {
    var codePoints = exports.toCodePoints(str);
    var length = codePoints.length;
    var index = 0;
    var lastEnd = 0;
    var classTypes = codePoints.map(exports.codePointToClass);
    return {
        next: function () {
            if (index >= length) {
                return { done: true, value: null };
            }
            var graphemeBreak = exports.BREAK_NOT_ALLOWED;
            // Advance one code point at a time until a break is allowed or the
            // end of the text is reached. The loop body is intentionally empty:
            // all the work happens in the condition.
            while (index < length &&
                (graphemeBreak = _graphemeBreakAtIndex(codePoints, classTypes, ++index)) === exports.BREAK_NOT_ALLOWED) { }
            if (graphemeBreak !== exports.BREAK_NOT_ALLOWED || index === length) {
                var value = exports.fromCodePoint.apply(null, codePoints.slice(lastEnd, index));
                lastEnd = index;
                return { value: value, done: false };
            }
            // Defensive fallback; the unreachable statements that used to follow
            // this return (an empty loop and a duplicate return) were removed.
            return { done: true, value: null };
        },
    };
};
|  | exports.GraphemeBreaker = GraphemeBreaker; | |||
/**
 * Splits a string into an array of grapheme clusters.
 *
 * Drains the iterator returned by `exports.GraphemeBreaker` and collects
 * every non-empty value it yields.
 *
 * @param {string} str - Text to split.
 * @returns {string[]} The clusters in order; empty when nothing is yielded.
 */
var splitGraphemes = function (str) {
    var iterator = exports.GraphemeBreaker(str);
    var clusters = [];
    for (var step = iterator.next(); !step.done; step = iterator.next()) {
        if (step.value) {
            clusters.push(step.value.slice());
        }
    }
    return clusters;
};
|  | exports.splitGraphemes = splitGraphemes; | |||
|  | //# sourceMappingURL=GraphemeBreak.js.map
 |