diff --git a/.editorconfig b/.editorconfig new file mode 100644 index 0000000..883576d --- /dev/null +++ b/.editorconfig @@ -0,0 +1,10 @@ + +root = true + +[*] +charset = utf-8 +end_of_line = lf +indent_size = 2 +indent_style = space +insert_final_newline = true +trim_trailing_whitespace = true diff --git a/.gitignore b/.gitignore new file mode 100644 index 0000000..046c61c --- /dev/null +++ b/.gitignore @@ -0,0 +1,15 @@ +*~ +*.err +*.log +._* +.cache +.fseventsd +.DocumentRevisions* +.DS_Store +.TemporaryItems +.Trashes +Thumbs.db + +dist +node_modules +package-lock.json diff --git a/license b/license new file mode 100644 index 0000000..815da7d --- /dev/null +++ b/license @@ -0,0 +1,21 @@ +The MIT License (MIT) + +Copyright (c) 2024-present Fabio Spampinato + +Permission is hereby granted, free of charge, to any person obtaining a +copy of this software and associated documentation files (the "Software"), +to deal in the Software without restriction, including without limitation +the rights to use, copy, modify, merge, publish, distribute, sublicense, +and/or sell copies of the Software, and to permit persons to whom the +Software is furnished to do so, subject to the following conditions: + +The above copyright notice and this permission notice shall be included in +all copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR +IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, +FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE +AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER +LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING +FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER +DEALINGS IN THE SOFTWARE. diff --git a/package.json b/package.json new file mode 100644 index 0000000..6f54a80 --- /dev/null +++ b/package.json @@ -0,0 +1,34 @@ +{ + "name": "fast-string-truncated-width", + "repository": "github:fabiospampinato/fast-string-truncated-width", + "description": "A fast function for calculating where a string should be truncated, given an optional width limit and an ellipsis string.", + "version": "1.0.4", + "type": "module", + "main": "dist/index.js", + "exports": "./dist/index.js", + "types": "./dist/index.d.ts", + "scripts": { + "benchmark": "tsex benchmark", + "benchmark:watch": "tsex benchmark --watch", + "clean": "tsex clean", + "compile": "tsex compile", + "compile:watch": "tsex compile --watch", + "test": "tsex test", + "test:watch": "tsex test --watch", + "prepublishOnly": "tsex prepare" + }, + "keywords": [ + "fast", + "string", + "truncated", + "width", + "cli", + "terminal" + ], + "devDependencies": { + "benchloop": "^2.1.1", + "fava": "^0.3.2", + "tsex": "^3.0.2", + "typescript": "^5.3.3" + } +} diff --git a/readme.md b/readme.md new file mode 100644 index 0000000..405119b --- /dev/null +++ b/readme.md @@ -0,0 +1,39 @@ +# Fast String Truncated Width + +A fast function for calculating where a string should be truncated, given a width limit and an ellipsis string. + +This is a low-level function that basically calculates the visual width of a string and the index at which it should be truncated once printed to the terminal, but taking into account an optional width limit and an optional ellipsis string, so that the string doesn't have to be processed multiple times to be truncated, and how long the part after the truncation point is doesn't cost us anything because we can just ignore it. + +## Install + +```sh +npm install --save fast-string-truncated-width +``` + +## Usage + +```ts +import fastStringTruncatedWidth from 'fast-string-truncated-width'; + +// Retrieving the result for a string that fits within our width limit + +const result1 = fastStringTruncatedWidth ( '\x1b[31mhello', { limit: Infinity, ellipsis: '…' } ); + +result1.truncated; // => false, the string fits within the width limit, it doesn't have to be truncated +result1.ellipsed; // => false, the ellipsis string doesn't need to be appended to the string +result1.width; // => 5, the visual width of the string once printed to the terminal +result1.index; // => 10, the end index at which the string should be sliced, equal to input.length in this case + +// Retrieving the result for a string that doesn't fit within our width limit + +const result2 = fastStringTruncatedWidth ( '\x1b[31mhello', { limit: 3, ellipsis: '…' } ); + +result2.truncated; // => true, the string doesn't fit within the width limit, it has to be truncated +result2.ellipsed; // => true, the ellipsis string should be appended to the string (this isn't always the case, for example if our limit is 0) +result2.width; // => 2, the visual width of the string once printed to the terminal (this doesn't account for the width of the ellipsis string itself) +result2.index; // => 7, the end index at which the string should be sliced to truncate it correctly +``` + +## License + +MIT Β© Fabio Spampinato diff --git a/src/index.ts b/src/index.ts new file mode 100644 index 0000000..3658358 --- /dev/null +++ b/src/index.ts @@ -0,0 +1,222 @@ + +/* IMPORT */ + +import {isAmbiguous, isFullWidth, isWide} from './utils'; +import type {TruncationOptions, WidthOptions, Result} from './types'; + +/* HELPERS */ + +const ANSI_RE = /[\u001b\u009b][[()#;?]*(?:[0-9]{1,4}(?:;[0-9]{0,4})*)?[0-9A-ORZcf-nqry=><]/y; +const CONTROL_RE = /[\x00-\x1F\x7F-\x9F]+/y; +const EMOJI_RE = /(?:\p{Emoji_Modifier_Base}\p{Emoji_Modifier}?|\p{Emoji_Presentation}|\p{Emoji}\uFE0F)(?:\u200d(?:\p{Emoji_Modifier_Base}\p{Emoji_Modifier}?|\p{Emoji_Presentation}|\p{Emoji}\uFE0F))*/yu; +const LATIN_RE = /[\x20-\x7E\xA0-\xFF]+/y; +const MODIFIER_RE = /\p{M}+/gu; +const NO_TRUNCATION: TruncationOptions = { limit: Infinity, ellipsis: '' }; + +/* MAIN */ + +//TODO: Optimize matching non-latin letters + +const getStringTruncatedWidth = ( input: string, truncationOptions: TruncationOptions = {}, widthOptions: WidthOptions = {} ): Result => { + + /* CONSTANTS */ + + const LIMIT = truncationOptions.limit ?? Infinity; + const ELLIPSIS = truncationOptions.ellipsis ?? ''; + const ELLIPSIS_WIDTH = ELLIPSIS ? getStringTruncatedWidth ( ELLIPSIS, NO_TRUNCATION, widthOptions ).width : 0; + + const ANSI_WIDTH = widthOptions.ansiWidth ?? 0; + const CONTROL_WIDTH = widthOptions.controlWidth ?? 0; + + const AMBIGUOUS_WIDTH = widthOptions.ambiguousWidth ?? 1; + const EMOJI_WIDTH = widthOptions.emojiWidth ?? 2; + const FULL_WIDTH_WIDTH = widthOptions.fullWidthWidth ?? 2; + const REGULAR_WIDTH = widthOptions.regularWidth ?? 1; + const WIDE_WIDTH = widthOptions.wideWidth ?? 2; + + /* STATE */ + + let indexPrev = 0; + let index = 0; + let length = input.length; + let lengthExtra = 0; + let truncationEnabled = false; + let truncationIndex = length; + let truncationLimit = Math.max ( 0, LIMIT - ELLIPSIS_WIDTH ); + let unmatchedStart = 0; + let unmatchedEnd = 0; + let width = 0; + let widthExtra = 0; + + /* PARSE LOOP */ + + outer: + while ( true ) { + + /* UNMATCHED */ + + if ( ( unmatchedEnd > unmatchedStart ) || ( index >= length && index > indexPrev ) ) { + + const unmatched = input.slice ( unmatchedStart, unmatchedEnd ) || input.slice ( indexPrev, index ); + + lengthExtra = 0; + + for ( const char of unmatched.replaceAll ( MODIFIER_RE, '' ) ) { + + const codePoint = char.codePointAt ( 0 ) || 0; + + if ( isFullWidth ( codePoint ) ) { + widthExtra = FULL_WIDTH_WIDTH; + } else if ( isWide ( codePoint ) ) { + widthExtra = WIDE_WIDTH; + } else if ( AMBIGUOUS_WIDTH !== REGULAR_WIDTH && isAmbiguous ( codePoint ) ) { + widthExtra = AMBIGUOUS_WIDTH; + } else { + widthExtra = REGULAR_WIDTH; + } + + if ( ( width + widthExtra ) > truncationLimit ) { + truncationIndex = Math.min ( truncationIndex, Math.max ( unmatchedStart, indexPrev ) + lengthExtra ); + } + + if ( ( width + widthExtra ) > LIMIT ) { + truncationEnabled = true; + break outer; + } + + lengthExtra += char.length; + width += widthExtra; + + } + + unmatchedStart = unmatchedEnd = 0; + + } + + /* EXITING */ + + if ( index >= length ) break; + + /* LATIN */ + + LATIN_RE.lastIndex = index; + + if ( LATIN_RE.test ( input ) ) { + + lengthExtra = LATIN_RE.lastIndex - index; + widthExtra = lengthExtra * REGULAR_WIDTH; + + if ( ( width + widthExtra ) > truncationLimit ) { + truncationIndex = Math.min ( truncationIndex, index + Math.floor ( ( truncationLimit - width ) / REGULAR_WIDTH ) ); + } + + if ( ( width + widthExtra ) > LIMIT ) { + truncationEnabled = true; + break; + } + + width += widthExtra; + unmatchedStart = indexPrev; + unmatchedEnd = index; + index = indexPrev = LATIN_RE.lastIndex; + + continue; + + } + + /* ANSI */ + + ANSI_RE.lastIndex = index; + + if ( ANSI_RE.test ( input ) ) { + + if ( ( width + ANSI_WIDTH ) > truncationLimit ) { + truncationIndex = Math.min ( truncationIndex, index ); + } + + if ( ( width + ANSI_WIDTH ) > LIMIT ) { + truncationEnabled = true; + break; + } + + width += ANSI_WIDTH; + unmatchedStart = indexPrev; + unmatchedEnd = index; + index = indexPrev = ANSI_RE.lastIndex; + + continue; + + } + + /* CONTROL */ + + CONTROL_RE.lastIndex = index; + + if ( CONTROL_RE.test ( input ) ) { + + lengthExtra = CONTROL_RE.lastIndex - index; + widthExtra = lengthExtra * CONTROL_WIDTH; + + if ( ( width + widthExtra ) > truncationLimit ) { + truncationIndex = Math.min ( truncationIndex, index + Math.floor ( ( truncationLimit - width ) / CONTROL_WIDTH ) ); + } + + if ( ( width + widthExtra ) > LIMIT ) { + truncationEnabled = true; + break; + } + + width += widthExtra; + unmatchedStart = indexPrev; + unmatchedEnd = index; + index = indexPrev = CONTROL_RE.lastIndex; + + continue; + + } + + /* EMOJI */ + + EMOJI_RE.lastIndex = index; + + if ( EMOJI_RE.test ( input ) ) { + + if ( ( width + EMOJI_WIDTH ) > truncationLimit ) { + truncationIndex = Math.min ( truncationIndex, index ); + } + + if ( ( width + EMOJI_WIDTH ) > LIMIT ) { + truncationEnabled = true; + break; + } + + width += EMOJI_WIDTH; + unmatchedStart = indexPrev; + unmatchedEnd = index; + index = indexPrev = EMOJI_RE.lastIndex; + + continue; + + } + + /* UNMATCHED INDEX */ + + index += 1; + + } + + /* RETURN */ + + return { + width: truncationEnabled ? truncationLimit : width, + index: truncationEnabled ? truncationIndex : length, + truncated: truncationEnabled, + ellipsed: truncationEnabled && LIMIT >= ELLIPSIS_WIDTH + }; + +}; + +/* EXPORT */ + +export default getStringTruncatedWidth; +export type {TruncationOptions, WidthOptions, Result}; diff --git a/src/types.ts b/src/types.ts new file mode 100644 index 0000000..32f0bd8 --- /dev/null +++ b/src/types.ts @@ -0,0 +1,30 @@ + +/* MAIN */ + +type TruncationOptions = { + limit?: number, + ellipsis?: string +}; + +type WidthOptions = { + /* SPECIAL */ + ansiWidth?: number, + controlWidth?: number, + /* UNICODE */ + ambiguousWidth?: number, + emojiWidth?: number, + fullWidthWidth?: number, + regularWidth?: number, + wideWidth?: number +}; + +type Result = { + width: number, + index: number, + truncated: boolean, + ellipsed: boolean +}; + +/* EXPORT */ + +export type {TruncationOptions, WidthOptions, Result}; diff --git a/src/utils.ts b/src/utils.ts new file mode 100644 index 0000000..dad92dc --- /dev/null +++ b/src/utils.ts @@ -0,0 +1,29 @@ + +/* MAIN */ + +//URL: https://github.com/sindresorhus/get-east-asian-width/blob/main/lookup.js +//LICENSE: https://github.com/sindresorhus/get-east-asian-width/blob/main/license + +//TODO: Replace these with some unicode property classes, if the ones we need exist + +const isAmbiguous = ( x: number ): boolean => { + + return x === 0xA1 || x === 0xA4 || x === 0xA7 || x === 0xA8 || x === 0xAA || x === 0xAD || x === 0xAE || x >= 0xB0 && x <= 0xB4 || x >= 0xB6 && x <= 0xBA || x >= 0xBC && x <= 0xBF || x === 0xC6 || x === 0xD0 || x === 0xD7 || x === 0xD8 || x >= 0xDE && x <= 0xE1 || x === 0xE6 || x >= 0xE8 && x <= 0xEA || x === 0xEC || x === 0xED || x === 0xF0 || x === 0xF2 || x === 0xF3 || x >= 0xF7 && x <= 0xFA || x === 0xFC || x === 0xFE || x === 0x101 || x === 0x111 || x === 0x113 || x === 0x11B || x === 0x126 || x === 0x127 || x === 0x12B || x >= 0x131 && x <= 0x133 || x === 0x138 || x >= 0x13F && x <= 0x142 || x === 0x144 || x >= 0x148 && x <= 0x14B || x === 0x14D || x === 0x152 || x === 0x153 || x === 0x166 || x === 0x167 || x === 0x16B || x === 0x1CE || x === 0x1D0 || x === 0x1D2 || x === 0x1D4 || x === 0x1D6 || x === 0x1D8 || x === 0x1DA || x === 0x1DC || x === 0x251 || x === 0x261 || x === 0x2C4 || x === 0x2C7 || x >= 0x2C9 && x <= 0x2CB || x === 0x2CD || x === 0x2D0 || x >= 0x2D8 && x <= 0x2DB || x === 0x2DD || x === 0x2DF || x >= 0x300 && x <= 0x36F || x >= 0x391 && x <= 0x3A1 || x >= 0x3A3 && x <= 0x3A9 || x >= 0x3B1 && x <= 0x3C1 || x >= 0x3C3 && x <= 0x3C9 || x === 0x401 || x >= 0x410 && x <= 0x44F || x === 0x451 || x === 0x2010 || x >= 0x2013 && x <= 0x2016 || x === 0x2018 || x === 0x2019 || x === 0x201C || x === 0x201D || x >= 0x2020 && x <= 0x2022 || x >= 0x2024 && x <= 0x2027 || x === 0x2030 || x === 0x2032 || x === 0x2033 || x === 0x2035 || x === 0x203B || x === 0x203E || x === 0x2074 || x === 0x207F || x >= 0x2081 && x <= 0x2084 || x === 0x20AC || x === 0x2103 || x === 0x2105 || x === 0x2109 || x === 0x2113 || x === 0x2116 || x === 0x2121 || x === 0x2122 || x === 0x2126 || x === 0x212B || x === 0x2153 || x === 0x2154 || x >= 0x215B && x <= 0x215E || x >= 0x2160 && x <= 0x216B || x >= 0x2170 && x <= 0x2179 || x === 0x2189 || x >= 0x2190 && x <= 0x2199 || x === 0x21B8 || x === 0x21B9 || x === 0x21D2 || x === 0x21D4 || x === 0x21E7 || x === 0x2200 || x === 0x2202 || x === 0x2203 || x === 0x2207 || x === 0x2208 || x === 0x220B || x === 0x220F || x === 0x2211 || x === 0x2215 || x === 0x221A || x >= 0x221D && x <= 0x2220 || x === 0x2223 || x === 0x2225 || x >= 0x2227 && x <= 0x222C || x === 0x222E || x >= 0x2234 && x <= 0x2237 || x === 0x223C || x === 0x223D || x === 0x2248 || x === 0x224C || x === 0x2252 || x === 0x2260 || x === 0x2261 || x >= 0x2264 && x <= 0x2267 || x === 0x226A || x === 0x226B || x === 0x226E || x === 0x226F || x === 0x2282 || x === 0x2283 || x === 0x2286 || x === 0x2287 || x === 0x2295 || x === 0x2299 || x === 0x22A5 || x === 0x22BF || x === 0x2312 || x >= 0x2460 && x <= 0x24E9 || x >= 0x24EB && x <= 0x254B || x >= 0x2550 && x <= 0x2573 || x >= 0x2580 && x <= 0x258F || x >= 0x2592 && x <= 0x2595 || x === 0x25A0 || x === 0x25A1 || x >= 0x25A3 && x <= 0x25A9 || x === 0x25B2 || x === 0x25B3 || x === 0x25B6 || x === 0x25B7 || x === 0x25BC || x === 0x25BD || x === 0x25C0 || x === 0x25C1 || x >= 0x25C6 && x <= 0x25C8 || x === 0x25CB || x >= 0x25CE && x <= 0x25D1 || x >= 0x25E2 && x <= 0x25E5 || x === 0x25EF || x === 0x2605 || x === 0x2606 || x === 0x2609 || x === 0x260E || x === 0x260F || x === 0x261C || x === 0x261E || x === 0x2640 || x === 0x2642 || x === 0x2660 || x === 0x2661 || x >= 0x2663 && x <= 0x2665 || x >= 0x2667 && x <= 0x266A || x === 0x266C || x === 0x266D || x === 0x266F || x === 0x269E || x === 0x269F || x === 0x26BF || x >= 0x26C6 && x <= 0x26CD || x >= 0x26CF && x <= 0x26D3 || x >= 0x26D5 && x <= 0x26E1 || x === 0x26E3 || x === 0x26E8 || x === 0x26E9 || x >= 0x26EB && x <= 0x26F1 || x === 0x26F4 || x >= 0x26F6 && x <= 0x26F9 || x === 0x26FB || x === 0x26FC || x === 0x26FE || x === 0x26FF || x === 0x273D || x >= 0x2776 && x <= 0x277F || x >= 0x2B56 && x <= 0x2B59 || x >= 0x3248 && x <= 0x324F || x >= 0xE000 && x <= 0xF8FF || x >= 0xFE00 && x <= 0xFE0F || x === 0xFFFD || x >= 0x1F100 && x <= 0x1F10A || x >= 0x1F110 && x <= 0x1F12D || x >= 0x1F130 && x <= 0x1F169 || x >= 0x1F170 && x <= 0x1F18D || x === 0x1F18F || x === 0x1F190 || x >= 0x1F19B && x <= 0x1F1AC || x >= 0xE0100 && x <= 0xE01EF || x >= 0xF0000 && x <= 0xFFFFD || x >= 0x100000 && x <= 0x10FFFD; + +}; + +const isFullWidth = ( x: number ): boolean => { + + return x === 0x3000 || x >= 0xFF01 && x <= 0xFF60 || x >= 0xFFE0 && x <= 0xFFE6; + +}; + +const isWide = ( x: number ): boolean => { + + return x >= 0x1100 && x <= 0x115F || x === 0x231A || x === 0x231B || x === 0x2329 || x === 0x232A || x >= 0x23E9 && x <= 0x23EC || x === 0x23F0 || x === 0x23F3 || x === 0x25FD || x === 0x25FE || x === 0x2614 || x === 0x2615 || x >= 0x2648 && x <= 0x2653 || x === 0x267F || x === 0x2693 || x === 0x26A1 || x === 0x26AA || x === 0x26AB || x === 0x26BD || x === 0x26BE || x === 0x26C4 || x === 0x26C5 || x === 0x26CE || x === 0x26D4 || x === 0x26EA || x === 0x26F2 || x === 0x26F3 || x === 0x26F5 || x === 0x26FA || x === 0x26FD || x === 0x2705 || x === 0x270A || x === 0x270B || x === 0x2728 || x === 0x274C || x === 0x274E || x >= 0x2753 && x <= 0x2755 || x === 0x2757 || x >= 0x2795 && x <= 0x2797 || x === 0x27B0 || x === 0x27BF || x === 0x2B1B || x === 0x2B1C || x === 0x2B50 || x === 0x2B55 || x >= 0x2E80 && x <= 0x2E99 || x >= 0x2E9B && x <= 0x2EF3 || x >= 0x2F00 && x <= 0x2FD5 || x >= 0x2FF0 && x <= 0x2FFF || x >= 0x3001 && x <= 0x303E || x >= 0x3041 && x <= 0x3096 || x >= 0x3099 && x <= 0x30FF || x >= 0x3105 && x <= 0x312F || x >= 0x3131 && x <= 0x318E || x >= 0x3190 && x <= 0x31E3 || x >= 0x31EF && x <= 0x321E || x >= 0x3220 && x <= 0x3247 || x >= 0x3250 && x <= 0x4DBF || x >= 0x4E00 && x <= 0xA48C || x >= 0xA490 && x <= 0xA4C6 || x >= 0xA960 && x <= 0xA97C || x >= 0xAC00 && x <= 0xD7A3 || x >= 0xF900 && x <= 0xFAFF || x >= 0xFE10 && x <= 0xFE19 || x >= 0xFE30 && x <= 0xFE52 || x >= 0xFE54 && x <= 0xFE66 || x >= 0xFE68 && x <= 0xFE6B || x >= 0x16FE0 && x <= 0x16FE4 || x === 0x16FF0 || x === 0x16FF1 || x >= 0x17000 && x <= 0x187F7 || x >= 0x18800 && x <= 0x18CD5 || x >= 0x18D00 && x <= 0x18D08 || x >= 0x1AFF0 && x <= 0x1AFF3 || x >= 0x1AFF5 && x <= 0x1AFFB || x === 0x1AFFD || x === 0x1AFFE || x >= 0x1B000 && x <= 0x1B122 || x === 0x1B132 || x >= 0x1B150 && x <= 0x1B152 || x === 0x1B155 || x >= 0x1B164 && x <= 0x1B167 || x >= 0x1B170 && x <= 0x1B2FB || x === 0x1F004 || x === 0x1F0CF || x === 0x1F18E || x >= 0x1F191 && x <= 0x1F19A || x >= 0x1F200 && x <= 0x1F202 || x >= 0x1F210 && x <= 0x1F23B || x >= 0x1F240 && x <= 0x1F248 || x === 0x1F250 || x === 0x1F251 || x >= 0x1F260 && x <= 0x1F265 || x >= 0x1F300 && x <= 0x1F320 || x >= 0x1F32D && x <= 0x1F335 || x >= 0x1F337 && x <= 0x1F37C || x >= 0x1F37E && x <= 0x1F393 || x >= 0x1F3A0 && x <= 0x1F3CA || x >= 0x1F3CF && x <= 0x1F3D3 || x >= 0x1F3E0 && x <= 0x1F3F0 || x === 0x1F3F4 || x >= 0x1F3F8 && x <= 0x1F43E || x === 0x1F440 || x >= 0x1F442 && x <= 0x1F4FC || x >= 0x1F4FF && x <= 0x1F53D || x >= 0x1F54B && x <= 0x1F54E || x >= 0x1F550 && x <= 0x1F567 || x === 0x1F57A || x === 0x1F595 || x === 0x1F596 || x === 0x1F5A4 || x >= 0x1F5FB && x <= 0x1F64F || x >= 0x1F680 && x <= 0x1F6C5 || x === 0x1F6CC || x >= 0x1F6D0 && x <= 0x1F6D2 || x >= 0x1F6D5 && x <= 0x1F6D7 || x >= 0x1F6DC && x <= 0x1F6DF || x === 0x1F6EB || x === 0x1F6EC || x >= 0x1F6F4 && x <= 0x1F6FC || x >= 0x1F7E0 && x <= 0x1F7EB || x === 0x1F7F0 || x >= 0x1F90C && x <= 0x1F93A || x >= 0x1F93C && x <= 0x1F945 || x >= 0x1F947 && x <= 0x1F9FF || x >= 0x1FA70 && x <= 0x1FA7C || x >= 0x1FA80 && x <= 0x1FA88 || x >= 0x1FA90 && x <= 0x1FABD || x >= 0x1FABF && x <= 0x1FAC5 || x >= 0x1FACE && x <= 0x1FADB || x >= 0x1FAE0 && x <= 0x1FAE8 || x >= 0x1FAF0 && x <= 0x1FAF8 || x >= 0x20000 && x <= 0x2FFFD || x >= 0x30000 && x <= 0x3FFFD; + +}; + +/* EXPORT */ + +export {isAmbiguous, isFullWidth, isWide}; diff --git a/tasks/benchmark.js b/tasks/benchmark.js new file mode 100644 index 0000000..0aa0700 --- /dev/null +++ b/tasks/benchmark.js @@ -0,0 +1,62 @@ + +/* IMPORT */ + +import benchmark from 'benchloop'; +// import stringWidth from 'string-width'; +import fastStringTruncatedWidth from '../dist/index.js'; + +/* HELPERS */ + +const IMPLEMENTATIONS = [ + // [Bun.stringWidth, 'bun'], + // [stringWidth, 'string-width'], + [fastStringTruncatedWidth, 'fast-string-truncated-width'] +]; + + +const INPUTS = [ + ['helloworld', 'ascii'], + ['\x1b[31mhelloworld', 'ascii+ansi'], + ['helloworldπŸ˜€', 'ascii+emoji'], + ['\x1b[31mπŸ˜€', 'ansi+emoji'], + ['helloworldπŸ˜€\x1b[31mπŸ˜€', 'ascii+ansi+emoji'], + // ['叀池や', 'cjk'] +]; + +const REPETITIONS = [1, 10, 50, 100, 500, 1_000, 5_000, 25_000]; + +const LIMIT = Infinity; + +/* MAIN */ + +benchmark.config ({ + iterations: 10 +}); + +for ( const [implementation, implementationName] of IMPLEMENTATIONS ) { + + benchmark.group ( implementationName, () => { + + for ( const [input, inputName] of INPUTS ) { + + for ( const repetitions of REPETITIONS ) { + + const target = input.repeat ( repetitions ); + const truncationOptions = { limit: LIMIT, ellipsis: '…' }; + + benchmark ({ + name: `${inputName}-${repetitions}`, + fn: () => { + implementation ( target, truncationOptions ); + } + }); + + } + + } + + }); + +} + +benchmark.summary (); diff --git a/test/index.js b/test/index.js new file mode 100644 index 0000000..45b8b29 --- /dev/null +++ b/test/index.js @@ -0,0 +1,262 @@ + +/* IMPORT */ + +import {describe} from 'fava'; +import fastStringTruncatedWidth from '../dist/index.js'; + +/* HELPERS */ + +const getWidth = ( input, widthOptions ) => { + return fastStringTruncatedWidth ( input, {}, widthOptions ).width; +}; + +const truncate = ( input, truncationOptions, widthOptions ) => { + const ellipsis = truncationOptions.ellipsis ?? ''; + const result = fastStringTruncatedWidth ( input, truncationOptions, widthOptions ); + const line = `${input.slice ( 0, result.index )}${result.ellipsed ? ellipsis : ''}`; + return line; +}; + +/* MAIN */ + +describe ( 'Fast String Width', () => { + + describe ( 'calculating the raw result', it => { + + it ( 'supports strings that do not need to be truncated', t => { + + const result = fastStringTruncatedWidth ( '\x1b[31mhello', { limit: Infinity, ellipsis: '…' } ); + + t.is ( result.truncated, false ); + t.is ( result.ellipsed, false ); + t.is ( result.width, 5 ); + t.is ( result.index, 10 ); + + }); + + it ( 'supports strings that do need to be truncated', t => { + + debugger; + const result = fastStringTruncatedWidth ( '\x1b[31mhello', { limit: 3, ellipsis: '…' } ); + + t.is ( result.truncated, true ); + t.is ( result.ellipsed, true ); + t.is ( result.width, 2 ); + t.is ( result.index, 7 ); + + }); + + }); + + describe ( 'calculating the width of a string', it => { + + it ( 'supports basic cases', t => { + + t.is ( getWidth ( 'hello' ), 5 ); + t.is ( getWidth ( '\x1b[31mhello' ), 5 ); + + t.is ( getWidth ( 'abcde' ), 5 ); + t.is ( getWidth ( '叀池や' ), 6 ); + t.is ( getWidth ( 'あいうabc' ), 9 ); + t.is ( getWidth ( 'γ‚γ„γ†β˜…' ), 7 ); + t.is ( getWidth ( 'Β±' ), 1 ); + t.is ( getWidth ( 'γƒŽγƒΌγƒ‰.js' ), 9 ); + t.is ( getWidth ( 'δ½ ε₯½' ), 4 ); + t.is ( getWidth ( 'μ•ˆλ…•ν•˜μ„Έμš”' ), 10 ); + t.is ( getWidth ( 'A\uD83C\uDE00BC' ), 5 ); + t.is ( getWidth ( '\u001B[31m\u001B[39m' ), 0 ); + // t.is ( getWidth ( '\u001B]8;;https://github.com\u0007Click\u001B]8;;\u0007' ), 5 ); //TODO: Maybe support these extra escapes too? + t.is ( getWidth ( '\u{231A}' ), 2 ); + t.is ( getWidth ( '\u{2194}\u{FE0F}' ), 2 ); + t.is ( getWidth ( '\u{1F469}' ), 2 ); + t.is ( getWidth ( '\u{1F469}\u{1F3FF}' ), 2 ); + t.is ( getWidth ( '\u{845B}\u{E0100}' ), 2 ); + t.is ( getWidth ( 'ปฏัก' ), 3 ); + t.is ( getWidth ( '_\u0E34' ), 1 ); + + }); + + it ( 'supports control characters', t => { + + t.is ( getWidth ( String.fromCodePoint ( 0 ) ), 0 ); + t.is ( getWidth ( String.fromCodePoint ( 31 ) ), 0 ); + t.is ( getWidth ( String.fromCodePoint ( 127 ) ), 0 ); + t.is ( getWidth ( String.fromCodePoint ( 134 ) ), 0 ); + t.is ( getWidth ( String.fromCodePoint ( 159 ) ), 0 ); + t.is ( getWidth ( '\u001B' ), 0 ); + + }); + + it ( 'supports combining characters', t => { + + t.is ( getWidth ( 'x\u0300' ), 1 ); + + }); + + it ( 'supports emoji characters', t => { + + t.is ( getWidth ( 'πŸ‘Ά' ), 2 ); + t.is ( getWidth ( 'πŸ‘ΆπŸ½' ), 2 ); + t.is ( getWidth ( 'πŸ‘©β€πŸ‘©β€πŸ‘¦β€πŸ‘¦' ), 2 ); + t.is ( getWidth ( 'πŸ‘¨β€β€οΈβ€πŸ’‹β€πŸ‘¨' ), 2 ); + + t.is ( getWidth ( 'πŸ‘Ά'.repeat ( 2 ) ), 4 ); + t.is ( getWidth ( 'πŸ‘ΆπŸ½'.repeat ( 2 ) ), 4 ); + t.is ( getWidth ( 'πŸ‘©β€πŸ‘©β€πŸ‘¦β€πŸ‘¦'.repeat ( 2 ) ), 4 ); + t.is ( getWidth ( 'πŸ‘¨β€β€οΈβ€πŸ’‹β€πŸ‘¨'.repeat ( 2 ) ), 4 ); + + }); + + it ( 'supports unicode characters', t => { + + t.is ( getWidth ( '…' ), 1 ); + t.is ( getWidth ( '\u2770' ), 1 ); + t.is ( getWidth ( '\u2771' ), 1 ); + t.is ( getWidth ( '\u21a9' ), 1 ); + t.is ( getWidth ( '\u2193' ), 1 ); + t.is ( getWidth ( '\u21F5' ), 1 ); + t.is ( getWidth ( '\u2937' ), 1 ); + t.is ( getWidth ( '\u27A4' ), 1 ); + t.is ( getWidth ( '\u2190' ), 1 ); + t.is ( getWidth ( '\u21d0' ), 1 ); + t.is ( getWidth ( '\u2194' ), 1 ); + t.is ( getWidth ( '\u21d4' ), 1 ); + t.is ( getWidth ( '\u21ce' ), 1 ); + t.is ( getWidth ( '\u27f7' ), 1 ); + t.is ( getWidth ( '\u2192' ), 1 ); + t.is ( getWidth ( '\u21d2' ), 1 ); + t.is ( getWidth ( '\u21e8' ), 1 ); + t.is ( getWidth ( '\u2191' ), 1 ); + t.is ( getWidth ( '\u21C5' ), 1 ); + t.is ( getWidth ( '\u2197' ), 1 ); + t.is ( getWidth ( '\u21cb' ), 1 ); + t.is ( getWidth ( '\u21cc' ), 1 ); + t.is ( getWidth ( '\u21c6' ), 1 ); + t.is ( getWidth ( '\u21c4' ), 1 ); + t.is ( getWidth ( '\u2217' ), 1 ); + t.is ( getWidth ( 'βœ”' ), 1 ); + t.is ( getWidth ( '\u2014' ), 1 ); + t.is ( getWidth ( '\u2022' ), 1 ); + t.is ( getWidth ( '\u2026' ), 1 ); + t.is ( getWidth ( '\u2013' ), 1 ); + t.is ( getWidth ( '\u2709' ), 1 ); + t.is ( getWidth ( '\u2261' ), 1 ); + t.is ( getWidth ( '\u2691' ), 1 ); + t.is ( getWidth ( '\u2690' ), 1 ); + t.is ( getWidth ( '\u22EF' ), 1 ); + t.is ( getWidth ( '\u226A' ), 1 ); + t.is ( getWidth ( '\u226B' ), 1 ); + t.is ( getWidth ( '\u270E' ), 1 ); + t.is ( getWidth ( '\u00a0' ), 1 ); + t.is ( getWidth ( '\u2009' ), 1 ); + t.is ( getWidth ( '\u200A' ), 1 ); + t.is ( getWidth ( '\u274F' ), 1 ); + t.is ( getWidth ( '\u2750' ), 1 ); + t.is ( getWidth ( '\u26a0' ), 1 ); + t.is ( getWidth ( '\u200b' ), 1 ); + + }); + + it ( 'supports japanese half-width characters', t => { + + t.is ( getWidth ( 'バ' ), 2 ); + t.is ( getWidth ( 'パ' ), 2 ); + + }); + + }); + + describe ( 'truncating a string', it => { + + it ( 'supports latin characters', t => { + + t.is ( truncate ( 'hello', { limit: 10, ellipsis: '…' } ), 'hello' ); + t.is ( truncate ( 'hello', { limit: 5, ellipsis: '…' } ), 'hello' ); + t.is ( truncate ( 'hello', { limit: 4, ellipsis: '…' } ), 'hel…' ); + t.is ( truncate ( 'hello', { limit: 3, ellipsis: '…' } ), 'he…' ); + t.is ( truncate ( 'hello', { limit: 2, ellipsis: '…' } ), 'h…' ); + t.is ( truncate ( 'hello', { limit: 1, ellipsis: '…' } ), '…' ); + t.is ( truncate ( 'hello', { limit: 0, ellipsis: '…' } ), '' ); + + t.is ( truncate ( 'hello', { limit: 10, ellipsis: '..' } ), 'hello' ); + t.is ( truncate ( 'hello', { limit: 5, ellipsis: '..' } ), 'hello' ); + t.is ( truncate ( 'hello', { limit: 4, ellipsis: '..' } ), 'he..' ); + t.is ( truncate ( 'hello', { limit: 3, ellipsis: '..' } ), 'h..' ); + t.is ( truncate ( 'hello', { limit: 2, ellipsis: '..' } ), '..' ); + t.is ( truncate ( 'hello', { limit: 1, ellipsis: '..' } ), '' ); + t.is ( truncate ( 'hello', { limit: 0, ellipsis: '..' } ), '' ); + + }); + + it ( 'supports ansi characters', t => { + + t.is ( truncate ( '\x1b[31mhello', { limit: 10, ellipsis: '…' } ), '\x1b[31mhello' ); + t.is ( truncate ( '\x1b[31mhello', { limit: 5, ellipsis: '…' } ), '\x1b[31mhello' ); + t.is ( truncate ( '\x1b[31mhello', { limit: 4, ellipsis: '…' } ), '\x1b[31mhel…' ); + t.is ( truncate ( '\x1b[31mhello', { limit: 3, ellipsis: '…' } ), '\x1b[31mhe…' ); + t.is ( truncate ( '\x1b[31mhello', { limit: 2, ellipsis: '…' } ), '\x1b[31mh…' ); + t.is ( truncate ( '\x1b[31mhello', { limit: 1, ellipsis: '…' } ), '\x1b[31m…' ); + t.is ( truncate ( '\x1b[31mhello', { limit: 0, ellipsis: '…' } ), '\x1b[31m' ); + + t.is ( truncate ( '\x1b[31mhello', { limit: 10, ellipsis: '..' } ), '\x1b[31mhello' ); + t.is ( truncate ( '\x1b[31mhello', { limit: 5, ellipsis: '..' } ), '\x1b[31mhello' ); + t.is ( truncate ( '\x1b[31mhello', { limit: 4, ellipsis: '..' } ), '\x1b[31mhe..' ); + t.is ( truncate ( '\x1b[31mhello', { limit: 3, ellipsis: '..' } ), '\x1b[31mh..' ); + t.is ( truncate ( '\x1b[31mhello', { limit: 2, ellipsis: '..' } ), '\x1b[31m..' ); + t.is ( truncate ( '\x1b[31mhello', { limit: 1, ellipsis: '..' } ), '\x1b[31m' ); + t.is ( truncate ( '\x1b[31mhello', { limit: 0, ellipsis: '..' } ), '\x1b[31m' ); + + }); + + it ( 'supports control characters', t => { + + t.is ( truncate ( '\x00\x01\x02\x03', { limit: 10, ellipsis: '…' } ), '\x00\x01\x02\x03' ); + t.is ( truncate ( '\x00\x01\x02\x03', { limit: 4, ellipsis: '…' } ), '\x00\x01\x02\x03' ); + t.is ( truncate ( '\x00\x01\x02\x03', { limit: 3, ellipsis: '…' } ), '\x00\x01\x02\x03' ); + t.is ( truncate ( '\x00\x01\x02\x03', { limit: 2, ellipsis: '…' } ), '\x00\x01\x02\x03' ); + t.is ( truncate ( '\x00\x01\x02\x03', { limit: 1, ellipsis: '…' } ), '\x00\x01\x02\x03' ); + t.is ( truncate ( '\x00\x01\x02\x03', { limit: 0, ellipsis: '…' } ), '\x00\x01\x02\x03' ); + + t.is ( truncate ( '\x00\x01\x02\x03', { limit: 10, ellipsis: '…' }, { controlWidth: 1 } ), '\x00\x01\x02\x03' ); + t.is ( truncate ( '\x00\x01\x02\x03', { limit: 4, ellipsis: '…' }, { controlWidth: 1 } ), '\x00\x01\x02\x03' ); + t.is ( truncate ( '\x00\x01\x02\x03', { limit: 3, ellipsis: '…' }, { controlWidth: 1 } ), '\x00\x01…' ); + t.is ( truncate ( '\x00\x01\x02\x03', { limit: 2, ellipsis: '…' }, { controlWidth: 1 } ), '\x00…' ); + t.is ( truncate ( '\x00\x01\x02\x03', { limit: 1, ellipsis: '…' }, { controlWidth: 1 } ), '…' ); + t.is ( truncate ( '\x00\x01\x02\x03', { limit: 0, ellipsis: '…' }, { controlWidth: 1 } ), '' ); + + }); + + it ( 'supports CJK characters', t => { + + t.is ( truncate ( '叀池や', { limit: 10, ellipsis: '…' } ), '叀池や' ); + t.is ( truncate ( '叀池や', { limit: 6, ellipsis: '…' } ), '叀池や' ); + t.is ( truncate ( '叀池や', { limit: 5, ellipsis: '…' } ), '叀池…' ); + t.is ( truncate ( '叀池や', { limit: 4, ellipsis: '…' } ), '叀…' ); + t.is ( truncate ( '叀池や', { limit: 3, ellipsis: '…' } ), '叀…' ); + t.is ( truncate ( '叀池や', { limit: 2, ellipsis: '…' } ), '…' ); + t.is ( truncate ( '叀池や', { limit: 1, ellipsis: '…' } ), '…' ); + t.is ( truncate ( '叀池や', { limit: 0, ellipsis: '…' } ), '' ); + + }); + + it ( 'supports emoji characters', t => { + + t.is ( truncate ( 'πŸ‘ΆπŸ‘ΆπŸ½', { limit: 10, ellipsis: '…' } ), 'πŸ‘ΆπŸ‘ΆπŸ½' ); + t.is ( truncate ( 'πŸ‘ΆπŸ‘ΆπŸ½', { limit: 4, ellipsis: '…' } ), 'πŸ‘ΆπŸ‘ΆπŸ½' ); + t.is ( truncate ( 'πŸ‘ΆπŸ‘ΆπŸ½', { limit: 3, ellipsis: '…' } ), 'πŸ‘Άβ€¦' ); + t.is ( truncate ( 'πŸ‘ΆπŸ‘ΆπŸ½', { limit: 2, ellipsis: '…' } ), '…' ); + t.is ( truncate ( 'πŸ‘ΆπŸ‘ΆπŸ½', { limit: 1, ellipsis: '…' } ), '…' ); + t.is ( truncate ( 'πŸ‘ΆπŸ‘ΆπŸ½', { limit: 0, ellipsis: '…' } ), '' ); + + t.is ( truncate ( 'πŸ‘©β€πŸ‘©β€πŸ‘¦β€πŸ‘¦πŸ‘¨β€β€οΈβ€πŸ’‹β€πŸ‘¨', { limit: 10, ellipsis: '…' } ), 'πŸ‘©β€πŸ‘©β€πŸ‘¦β€πŸ‘¦πŸ‘¨β€β€οΈβ€πŸ’‹β€πŸ‘¨' ); + t.is ( truncate ( 'πŸ‘©β€πŸ‘©β€πŸ‘¦β€πŸ‘¦πŸ‘¨β€β€οΈβ€πŸ’‹β€πŸ‘¨', { limit: 4, ellipsis: '…' } ), 'πŸ‘©β€πŸ‘©β€πŸ‘¦β€πŸ‘¦πŸ‘¨β€β€οΈβ€πŸ’‹β€πŸ‘¨' ); + t.is ( truncate ( 'πŸ‘©β€πŸ‘©β€πŸ‘¦β€πŸ‘¦πŸ‘¨β€β€οΈβ€πŸ’‹β€πŸ‘¨', { limit: 3, ellipsis: '…' } ), 'πŸ‘©β€πŸ‘©β€πŸ‘¦β€πŸ‘¦β€¦' ); + t.is ( truncate ( 'πŸ‘©β€πŸ‘©β€πŸ‘¦β€πŸ‘¦πŸ‘¨β€β€οΈβ€πŸ’‹β€πŸ‘¨', { limit: 2, ellipsis: '…' } ), '…' ); + t.is ( truncate ( 'πŸ‘©β€πŸ‘©β€πŸ‘¦β€πŸ‘¦πŸ‘¨β€β€οΈβ€πŸ’‹β€πŸ‘¨', { limit: 1, ellipsis: '…' } ), '…' ); + t.is ( truncate ( 'πŸ‘©β€πŸ‘©β€πŸ‘¦β€πŸ‘¦πŸ‘¨β€β€οΈβ€πŸ’‹β€πŸ‘¨', { limit: 0, ellipsis: '…' } ), '' ); + + }); + + }); + +}); diff --git a/tsconfig.json b/tsconfig.json new file mode 100644 index 0000000..378edff --- /dev/null +++ b/tsconfig.json @@ -0,0 +1,3 @@ +{ + "extends": "tsex/tsconfig.json" +}