strings.ts 18.1 KB
Newer Older
E
Erich Gamma 已提交
1 2 3 4 5 6
/*---------------------------------------------------------------------------------------------
 *  Copyright (c) Microsoft Corporation. All rights reserved.
 *  Licensed under the MIT License. See License.txt in the project root for license information.
 *--------------------------------------------------------------------------------------------*/
'use strict';

J
Johannes Rieken 已提交
7
import { CharCode } from 'vs/base/common/charCode';
8

E
Erich Gamma 已提交
9 10 11
/**
 * The empty string.
 */
export const empty = '';
E
Erich Gamma 已提交
13

14 15 16 17 18 19 20
/**
 * Tells whether `str` carries no content: it is falsy, is not a string at all,
 * or consists solely of characters that `String.prototype.trim` removes.
 */
export function isFalsyOrWhitespace(str: string): boolean {
	const isNonEmptyString = !!str && typeof str === 'string';
	return isNonEmptyString ? str.trim().length === 0 : true;
}

E
Erich Gamma 已提交
21
/**
 * Left-pads the decimal representation of `n` with `char` until it is at least `l` characters long.
 * @param n the number to render
 * @param l the minimum length of the result; longer numbers are returned unchanged
 * @param char the fill text that is prepended once per missing position (defaults to '0')
 * @returns the padded string
 */
export function pad(n: number, l: number, char: string = '0'): string {
	const str = '' + n;

	let prefix = '';
	for (let i = str.length; i < l; i++) {
		prefix += char;
	}

	return prefix + str;
}

B
Benjamin Pasero 已提交
35
const _formatRegexp = /{(\d+)}/g;

/**
 * Helper to produce a string with a variable number of arguments. Insert variable segments
 * into the string using the {n} notation where n is the zero-based index of the argument
 * following the string. Placeholders without a matching argument are left untouched.
 * @param value string to which formatting is applied
 * @param args replacements for {n}-entries
 * @returns `value` with every resolvable placeholder replaced
 */
export function format(value: string, ...args: any[]): string {
	if (args.length === 0) {
		return value;
	}
	return value.replace(_formatRegexp, (match, group) => {
		// `\d+` only ever captures a non-negative integer, so the upper bound is the only check needed.
		const idx = parseInt(group, 10);
		return idx < args.length ? args[idx] : match;
	});
}

/**
 * Converts the HTML characters `<`, `>` and `&` inside the string to entities so that the
 * result can be used as text content, e.g. in HTMLElement.innerHTML. Quotes are not escaped,
 * so the result must not be placed inside an attribute value.
 * @param html the text to escape
 * @returns the escaped text
 */
export function escape(html: string): string {
	// No `|` inside the character class: there it is a literal pipe, not an alternation.
	return html.replace(/[<>&]/g, function (match) {
		switch (match) {
			case '<': return '&lt;';
			case '>': return '&gt;';
			case '&': return '&amp;';
			default: return match;
		}
	});
}

/**
 * Escapes regular expression characters in a given string so that it is matched literally.
 * @param value the text to escape
 * @returns `value` with a backslash in front of every regular expression meta character
 */
export function escapeRegExpCharacters(value: string): string {
	return value.replace(/[\-\\\{\}\*\+\?\|\^\$\.\[\]\(\)\#]/g, '\\$&');
}

/**
 * Removes all occurrences of needle from the beginning and end of haystack.
 * @param haystack string to trim
 * @param needle the thing to trim (default is a blank)
 * @returns the haystack without leading and trailing needles
 */
export function trim(haystack: string, needle: string = ' '): string {
	return rtrim(ltrim(haystack, needle), needle);
}

/**
 * Removes all occurrences of needle from the beginning of haystack.
 * @param haystack string to trim
 * @param needle the thing to trim
 * @returns the haystack without leading needles; a falsy haystack, or any haystack combined
 * with a falsy needle, is returned as is
 */
export function ltrim(haystack?: string, needle?: string): string {
	if (!haystack || !needle) {
		// Covers undefined as well as empty strings, so no further length checks are needed.
		return haystack;
	}

	const needleLen = needle.length;

	let offset = 0;
	while (haystack.indexOf(needle, offset) === offset) {
		offset += needleLen;
	}
	return haystack.substring(offset);
}

/**
 * Removes all occurrences of needle from the end of haystack.
 * @param haystack string to trim
 * @param needle the thing to trim
 * @returns the haystack without trailing needles; a falsy haystack, or any haystack combined
 * with a falsy needle, is returned as is
 */
export function rtrim(haystack?: string, needle?: string): string {
	if (!haystack || !needle) {
		// Covers undefined as well as empty strings, so no further length checks are needed.
		return haystack;
	}

	const needleLen = needle.length;
	let end = haystack.length;

	// Only probe the single position at which a needle has to start in order to end exactly at
	// `end`. Searching backwards from `end - 1` can find an occurrence that overlaps the part
	// that was already trimmed (e.g. 'aaaa' with needle 'aa') and would stop trimming too early.
	while (end >= needleLen && haystack.lastIndexOf(needle, end - needleLen) === end - needleLen) {
		end -= needleLen;
	}

	return haystack.substring(0, end);
}

/**
 * Turns a simple wildcard pattern into regular expression source text: regular expression
 * meta characters, commas and whitespace are backslash-escaped first, then every `*`
 * becomes `.*`.
 */
export function convertSimple2RegExpPattern(pattern: string): string {
	const escaped = pattern.replace(/[\-\\\{\}\+\?\|\^\$\.\,\[\]\(\)\#\s]/g, '\\$&');
	const withWildcards = escaped.replace(/[\*]/g, '.*');
	return withWildcards;
}

/**
 * Removes every `*` from the given pattern.
 */
export function stripWildcards(pattern: string): string {
	return pattern.replace(/\*/g, '');
}

/**
 * Determines if haystack starts with needle.
 * @returns true when the first `needle.length` characters of haystack equal needle
 */
export function startsWith(haystack: string, needle: string): boolean {
	if (haystack.length < needle.length) {
		return false;
	}

	// cheap identity check before comparing character by character
	if (haystack === needle) {
		return true;
	}

	for (let i = 0; i < needle.length; i++) {
		if (haystack[i] !== needle[i]) {
			return false;
		}
	}

	return true;
}

/**
 * Determines if haystack ends with needle.
 * @returns true when the last `needle.length` characters of haystack equal needle
 */
export function endsWith(haystack: string, needle: string): boolean {
	const diff = haystack.length - needle.length;
	if (diff > 0) {
		// the needle has to be found exactly at the position where it would end the haystack
		return haystack.indexOf(needle, diff) === diff;
	}
	return diff === 0 && haystack === needle;
}

S
Sandeep Somavarapu 已提交
188 189 190 191 192 193 194 195
/**
 * Options understood by `createRegExp`. Every flag is optional and treated as off when omitted.
 */
export interface RegExpOptions {
	/** When falsy, the expression is created with the case-insensitive `i` flag. */
	matchCase?: boolean;
	/** When set, `\b` is added at each end of the search string that has a word character there. */
	wholeWord?: boolean;
	/** When set, the expression is created with the `m` flag. */
	multiline?: boolean;
	/** When set, the expression is created with the `g` flag. */
	global?: boolean;
}

/**
 * Creates a regular expression for the given search string.
 * @param searchString the text or regular expression source to search for; must not be empty
 * @param isRegex when false, `searchString` is escaped so that it is matched literally
 * @param options flags for case sensitivity, whole word matching and the `m`/`g` modifiers
 * @returns the compiled regular expression
 * @throws Error when `searchString` is empty
 */
export function createRegExp(searchString: string, isRegex: boolean, options: RegExpOptions = {}): RegExp {
	if (!searchString) {
		throw new Error('Cannot create regex from empty string');
	}
	if (!isRegex) {
		searchString = escapeRegExpCharacters(searchString);
	}
	if (options.wholeWord) {
		// A boundary assertion is only added next to a word character; next to any
		// other character `\b` would demand a word character on its far side.
		if (/\w/.test(searchString.charAt(0))) {
			searchString = '\\b' + searchString;
		}
		if (/\w/.test(searchString.charAt(searchString.length - 1))) {
			searchString = searchString + '\\b';
		}
	}

	let modifiers = '';
	if (options.global) {
		modifiers += 'g';
	}
	if (!options.matchCase) {
		modifiers += 'i';
	}
	if (options.multiline) {
		modifiers += 'm';
	}

	return new RegExp(searchString, modifiers);
}

/**
 * Checks whether the given regular expression matches the empty string without advancing,
 * which would make a loop that repeatedly executes it never terminate.
 * @param regexp the expression to probe; it is executed once against the empty string
 * @returns true when the expression matches the empty string, except for a few anchors-only
 * expressions that are deliberately allowed
 */
export function regExpLeadsToEndlessLoop(regexp: RegExp): boolean {
	// Exit early if it's one of these special cases which are meant to match
	// against an empty string
	if (regexp.source === '^' || regexp.source === '^$' || regexp.source === '$' || regexp.source === '^\\s*$') {
		return false;
	}

	// We check against an empty string. If the regular expression doesn't advance
	// (e.g. ends in an endless loop) it will match an empty string.
	const match = regexp.exec('');
	// `!!` keeps the result a real boolean when there is no match (exec returns null)
	return !!match && regexp.lastIndex === 0;
}

237 238 239 240
/**
 * Checks whether regular expression source text contains a backreference, i.e. a backslash
 * followed by digits where the backslash is not itself escaped by a preceding backslash.
 */
export function regExpContainsBackreference(regexpValue: string): boolean {
	const backreference = /([^\\]|^)(\\\\)*\\\d+/;
	return regexpValue.match(backreference) !== null;
}

E
Erich Gamma 已提交
241 242 243 244 245
/**
 * Returns the first index of the string that holds neither a space nor a tab.
 * If the string is empty or contains only spaces and tabs, returns -1.
 */
export function firstNonWhitespaceIndex(str: string): number {
	for (let i = 0, len = str.length; i < len; i++) {
		const chCode = str.charCodeAt(i);
		if (chCode !== CharCode.Space && chCode !== CharCode.Tab) {
			return i;
		}
	}
	return -1;
}

/**
 * Returns the leading run of spaces and tabs of the string within `[start, end)`.
 * If that range contains only spaces and tabs, the entire range is returned.
 * @param str the string to inspect
 * @param start index at which the inspection starts (defaults to 0)
 * @param end index before which the inspection stops (defaults to the string length)
 */
export function getLeadingWhitespace(str: string, start: number = 0, end: number = str.length): string {
	for (let i = start; i < end; i++) {
		const chCode = str.charCodeAt(i);
		if (chCode !== CharCode.Space && chCode !== CharCode.Tab) {
			return str.substring(start, i);
		}
	}
	return str.substring(start, end);
}

/**
 * Returns the last index of the string, at or before `startIndex`, that holds neither a
 * space nor a tab. If there is no such index, returns -1.
 * @param str the string to inspect
 * @param startIndex index at which the backwards search starts (defaults to the last index)
 */
export function lastNonWhitespaceIndex(str: string, startIndex: number = str.length - 1): number {
	for (let i = startIndex; i >= 0; i--) {
		const chCode = str.charCodeAt(i);
		if (chCode !== CharCode.Space && chCode !== CharCode.Tab) {
			return i;
		}
	}
	return -1;
}

J
Johannes Rieken 已提交
283
/**
 * Compares two strings with the `<` and `>` operators.
 * @returns -1 when `a` is less than `b`, 1 when it is greater, 0 otherwise
 */
export function compare(a: string, b: string): number {
	if (a < b) {
		return -1;
	}
	if (a > b) {
		return 1;
	}
	return 0;
}

293 294 295
/**
 * Compares two strings while ignoring the case of letters.
 * ASCII letters are folded by hand; as soon as a differing position involves any other
 * character the comparison is delegated to `compare` on the lower-cased strings.
 * @returns a negative number when `a` sorts before `b`, a positive number when it sorts
 * after, and 0 when both are equal ignoring case
 */
export function compareIgnoreCase(a: string, b: string): number {
	const len = Math.min(a.length, b.length);
	for (let i = 0; i < len; i++) {
		let codeA = a.charCodeAt(i);
		let codeB = b.charCodeAt(i);

		if (codeA === codeB) {
			// equal
			continue;
		}

		// fold ASCII upper case onto lower case, the two ranges are 32 code units apart
		if (isUpperAsciiLetter(codeA)) {
			codeA += 32;
		}
		if (isUpperAsciiLetter(codeB)) {
			codeB += 32;
		}

		const diff = codeA - codeB;
		if (diff === 0) {
			// equal -> ignoreCase
			continue;
		}

		if (isLowerAsciiLetter(codeA) && isLowerAsciiLetter(codeB)) {
			// two different ASCII letters: their distance decides
			return diff;
		}

		// something other than an ASCII letter is involved: compare the lower-cased strings
		return compare(a.toLowerCase(), b.toLowerCase());
	}

	// one string is a prefix of the other (ignoring case): the shorter one sorts first
	if (a.length < b.length) {
		return -1;
	} else if (a.length > b.length) {
		return 1;
	} else {
		return 0;
	}
}

A
Alex Dima 已提交
336
/**
 * Tells whether the character code lies in the range `CharCode.a` to `CharCode.z` (inclusive).
 */
export function isLowerAsciiLetter(code: number): boolean {
	return code >= CharCode.a && code <= CharCode.z;
}

A
Alex Dima 已提交
340
/**
 * Tells whether the character code lies in the range `CharCode.A` to `CharCode.Z` (inclusive).
 */
export function isUpperAsciiLetter(code: number): boolean {
	return code >= CharCode.A && code <= CharCode.Z;
}

344
/**
 * Tells whether the character code is a lower or upper case ASCII letter.
 */
function isAsciiLetter(code: number): boolean {
	return isLowerAsciiLetter(code) || isUpperAsciiLetter(code);
}

/**
 * Tells whether two strings are equal when the case of letters is ignored.
 * Missing values are treated as having length 0 for the length comparison.
 */
export function equalsIgnoreCase(a: string, b: string): boolean {
	const len1 = a ? a.length : 0;
	const len2 = b ? b.length : 0;

	if (len1 !== len2) {
		return false;
	}

	// Pass the length explicitly: relying on the callee's default would read `a.length`
	// and throw when `a` is null or undefined.
	return doEqualsIgnoreCase(a, b, len1);
}

359 360 361 362 363
/**
 * Compares the first `stopAt` characters of two strings while ignoring the case of letters.
 * @param a first string
 * @param b second string
 * @param stopAt number of leading characters to compare (defaults to the length of `a`)
 * @returns false when either value is not a string or a compared position differs
 */
function doEqualsIgnoreCase(a: string, b: string, stopAt?: number): boolean {
	if (typeof a !== 'string' || typeof b !== 'string') {
		return false;
	}

	// Resolved after the type guard so that a missing `a` yields false instead of a TypeError.
	const end = stopAt === undefined ? a.length : stopAt;

	for (let i = 0; i < end; i++) {
		const codeA = a.charCodeAt(i);
		const codeB = b.charCodeAt(i);

		if (codeA === codeB) {
			continue;
		}

		// a-z A-Z
		if (isAsciiLetter(codeA) && isAsciiLetter(codeB)) {
			// the codes differ, so they only match if they are 32 apart (same letter, other case)
			if (Math.abs(codeA - codeB) !== 32) {
				return false;
			}
		}

		// Any other charcode
		else {
			if (String.fromCharCode(codeA).toLowerCase() !== String.fromCharCode(codeB).toLowerCase()) {
				return false;
			}
		}
	}

	return true;
}

391
/**
 * Tells whether `str` starts with `candidate` when the case of letters is ignored.
 */
export function startsWithIgnoreCase(str: string, candidate: string): boolean {
	const candidateLength = candidate.length;
	if (candidateLength > str.length) {
		return false;
	}

	return doEqualsIgnoreCase(str, candidate, candidateLength);
}

E
Erich Gamma 已提交
400
/**
 * @returns the length of the common prefix of the two strings.
 */
export function commonPrefixLength(a: string, b: string): number {
	const len = Math.min(a.length, b.length);

	for (let i = 0; i < len; i++) {
		if (a.charCodeAt(i) !== b.charCodeAt(i)) {
			return i;
		}
	}

	return len;
}

/**
 * @returns the length of the common suffix of the two strings.
 */
export function commonSuffixLength(a: string, b: string): number {
	const len = Math.min(a.length, b.length);

	const aLastIndex = a.length - 1;
	const bLastIndex = b.length - 1;

	for (let i = 0; i < len; i++) {
		if (a.charCodeAt(aLastIndex - i) !== b.charCodeAt(bLastIndex - i)) {
			return i;
		}
	}

	return len;
}

J
Johannes Rieken 已提交
437 438 439 440 441 442 443 444 445 446 447 448 449 450 451 452 453 454 455 456 457 458 459 460 461 462 463 464 465 466 467 468 469 470 471 472 473
/**
 * Compares `a[aStart, aEnd)` with `b[bStart, bEnd)` character by character. The comparison
 * stops as soon as either range is exhausted, so only the shared length is checked.
 */
function substrEquals(a: string, aStart: number, aEnd: number, b: string, bStart: number, bEnd: number): boolean {
	while (aStart < aEnd && bStart < bEnd) {
		if (a[aStart] !== b[bStart]) {
			return false;
		}
		aStart += 1;
		bStart += 1;
	}
	return true;
}

/**
 * Return the overlap between the suffix of `a` and the prefix of `b`.
 * For instance `overlap("foobar", "arr, I'm a pirate") === 2`.
 * @returns the length of the longest suffix of `a` that is also a prefix of `b`
 */
export function overlap(a: string, b: string): number {
	const aEnd = a.length;
	let bEnd = b.length;
	let aStart = aEnd - bEnd;

	if (aStart === 0) {
		// Same length: identical strings overlap completely. Different strings of the same
		// length can still overlap partially, so they continue with the search below.
		if (a === b) {
			return aEnd;
		}
	} else if (aStart < 0) {
		// `b` is longer: at most `a.length` characters of it can take part in the overlap
		bEnd += aStart;
		aStart = 0;
	}

	// try the longest candidate first and shrink it from both sides
	while (aStart < aEnd && bEnd > 0) {
		if (substrEquals(a, aStart, aEnd, b, 0, bEnd)) {
			return bEnd;
		}
		bEnd -= 1;
		aStart += 1;
	}
	return 0;
}

E
Erich Gamma 已提交
474 475 476 477 478 479
// --- unicode
// http://en.wikipedia.org/wiki/Surrogate_pair
// Returns the code point starting at a specified index in a string
// Code points U+0000 to U+D7FF and U+E000 to U+FFFF are represented on a single character
// Code points U+10000 to U+10FFFF are represented on two consecutive characters
//export function getUnicodePoint(str:string, index:number, len:number):number {
//	let chrCode = str.charCodeAt(index);
//	if (0xD800 <= chrCode && chrCode <= 0xDBFF && index + 1 < len) {
//		let nextChrCode = str.charCodeAt(index + 1);
//		if (0xDC00 <= nextChrCode && nextChrCode <= 0xDFFF) {
//			return ((chrCode - 0xD800) << 10) + (nextChrCode - 0xDC00) + 0x10000;
//		}
//	}
//	return chrCode;
//}
J
Johannes Rieken 已提交
489
/**
 * Tells whether the character code lies in the high surrogate range 0xD800 - 0xDBFF.
 */
export function isHighSurrogate(charCode: number): boolean {
	return (0xD800 <= charCode && charCode <= 0xDBFF);
}

J
Johannes Rieken 已提交
493
/**
 * Tells whether the character code lies in the low surrogate range 0xDC00 - 0xDFFF.
 */
export function isLowSurrogate(charCode: number): boolean {
	return (0xDC00 <= charCode && charCode <= 0xDFFF);
}
E
Erich Gamma 已提交
496

A
Alex Dima 已提交
497 498 499 500 501 502 503 504 505 506 507 508
/**
 * Pattern matching a single right-to-left character.
 * Generated using https://github.com/alexandrudima/unicode-utils/blob/master/generate-rtl-test.js
 */
const CONTAINS_RTL = /(?:[\u05BE\u05C0\u05C3\u05C6\u05D0-\u05F4\u0608\u060B\u060D\u061B-\u064A\u066D-\u066F\u0671-\u06D5\u06E5\u06E6\u06EE\u06EF\u06FA-\u0710\u0712-\u072F\u074D-\u07A5\u07B1-\u07EA\u07F4\u07F5\u07FA-\u0815\u081A\u0824\u0828\u0830-\u0858\u085E-\u08BD\u200F\uFB1D\uFB1F-\uFB28\uFB2A-\uFD3D\uFD50-\uFDFC\uFE70-\uFEFC]|\uD802[\uDC00-\uDD1B\uDD20-\uDE00\uDE10-\uDE33\uDE40-\uDEE4\uDEEB-\uDF35\uDF40-\uDFFF]|\uD803[\uDC00-\uDCFF]|\uD83A[\uDC00-\uDCCF\uDD00-\uDD43\uDD50-\uDFFF]|\uD83B[\uDC00-\uDEBB])/;

/**
 * Tells whether `str` holds at least one Unicode character classified as "R" or "AL".
 */
export function containsRTL(str: string): boolean {
	const hit = CONTAINS_RTL.exec(str);
	return hit !== null;
}

509 510 511 512 513 514 515 516 517
/**
 * Pattern matching a single emoji character.
 * Generated using https://github.com/alexandrudima/unicode-utils/blob/master/generate-emoji-test.js
 */
const CONTAINS_EMOJI = /(?:[\u231A\u231B\u23F0\u23F3\u2600-\u27BF\u2B50\u2B55]|\uD83C[\uDDE6-\uDDFF\uDF00-\uDFFF]|\uD83D[\uDC00-\uDE4F\uDE80-\uDEF8]|\uD83E[\uDD00-\uDDE6])/;

/**
 * Tells whether `str` holds at least one character matched by the emoji pattern.
 */
export function containsEmoji(str: string): boolean {
	const hit = CONTAINS_EMOJI.exec(str);
	return hit !== null;
}

518 519 520 521 522 523 524 525
const IS_BASIC_ASCII = /^[\t\n\r\x20-\x7E]*$/;

/**
 * Tells whether every character of `str` is a basic ASCII character, i.e. lies in the
 * range 32 - 126 (both inclusive) or is one of \n, \r, \t. The empty string qualifies.
 */
export function isBasicASCII(str: string): boolean {
	const hit = IS_BASIC_ASCII.exec(str);
	return hit !== null;
}

A
Alex Dima 已提交
526 527 528 529 530 531 532 533 534
/**
 * Tells whether at least one UTF-16 code unit of `str` is reported as full width by
 * `isFullWidthCharacter`.
 */
export function containsFullWidthCharacter(str: string): boolean {
	const end = str.length;
	let index = 0;
	while (index < end) {
		if (isFullWidthCharacter(str.charCodeAt(index))) {
			return true;
		}
		index++;
	}
	return false;
}

J
Johannes Rieken 已提交
535
/**
 * Tells whether the character code belongs to one of the ranges that are treated as
 * full width, i.e. as occupying two columns.
 * @param charCode a UTF-16 code unit
 */
export function isFullWidthCharacter(charCode: number): boolean {
	// Do a cheap trick to better support wrapping of wide characters, treat them as 2 columns
	// http://jrgraphix.net/research/unicode_blocks.php
	//          2E80 — 2EFF   CJK Radicals Supplement
	//          2F00 — 2FDF   Kangxi Radicals
	//          2FF0 — 2FFF   Ideographic Description Characters
	//          3000 — 303F   CJK Symbols and Punctuation
	//          3040 — 309F   Hiragana
	//          30A0 — 30FF   Katakana
	//          3100 — 312F   Bopomofo
	//          3130 — 318F   Hangul Compatibility Jamo
	//          3190 — 319F   Kanbun
	//          31A0 — 31BF   Bopomofo Extended
	//          31F0 — 31FF   Katakana Phonetic Extensions
	//          3200 — 32FF   Enclosed CJK Letters and Months
	//          3300 — 33FF   CJK Compatibility
	//          3400 — 4DBF   CJK Unified Ideographs Extension A
	//          4DC0 — 4DFF   Yijing Hexagram Symbols
	//          4E00 — 9FFF   CJK Unified Ideographs
	//          A000 — A48F   Yi Syllables
	//          A490 — A4CF   Yi Radicals
	//          AC00 — D7AF   Hangul Syllables
	// [IGNORE] D800 — DB7F   High Surrogates
	// [IGNORE] DB80 — DBFF   High Private Use Surrogates
	// [IGNORE] DC00 — DFFF   Low Surrogates
	// [IGNORE] E000 — F8FF   Private Use Area
	//          F900 — FAFF   CJK Compatibility Ideographs
	// [IGNORE] FB00 — FB4F   Alphabetic Presentation Forms
	// [IGNORE] FB50 — FDFF   Arabic Presentation Forms-A
	// [IGNORE] FE00 — FE0F   Variation Selectors
	// [IGNORE] FE20 — FE2F   Combining Half Marks
	// [IGNORE] FE30 — FE4F   CJK Compatibility Forms
	// [IGNORE] FE50 — FE6F   Small Form Variants
	// [IGNORE] FE70 — FEFF   Arabic Presentation Forms-B
	//          FF00 — FFEF   Halfwidth and Fullwidth Forms
	//               [https://en.wikipedia.org/wiki/Halfwidth_and_fullwidth_forms]
	//               of which FF01 - FF5E fullwidth ASCII of 21 to 7E
	// [IGNORE]    and FF65 - FFDC halfwidth of Katakana and Hangul
	// [IGNORE] FFF0 — FFFF   Specials
	charCode = +charCode; // @perf
	return (
		(charCode >= 0x2E80 && charCode <= 0xD7AF)
		|| (charCode >= 0xF900 && charCode <= 0xFAFF)
		|| (charCode >= 0xFF01 && charCode <= 0xFF5E)
	);
}

E
Erich Gamma 已提交
582 583 584 585
/**
 * Given a string and a length returns a version that is shortened from the left. Shortening
 * happens at favorable positions - word boundaries - and keeps the shortest trailing part
 * that starts at such a position and is at least `n` characters long. A single leading
 * whitespace character of the result is dropped.
 * @param text the text to shorten
 * @param n the minimum number of trailing characters to keep
 * @returns `text` itself when it is shorter than `n`, otherwise its trailing part
 */
export function lcut(text: string, n: number): string {
	if (text.length < n) {
		return text;
	}

	const re = /\b/g;
	let i = 0;
	while (re.test(text)) {
		if (text.length - re.lastIndex < n) {
			break;
		}

		i = re.lastIndex;
		// `\b` matches without consuming anything, so move on by hand to find the next boundary
		re.lastIndex += 1;
	}

	return text.substring(i).replace(/^\s/, '');
}

E
Erich Gamma 已提交
605 606
// Escape codes
// http://en.wikipedia.org/wiki/ANSI_escape_code
const EL = /\x1B\x5B[12]?K/g; // Erase in line
const COLOR_START = /\x1b\[\d+(?:;\d+)*m/g; // Color, including multi-parameter sequences such as ESC[1;31m
const COLOR_END = /\x1b\[0?m/g; // Color

/**
 * Removes "erase in line" and color escape sequences from the given string.
 * @param str the text to clean; falsy values are returned unchanged
 * @returns the text without the recognized escape sequences
 */
export function removeAnsiEscapeCodes(str: string): string {
	if (str) {
		str = str.replace(EL, '');
		str = str.replace(COLOR_START, '');
		str = str.replace(COLOR_END, '');
	}

	return str;
}

// -- UTF-8 BOM

A
Alex Dima 已提交
623
/**
 * One-character string created from the character code `CharCode.UTF8_BOM`.
 */
export const UTF8_BOM_CHARACTER = String.fromCharCode(CharCode.UTF8_BOM);
E
Erich Gamma 已提交
624 625

/**
 * Tells whether the first character of `str` is `CharCode.UTF8_BOM`.
 * @returns false for empty or missing strings
 */
export function startsWithUTF8BOM(str: string): boolean {
	// `!!` keeps the result a real boolean for '' and undefined
	return !!str && str.charCodeAt(0) === CharCode.UTF8_BOM;
}

629 630 631 632
/**
 * Returns `str` without its first character when `startsWithUTF8BOM` reports a leading
 * byte order mark, and `str` itself otherwise.
 */
export function stripUTF8BOM(str: string): string {
	if (startsWithUTF8BOM(str)) {
		return str.substr(1);
	}
	return str;
}

633 634
/**
 * Base64-encodes the URI-component-encoded form of `str`.
 * @returns the result of `btoa(encodeURIComponent(str))`
 */
export function safeBtoa(str: string): string {
	return btoa(encodeURIComponent(str)); // we use encodeURIComponent because btoa fails for non Latin 1 values
}

J
Johannes Rieken 已提交
637
/**
 * Concatenates `count` copies of `s`.
 * @param s the text to repeat
 * @param count how many copies to produce
 * @returns the repeated text; the empty string when `count` is zero or negative
 */
export function repeat(s: string, count: number): string {
	let result = '';
	for (let i = 0; i < count; i++) {
		result += s;
	}
	return result;
}
644 645 646 647 648 649 650 651 652 653 654 655 656 657 658 659 660 661 662 663 664 665 666 667 668 669 670 671 672 673 674

/**
 * Checks if the characters of the provided query string are included in the
 * target string. The characters do not have to be contiguous within the string,
 * but they have to appear in the same order. Only the target is lower-cased, the
 * query is compared as given, so an upper case character in the query never matches.
 * @param target the string to search in
 * @param query the characters to look for
 * @returns false when either argument is falsy or the query cannot be found
 */
export function fuzzyContains(target: string, query: string): boolean {
	if (!target || !query) {
		return false; // return early if target or query are undefined
	}

	if (target.length < query.length) {
		return false; // impossible for query to be contained in target
	}

	const targetLower = target.toLowerCase();

	// every query character has to be found after the position of the previous one
	let searchFrom = 0;
	for (let index = 0; index < query.length; index++) {
		const found = targetLower.indexOf(query[index], searchFrom);
		if (found < 0) {
			return false;
		}
		searchFrom = found + 1;
	}

	return true;
}
676 677 678 679 680 681 682 683 684 685 686 687

/**
 * Tells whether lower-casing `target` would change it, i.e. whether it holds at least one
 * upper case character.
 * @param target the string to inspect; falsy values yield false
 * @param ignoreEscapedChars when true, every backslash together with the character that
 * follows it is removed before the check
 */
export function containsUppercaseCharacter(target: string, ignoreEscapedChars = false): boolean {
	if (!target) {
		return false;
	}

	const candidate = ignoreEscapedChars ? target.replace(/\\./g, '') : target;
	return candidate !== candidate.toLowerCase();
}