third_party/WebKit/Source/devtools/front_end/common/TextUtils.js - chromium/src - Git at Google

 /*
  * Copyright (C) 2013 Google Inc. All rights reserved.
  *
  * Redistribution and use in source and binary forms, with or without
  * modification, are permitted provided that the following conditions are
  * met:
  *
  *     * Redistributions of source code must retain the above copyright
  * notice, this list of conditions and the following disclaimer.
  *     * Redistributions in binary form must reproduce the above
  * copyright notice, this list of conditions and the following disclaimer
  * in the documentation and/or other materials provided with the
  * distribution.
  *     * Neither the name of Google Inc. nor the names of its
  * contributors may be used to endorse or promote products derived from
  * this software without specific prior written permission.
  *
  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
  */
 Common.TextUtils = {
   /**
    * Tells whether |char| is an ASCII punctuation/symbol character other than '_':
    * one of !"#$%&'()*+,-./ :;<=>?@ [\]^ ` {|}~.
    * The comparisons are plain string comparisons, so the result is only
    * meaningful for a single-character argument.
    *
    * @param {string} char
    * @return {boolean}
    */
   isStopChar: function(char) {
     return (char > ' ' && char < '0') || (char > '9' && char < 'A') || (char > 'Z' && char < '_') ||
         (char > '_' && char < 'a') || (char > 'z' && char <= '~');
   },

   /**
    * A word character is anything that is neither a stop character nor whitespace.
    *
    * @param {string} char
    * @return {boolean}
    */
   isWordChar: function(char) {
     return !Common.TextUtils.isStopChar(char) && !Common.TextUtils.isSpaceChar(char);
   },

   /**
    * Tests |char| against Common.TextUtils._SpaceCharRegex.
    *
    * @param {string} char
    * @return {boolean}
    */
   isSpaceChar: function(char) {
     return Common.TextUtils._SpaceCharRegex.test(char);
   },

   /**
    * Returns true when every character of |word| is a word character.
    * The empty string therefore counts as a word.
    *
    * @param {string} word
    * @return {boolean}
    */
   isWord: function(word) {
     for (let i = 0; i < word.length; ++i) {
       if (!Common.TextUtils.isWordChar(word.charAt(i)))
         return false;
     }
     return true;
   },

   /**
    * @param {string} char
    * @return {boolean} True for '(' and '{'.
    */
   isOpeningBraceChar: function(char) {
     return char === '(' || char === '{';
   },

   /**
    * @param {string} char
    * @return {boolean} True for ')' and '}'.
    */
   isClosingBraceChar: function(char) {
     return char === ')' || char === '}';
   },

   /**
    * @param {string} char
    * @return {boolean} True for any of '(', '{', ')' and '}'.
    */
   isBraceChar: function(char) {
     return Common.TextUtils.isOpeningBraceChar(char) || Common.TextUtils.isClosingBraceChar(char);
   },

   /**
    * Invokes |wordCallback| once, in order, for every maximal run of characters
    * accepted by |isWordChar|.
    *
    * @param {string} text
    * @param {function(string):boolean} isWordChar
    * @param {function(string)} wordCallback
    */
   textToWords: function(text, isWordChar, wordCallback) {
     // Index where the word currently being scanned started, or -1 between words.
     let startWord = -1;
     for (let i = 0; i < text.length; ++i) {
       if (!isWordChar(text.charAt(i))) {
         if (startWord !== -1)
           wordCallback(text.substring(startWord, i));
         startWord = -1;
       } else if (startWord === -1) {
         startWord = i;
       }
     }
     // Flush a word that runs up to the end of the text.
     if (startWord !== -1)
       wordCallback(text.substring(startWord));
   },

   /**
    * Returns the leading whitespace of |line| (the whole line if it is all whitespace).
    *
    * @param {string} line
    * @return {string}
    */
   lineIndent: function(line) {
     let indentation = 0;
     while (indentation < line.length && Common.TextUtils.isSpaceChar(line.charAt(indentation)))
       ++indentation;
     // substring() instead of the deprecated substr(); identical for a (0, length) range.
     return line.substring(0, indentation);
   },

   /**
    * True when upper-casing leaves |text| unchanged, which includes strings
    * that contain no cased characters at all.
    *
    * @param {string} text
    * @return {boolean}
    */
   isUpperCase: function(text) {
     return text === text.toUpperCase();
   },

   /**
    * True when lower-casing leaves |text| unchanged, which includes strings
    * that contain no cased characters at all.
    *
    * @param {string} text
    * @return {boolean}
    */
   isLowerCase: function(text) {
     return text === text.toLowerCase();
   },

   /**
    * Cuts |text| into consecutive pieces. The first regex is applied to the whole
    * text; every stretch it does not match is handed to the next regex, and so on.
    * Each non-empty match is reported with the index of the regex that produced it;
    * text that no regex matched is reported with regexIndex -1. |position| is the
    * offset of the piece in the original |text|.
    *
    * Regexes that already carry the 'g' flag are used directly, so their lastIndex
    * is reset and advanced by this call; other regexes are cloned with 'g' added.
    * Zero-length matches are skipped.
    *
    * @param {string} text
    * @param {!Array<!RegExp>} regexes
    * @return {!Array<{value: string, position: number, regexIndex: number}>}
    */
   splitStringByRegexes(text, regexes) {
     const matches = [];
     const globalRegexes = [];
     for (const regex of regexes) {
       if (regex.global)
         globalRegexes.push(regex);
       else
         globalRegexes.push(new RegExp(regex.source, regex.flags ? regex.flags + 'g' : 'g'));
     }
     doSplit(text, 0, 0);
     return matches;

     /**
      * @param {string} text Piece of the original text still to be split.
      * @param {number} regexIndex Index of the regex to apply to this piece.
      * @param {number} startIndex Offset of |text| within the original text.
      */
     function doSplit(text, regexIndex, startIndex) {
       if (regexIndex >= globalRegexes.length) {
         // Set regexIndex as -1 if text did not match with any regular expression
         matches.push({value: text, position: startIndex, regexIndex: -1});
         return;
       }
       const regex = globalRegexes[regexIndex];
       let currentIndex = 0;
       let result;
       regex.lastIndex = 0;
       while ((result = regex.exec(text)) !== null) {
         const match = result[0];
         if (!match) {
           // exec() does not move lastIndex past an empty match; step over it
           // manually, otherwise the same empty match is returned forever.
           ++regex.lastIndex;
           continue;
         }
         const stringBeforeMatch = text.substring(currentIndex, result.index);
         if (stringBeforeMatch)
           doSplit(stringBeforeMatch, regexIndex + 1, startIndex + currentIndex);
         matches.push({value: match, position: startIndex + result.index, regexIndex: regexIndex});
         currentIndex = result.index + match.length;
       }
       const stringAfterMatches = text.substring(currentIndex);
       if (stringAfterMatches)
         doSplit(stringAfterMatches, regexIndex + 1, startIndex + currentIndex);
     }
   }
 };

 // Pattern tested by Common.TextUtils.isSpaceChar(). It has no 'g' or 'y' flag,
 // so test() neither reads nor updates lastIndex between calls.
 Common.TextUtils._SpaceCharRegex = /\s/;

 /**
  * Named whitespace strings: two, four or eight space characters, or a single tab.
  * @enum {string}
  */
 Common.TextUtils.Indent = {
   TwoSpaces: '  ',
   FourSpaces: '    ',
   EightSpaces: '        ',
   TabCharacter: '\t'
 };

 /**
  * @unrestricted
  */
 Common.TextUtils.BalancedJSONTokenizer = class {
   /**
    * Incremental scanner that accumulates written chunks in a buffer, tracks the
    * balance of '{' and '}' outside double-quoted strings, and hands each
    * brace-balanced prefix of the buffer to |callback|.
    *
    * @param {function(string)} callback Receives the balanced prefix cut from the buffer.
    * @param {boolean=} findMultiple When falsy, a write() stops scanning as soon as
    *     the balance returns to zero; when true it keeps scanning the rest of the buffer.
    */
   constructor(callback, findMultiple) {
     this._callback = callback;
     // Offset in |_buffer| at which the next write() resumes scanning.
     this._index = 0;
     // Number of '{' seen minus number of '}' seen so far.
     this._balance = 0;
     this._buffer = '';
     this._findMultiple = findMultiple || false;
     // One non-backslash character, then any number of backslash pairs, then '"':
     // i.e. a double quote preceded by an even number of backslashes.
     this._closingDoubleQuoteRegex = /[^\\](?:\\\\)*"/g;
     // Note: |_lastBalancedIndex| is not initialized here; it is first assigned in
     // write(), and _reportBalanced() treats undefined and 0 the same way.
   }

   /**
    * Appends |chunk| to the buffer and continues scanning from where the previous
    * call stopped.
    *
    * @param {string} chunk
    * @return {boolean} false when a '}' drives the balance below zero or a ']' is
    *     seen while the balance is zero; true otherwise.
    */
   write(chunk) {
     this._buffer += chunk;
     var lastIndex = this._buffer.length;
     var buffer = this._buffer;
     for (var index = this._index; index < lastIndex; ++index) {
       var character = buffer[index];
       if (character === '"') {
         // Search for the closing quote starting at the opening one.
         this._closingDoubleQuoteRegex.lastIndex = index;
         // No closing quote buffered yet: stop with |index| still on the opening
         // quote so the next write() retries from there.
         if (!this._closingDoubleQuoteRegex.test(buffer))
           break;
         // lastIndex is just past the closing quote; the loop's ++index lands there.
         index = this._closingDoubleQuoteRegex.lastIndex - 1;
       } else if (character === '{') {
         ++this._balance;
       } else if (character === '}') {
         --this._balance;
         if (this._balance < 0) {
           this._reportBalanced();
           return false;
         }
         if (!this._balance) {
           // Everything up to and including this '}' forms a balanced prefix.
           this._lastBalancedIndex = index + 1;
           // NOTE(review): on this break |index| still points at the '}', so after
           // _reportBalanced() rebases it, |_index| ends up at -1; the next write()
           // then reads buffer[-1] (undefined), which matches no branch.
           if (!this._findMultiple)
             break;
         }
       } else if (character === ']' && !this._balance) {
         this._reportBalanced();
         return false;
       }
     }
     this._index = index;
     this._reportBalanced();
     return true;
   }

   /**
    * If a balanced prefix has been recorded, passes it to the callback, removes it
    * from the buffer and shifts |_index| by the removed length.
    */
   _reportBalanced() {
     if (!this._lastBalancedIndex)
       return;
     this._callback(this._buffer.slice(0, this._lastBalancedIndex));
     this._buffer = this._buffer.slice(this._lastBalancedIndex);
     this._index -= this._lastBalancedIndex;
     this._lastBalancedIndex = 0;
   }

   /**
    * @return {string} The buffered text that has not been reported to the callback.
    */
   remainder() {
     return this._buffer;
   }
 };

 /**
  * Interface declaration; the constructor and its method have empty bodies and
  * only carry type annotations for implementers.
  * @interface
  */
 Common.TokenizerFactory = function() {};

 Common.TokenizerFactory.prototype = {
   /**
    * Returns a tokenizer function for |mimeType|. Per the annotation, the tokenizer
    * takes a string and a callback that receives (string, ?string, number, number).
    * NOTE(review): the meaning of the callback arguments is not visible in this file;
    * confirm against an implementation.
    *
    * @param {string} mimeType
    * @return {function(string, function(string, ?string, number, number))}
    */
   createTokenizer: function(mimeType) {}
 };
	/*
	* Copyright (C) 2013 Google Inc. All rights reserved.
	*
	* Redistribution and use in source and binary forms, with or without
	* modification, are permitted provided that the following conditions are
	* met:
	*
	* * Redistributions of source code must retain the above copyright
	* notice, this list of conditions and the following disclaimer.
	* * Redistributions in binary form must reproduce the above
	* copyright notice, this list of conditions and the following disclaimer
	* in the documentation and/or other materials provided with the
	* distribution.
	* * Neither the name of Google Inc. nor the names of its
	* contributors may be used to endorse or promote products derived from
	* this software without specific prior written permission.
	*
	* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
	* "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
	* LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
	* A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
	* OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
	* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
	* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
	* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
	* THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
	* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
	* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
	*/
	Common.TextUtils = {
	  /**
	   * Tells whether |char| is an ASCII punctuation/symbol character other than '_':
	   * one of !"#$%&'()*+,-./ :;<=>?@ [\]^ ` {|}~.
	   * The comparisons are plain string comparisons, so the result is only
	   * meaningful for a single-character argument.
	   *
	   * @param {string} char
	   * @return {boolean}
	   */
	  isStopChar: function(char) {
	    return (char > ' ' && char < '0') || (char > '9' && char < 'A') || (char > 'Z' && char < '_') ||
	        (char > '_' && char < 'a') || (char > 'z' && char <= '~');
	  },

	  /**
	   * A word character is anything that is neither a stop character nor whitespace.
	   *
	   * @param {string} char
	   * @return {boolean}
	   */
	  isWordChar: function(char) {
	    return !Common.TextUtils.isStopChar(char) && !Common.TextUtils.isSpaceChar(char);
	  },

	  /**
	   * Tests |char| against Common.TextUtils._SpaceCharRegex.
	   *
	   * @param {string} char
	   * @return {boolean}
	   */
	  isSpaceChar: function(char) {
	    return Common.TextUtils._SpaceCharRegex.test(char);
	  },

	  /**
	   * Returns true when every character of |word| is a word character.
	   * The empty string therefore counts as a word.
	   *
	   * @param {string} word
	   * @return {boolean}
	   */
	  isWord: function(word) {
	    for (let i = 0; i < word.length; ++i) {
	      if (!Common.TextUtils.isWordChar(word.charAt(i)))
	        return false;
	    }
	    return true;
	  },

	  /**
	   * @param {string} char
	   * @return {boolean} True for '(' and '{'.
	   */
	  isOpeningBraceChar: function(char) {
	    return char === '(' || char === '{';
	  },

	  /**
	   * @param {string} char
	   * @return {boolean} True for ')' and '}'.
	   */
	  isClosingBraceChar: function(char) {
	    return char === ')' || char === '}';
	  },

	  /**
	   * @param {string} char
	   * @return {boolean} True for any of '(', '{', ')' and '}'.
	   */
	  isBraceChar: function(char) {
	    return Common.TextUtils.isOpeningBraceChar(char) || Common.TextUtils.isClosingBraceChar(char);
	  },

	  /**
	   * Invokes |wordCallback| once, in order, for every maximal run of characters
	   * accepted by |isWordChar|.
	   *
	   * @param {string} text
	   * @param {function(string):boolean} isWordChar
	   * @param {function(string)} wordCallback
	   */
	  textToWords: function(text, isWordChar, wordCallback) {
	    // Index where the word currently being scanned started, or -1 between words.
	    let startWord = -1;
	    for (let i = 0; i < text.length; ++i) {
	      if (!isWordChar(text.charAt(i))) {
	        if (startWord !== -1)
	          wordCallback(text.substring(startWord, i));
	        startWord = -1;
	      } else if (startWord === -1) {
	        startWord = i;
	      }
	    }
	    // Flush a word that runs up to the end of the text.
	    if (startWord !== -1)
	      wordCallback(text.substring(startWord));
	  },

	  /**
	   * Returns the leading whitespace of |line| (the whole line if it is all whitespace).
	   *
	   * @param {string} line
	   * @return {string}
	   */
	  lineIndent: function(line) {
	    let indentation = 0;
	    while (indentation < line.length && Common.TextUtils.isSpaceChar(line.charAt(indentation)))
	      ++indentation;
	    // substring() instead of the deprecated substr(); identical for a (0, length) range.
	    return line.substring(0, indentation);
	  },

	  /**
	   * True when upper-casing leaves |text| unchanged, which includes strings
	   * that contain no cased characters at all.
	   *
	   * @param {string} text
	   * @return {boolean}
	   */
	  isUpperCase: function(text) {
	    return text === text.toUpperCase();
	  },

	  /**
	   * True when lower-casing leaves |text| unchanged, which includes strings
	   * that contain no cased characters at all.
	   *
	   * @param {string} text
	   * @return {boolean}
	   */
	  isLowerCase: function(text) {
	    return text === text.toLowerCase();
	  },

	  /**
	   * Cuts |text| into consecutive pieces. The first regex is applied to the whole
	   * text; every stretch it does not match is handed to the next regex, and so on.
	   * Each non-empty match is reported with the index of the regex that produced it;
	   * text that no regex matched is reported with regexIndex -1. |position| is the
	   * offset of the piece in the original |text|.
	   *
	   * Regexes that already carry the 'g' flag are used directly, so their lastIndex
	   * is reset and advanced by this call; other regexes are cloned with 'g' added.
	   * Zero-length matches are skipped.
	   *
	   * @param {string} text
	   * @param {!Array<!RegExp>} regexes
	   * @return {!Array<{value: string, position: number, regexIndex: number}>}
	   */
	  splitStringByRegexes(text, regexes) {
	    const matches = [];
	    const globalRegexes = [];
	    for (const regex of regexes) {
	      if (regex.global)
	        globalRegexes.push(regex);
	      else
	        globalRegexes.push(new RegExp(regex.source, regex.flags ? regex.flags + 'g' : 'g'));
	    }
	    doSplit(text, 0, 0);
	    return matches;

	    /**
	     * @param {string} text Piece of the original text still to be split.
	     * @param {number} regexIndex Index of the regex to apply to this piece.
	     * @param {number} startIndex Offset of |text| within the original text.
	     */
	    function doSplit(text, regexIndex, startIndex) {
	      if (regexIndex >= globalRegexes.length) {
	        // Set regexIndex as -1 if text did not match with any regular expression
	        matches.push({value: text, position: startIndex, regexIndex: -1});
	        return;
	      }
	      const regex = globalRegexes[regexIndex];
	      let currentIndex = 0;
	      let result;
	      regex.lastIndex = 0;
	      while ((result = regex.exec(text)) !== null) {
	        const match = result[0];
	        if (!match) {
	          // exec() does not move lastIndex past an empty match; step over it
	          // manually, otherwise the same empty match is returned forever.
	          ++regex.lastIndex;
	          continue;
	        }
	        const stringBeforeMatch = text.substring(currentIndex, result.index);
	        if (stringBeforeMatch)
	          doSplit(stringBeforeMatch, regexIndex + 1, startIndex + currentIndex);
	        matches.push({value: match, position: startIndex + result.index, regexIndex: regexIndex});
	        currentIndex = result.index + match.length;
	      }
	      const stringAfterMatches = text.substring(currentIndex);
	      if (stringAfterMatches)
	        doSplit(stringAfterMatches, regexIndex + 1, startIndex + currentIndex);
	    }
	  }
	};

	// Pattern tested by Common.TextUtils.isSpaceChar(). It has no 'g' or 'y' flag,
	// so test() neither reads nor updates lastIndex between calls.
	Common.TextUtils._SpaceCharRegex = /\s/;

	/**
	* @enum {string}
	*/
	// Named whitespace strings. The number of spaces in each literal must match
	// its key (2, 4 and 8); they had been collapsed to a single space each.
	Common.TextUtils.Indent = {
	  TwoSpaces: '  ',
	  FourSpaces: '    ',
	  EightSpaces: '        ',
	  TabCharacter: '\t'
	};

	/**
	* @unrestricted
	*/
	Common.TextUtils.BalancedJSONTokenizer = class {
	  /**
	   * Incremental scanner that accumulates written chunks in a buffer, tracks the
	   * balance of '{' and '}' outside double-quoted strings, and hands each
	   * brace-balanced prefix of the buffer to |callback|.
	   *
	   * @param {function(string)} callback Receives the balanced prefix cut from the buffer.
	   * @param {boolean=} findMultiple When falsy, a write() stops scanning as soon as
	   *     the balance returns to zero; when true it keeps scanning the rest of the buffer.
	   */
	  constructor(callback, findMultiple) {
	    this._callback = callback;
	    // Offset in |_buffer| at which the next write() resumes scanning.
	    this._index = 0;
	    // Number of '{' seen minus number of '}' seen so far.
	    this._balance = 0;
	    this._buffer = '';
	    this._findMultiple = findMultiple || false;
	    // One non-backslash character, then any number of backslash pairs, then '"':
	    // i.e. a double quote preceded by an even number of backslashes.
	    this._closingDoubleQuoteRegex = /[^\\](?:\\\\)*"/g;
	  }

	  /**
	   * Appends |chunk| to the buffer and continues scanning from where the previous
	   * call stopped.
	   *
	   * @param {string} chunk
	   * @return {boolean} false when a '}' drives the balance below zero or a ']' is
	   *     seen while the balance is zero; true otherwise.
	   */
	  write(chunk) {
	    this._buffer += chunk;
	    var lastIndex = this._buffer.length;
	    var buffer = this._buffer;
	    for (var index = this._index; index < lastIndex; ++index) {
	      var character = buffer[index];
	      if (character === '"') {
	        // Search for the closing quote starting at the opening one.
	        this._closingDoubleQuoteRegex.lastIndex = index;
	        // No closing quote buffered yet: stop with |index| still on the opening
	        // quote so the next write() retries from there.
	        if (!this._closingDoubleQuoteRegex.test(buffer))
	          break;
	        // lastIndex is just past the closing quote; the loop's ++index lands there.
	        index = this._closingDoubleQuoteRegex.lastIndex - 1;
	      } else if (character === '{') {
	        ++this._balance;
	      } else if (character === '}') {
	        --this._balance;
	        if (this._balance < 0) {
	          this._reportBalanced();
	          return false;
	        }
	        if (!this._balance) {
	          // Everything up to and including this '}' forms a balanced prefix.
	          this._lastBalancedIndex = index + 1;
	          if (!this._findMultiple)
	            break;
	        }
	      } else if (character === ']' && !this._balance) {
	        this._reportBalanced();
	        return false;
	      }
	    }
	    this._index = index;
	    this._reportBalanced();
	    return true;
	  }

	  /**
	   * If a balanced prefix has been recorded, passes it to the callback, removes it
	   * from the buffer and shifts |_index| by the removed length.
	   */
	  _reportBalanced() {
	    if (!this._lastBalancedIndex)
	      return;
	    this._callback(this._buffer.slice(0, this._lastBalancedIndex));
	    this._buffer = this._buffer.slice(this._lastBalancedIndex);
	    this._index -= this._lastBalancedIndex;
	    this._lastBalancedIndex = 0;
	  }

	  /**
	   * @return {string} The buffered text that has not been reported to the callback.
	   */
	  remainder() {
	    return this._buffer;
	  }
	};

	/**
	* Interface declaration; the constructor and its method have empty bodies and
	* only carry type annotations for implementers.
	* @interface
	*/
	Common.TokenizerFactory = function() {};

	Common.TokenizerFactory.prototype = {
	/**
	* Returns a tokenizer function for |mimeType|. Per the annotation, the tokenizer
	* takes a string and a callback that receives (string, ?string, number, number).
	* NOTE(review): the meaning of the callback arguments is not visible in this file;
	* confirm against an implementation.
	*
	* @param {string} mimeType
	* @return {function(string, function(string, ?string, number, number))}
	*/
	createTokenizer: function(mimeType) {}
	};
	};