lib/goog/string/string.js

1 // Copyright 2006 The Closure Library Authors. All Rights Reserved.
2 //
3 // Licensed under the Apache License, Version 2.0 (the "License");
4 // you may not use this file except in compliance with the License.
5 // You may obtain a copy of the License at
6 //
7 //      http://www.apache.org/licenses/LICENSE-2.0
8 //
9 // Unless required by applicable law or agreed to in writing, software
10 // distributed under the License is distributed on an "AS-IS" BASIS,
11 // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12 // See the License for the specific language governing permissions and
13 // limitations under the License.
14 
15 /**
16  * @fileoverview Utilities for string manipulation.
17  */
18 
19 
20 /**
21  * Namespace for string utilities
22  */
23 goog.provide('goog.string');
24 goog.provide('goog.string.Unicode');
25 
26 
27 /**
28  * @define {boolean} Enables HTML escaping of lowercase letter "e" which helps
29  * with detection of double-escaping as this letter is frequently used.
30  */
31 goog.define('goog.string.DETECT_DOUBLE_ESCAPING', false);
32 
33 
34 /**
35  * Common Unicode string characters.
36  * @enum {string}
37  */
38 goog.string.Unicode = {
39   NBSP: '\xa0'
40 };
41 
42 
43 /**
44  * Fast prefix-checker.
45  * @param {string} str The string to check.
46  * @param {string} prefix A string to look for at the start of {@code str}.
47  * @return {boolean} True if {@code str} begins with {@code prefix}.
48  */
49 goog.string.startsWith = function(str, prefix) {
50   return str.lastIndexOf(prefix, 0) == 0;
51 };
52 
53 
54 /**
55  * Fast suffix-checker.
56  * @param {string} str The string to check.
57  * @param {string} suffix A string to look for at the end of {@code str}.
58  * @return {boolean} True if {@code str} ends with {@code suffix}.
59  */
60 goog.string.endsWith = function(str, suffix) {
61   var l = str.length - suffix.length;
62   return l >= 0 && str.indexOf(suffix, l) == l;
63 };
64 
65 
66 /**
67  * Case-insensitive prefix-checker.
68  * @param {string} str The string to check.
69  * @param {string} prefix  A string to look for at the end of {@code str}.
70  * @return {boolean} True if {@code str} begins with {@code prefix} (ignoring
71  *     case).
72  */
73 goog.string.caseInsensitiveStartsWith = function(str, prefix) {
74   return goog.string.caseInsensitiveCompare(
75       prefix, str.substr(0, prefix.length)) == 0;
76 };
77 
78 
79 /**
80  * Case-insensitive suffix-checker.
81  * @param {string} str The string to check.
82  * @param {string} suffix A string to look for at the end of {@code str}.
83  * @return {boolean} True if {@code str} ends with {@code suffix} (ignoring
84  *     case).
85  */
86 goog.string.caseInsensitiveEndsWith = function(str, suffix) {
87   return goog.string.caseInsensitiveCompare(
88       suffix, str.substr(str.length - suffix.length, suffix.length)) == 0;
89 };
90 
91 
92 /**
93  * Case-insensitive equality checker.
94  * @param {string} str1 First string to check.
95  * @param {string} str2 Second string to check.
96  * @return {boolean} True if {@code str1} and {@code str2} are the same string,
97  *     ignoring case.
98  */
99 goog.string.caseInsensitiveEquals = function(str1, str2) {
100   return str1.toLowerCase() == str2.toLowerCase();
101 };
102 
103 
104 /**
105  * Does simple python-style string substitution.
106  * subs("foo%s hot%s", "bar", "dog") becomes "foobar hotdog".
107  * @param {string} str The string containing the pattern.
108  * @param {...*} var_args The items to substitute into the pattern.
109  * @return {string} A copy of {@code str} in which each occurrence of
110  *     {@code %s} has been replaced an argument from {@code var_args}.
111  */
112 goog.string.subs = function(str, var_args) {
113   var splitParts = str.split('%s');
114   var returnString = '';
115 
116   var subsArguments = Array.prototype.slice.call(arguments, 1);
117   while (subsArguments.length &&
118          // Replace up to the last split part. We are inserting in the
119          // positions between split parts.
120          splitParts.length > 1) {
121     returnString += splitParts.shift() + subsArguments.shift();
122   }
123 
124   return returnString + splitParts.join('%s'); // Join unused '%s'
125 };
126 
127 
128 /**
129  * Converts multiple whitespace chars (spaces, non-breaking-spaces, new lines
130  * and tabs) to a single space, and strips leading and trailing whitespace.
131  * @param {string} str Input string.
132  * @return {string} A copy of {@code str} with collapsed whitespace.
133  */
134 goog.string.collapseWhitespace = function(str) {
135   // Since IE doesn't include non-breaking-space (0xa0) in their \s character
136   // class (as required by section 7.2 of the ECMAScript spec), we explicitly
137   // include it in the regexp to enforce consistent cross-browser behavior.
138   return str.replace(/[\s\xa0]+/g, ' ').replace(/^\s+|\s+$/g, '');
139 };
140 
141 
142 /**
143  * Checks if a string is empty or contains only whitespaces.
144  * @param {string} str The string to check.
145  * @return {boolean} True if {@code str} is empty or whitespace only.
146  */
147 goog.string.isEmpty = function(str) {
148   // testing length == 0 first is actually slower in all browsers (about the
149   // same in Opera).
150   // Since IE doesn't include non-breaking-space (0xa0) in their \s character
151   // class (as required by section 7.2 of the ECMAScript spec), we explicitly
152   // include it in the regexp to enforce consistent cross-browser behavior.
153   return /^[\s\xa0]*$/.test(str);
154 };
155 
156 
157 /**
158  * Checks if a string is null, undefined, empty or contains only whitespaces.
159  * @param {*} str The string to check.
160  * @return {boolean} True if{@code str} is null, undefined, empty, or
161  *     whitespace only.
162  */
163 goog.string.isEmptySafe = function(str) {
164   return goog.string.isEmpty(goog.string.makeSafe(str));
165 };
166 
167 
168 /**
169  * Checks if a string is all breaking whitespace.
170  * @param {string} str The string to check.
171  * @return {boolean} Whether the string is all breaking whitespace.
172  */
173 goog.string.isBreakingWhitespace = function(str) {
174   return !/[^\t\n\r ]/.test(str);
175 };
176 
177 
178 /**
179  * Checks if a string contains all letters.
180  * @param {string} str string to check.
181  * @return {boolean} True if {@code str} consists entirely of letters.
182  */
183 goog.string.isAlpha = function(str) {
184   return !/[^a-zA-Z]/.test(str);
185 };
186 
187 
188 /**
189  * Checks if a string contains only numbers.
190  * @param {*} str string to check. If not a string, it will be
191  *     casted to one.
192  * @return {boolean} True if {@code str} is numeric.
193  */
194 goog.string.isNumeric = function(str) {
195   return !/[^0-9]/.test(str);
196 };
197 
198 
199 /**
200  * Checks if a string contains only numbers or letters.
201  * @param {string} str string to check.
202  * @return {boolean} True if {@code str} is alphanumeric.
203  */
204 goog.string.isAlphaNumeric = function(str) {
205   return !/[^a-zA-Z0-9]/.test(str);
206 };
207 
208 
209 /**
210  * Checks if a character is a space character.
211  * @param {string} ch Character to check.
212  * @return {boolean} True if {code ch} is a space.
213  */
214 goog.string.isSpace = function(ch) {
215   return ch == ' ';
216 };
217 
218 
219 /**
220  * Checks if a character is a valid unicode character.
221  * @param {string} ch Character to check.
222  * @return {boolean} True if {code ch} is a valid unicode character.
223  */
224 goog.string.isUnicodeChar = function(ch) {
225   return ch.length == 1 && ch >= ' ' && ch <= '~' ||
226          ch >= '\u0080' && ch <= '\uFFFD';
227 };
228 
229 
230 /**
231  * Takes a string and replaces newlines with a space. Multiple lines are
232  * replaced with a single space.
233  * @param {string} str The string from which to strip newlines.
234  * @return {string} A copy of {@code str} stripped of newlines.
235  */
236 goog.string.stripNewlines = function(str) {
237   return str.replace(/(\r\n|\r|\n)+/g, ' ');
238 };
239 
240 
241 /**
242  * Replaces Windows and Mac new lines with unix style: \r or \r\n with \n.
243  * @param {string} str The string to in which to canonicalize newlines.
244  * @return {string} {@code str} A copy of {@code} with canonicalized newlines.
245  */
246 goog.string.canonicalizeNewlines = function(str) {
247   return str.replace(/(\r\n|\r|\n)/g, '\n');
248 };
249 
250 
251 /**
252  * Normalizes whitespace in a string, replacing all whitespace chars with
253  * a space.
254  * @param {string} str The string in which to normalize whitespace.
255  * @return {string} A copy of {@code str} with all whitespace normalized.
256  */
257 goog.string.normalizeWhitespace = function(str) {
258   return str.replace(/\xa0|\s/g, ' ');
259 };
260 
261 
262 /**
263  * Normalizes spaces in a string, replacing all consecutive spaces and tabs
264  * with a single space. Replaces non-breaking space with a space.
265  * @param {string} str The string in which to normalize spaces.
266  * @return {string} A copy of {@code str} with all consecutive spaces and tabs
267  *    replaced with a single space.
268  */
269 goog.string.normalizeSpaces = function(str) {
270   return str.replace(/\xa0|[ \t]+/g, ' ');
271 };
272 
273 
274 /**
275  * Removes the breaking spaces from the left and right of the string and
276  * collapses the sequences of breaking spaces in the middle into single spaces.
277  * The original and the result strings render the same way in HTML.
278  * @param {string} str A string in which to collapse spaces.
279  * @return {string} Copy of the string with normalized breaking spaces.
280  */
281 goog.string.collapseBreakingSpaces = function(str) {
282   return str.replace(/[\t\r\n ]+/g, ' ').replace(
283       /^[\t\r\n ]+|[\t\r\n ]+$/g, '');
284 };
285 
286 
287 /**
288  * Trims white spaces to the left and right of a string.
289  * @param {string} str The string to trim.
290  * @return {string} A trimmed copy of {@code str}.
291  */
292 goog.string.trim = function(str) {
293   // Since IE doesn't include non-breaking-space (0xa0) in their \s character
294   // class (as required by section 7.2 of the ECMAScript spec), we explicitly
295   // include it in the regexp to enforce consistent cross-browser behavior.
296   return str.replace(/^[\s\xa0]+|[\s\xa0]+$/g, '');
297 };
298 
299 
300 /**
301  * Trims whitespaces at the left end of a string.
302  * @param {string} str The string to left trim.
303  * @return {string} A trimmed copy of {@code str}.
304  */
305 goog.string.trimLeft = function(str) {
306   // Since IE doesn't include non-breaking-space (0xa0) in their \s character
307   // class (as required by section 7.2 of the ECMAScript spec), we explicitly
308   // include it in the regexp to enforce consistent cross-browser behavior.
309   return str.replace(/^[\s\xa0]+/, '');
310 };
311 
312 
313 /**
314  * Trims whitespaces at the right end of a string.
315  * @param {string} str The string to right trim.
316  * @return {string} A trimmed copy of {@code str}.
317  */
318 goog.string.trimRight = function(str) {
319   // Since IE doesn't include non-breaking-space (0xa0) in their \s character
320   // class (as required by section 7.2 of the ECMAScript spec), we explicitly
321   // include it in the regexp to enforce consistent cross-browser behavior.
322   return str.replace(/[\s\xa0]+$/, '');
323 };
324 
325 
326 /**
327  * A string comparator that ignores case.
328  * -1 = str1 less than str2
329  *  0 = str1 equals str2
330  *  1 = str1 greater than str2
331  *
332  * @param {string} str1 The string to compare.
333  * @param {string} str2 The string to compare {@code str1} to.
334  * @return {number} The comparator result, as described above.
335  */
336 goog.string.caseInsensitiveCompare = function(str1, str2) {
337   var test1 = String(str1).toLowerCase();
338   var test2 = String(str2).toLowerCase();
339 
340   if (test1 < test2) {
341     return -1;
342   } else if (test1 == test2) {
343     return 0;
344   } else {
345     return 1;
346   }
347 };
348 
349 
350 /**
351  * Regular expression used for splitting a string into substrings of fractional
352  * numbers, integers, and non-numeric characters.
353  * @type {RegExp}
354  * @private
355  */
356 goog.string.numerateCompareRegExp_ = /(\.\d+)|(\d+)|(\D+)/g;
357 
358 
359 /**
360  * String comparison function that handles numbers in a way humans might expect.
361  * Using this function, the string "File 2.jpg" sorts before "File 10.jpg". The
362  * comparison is mostly case-insensitive, though strings that are identical
363  * except for case are sorted with the upper-case strings before lower-case.
364  *
365  * This comparison function is significantly slower (about 500x) than either
366  * the default or the case-insensitive compare. It should not be used in
367  * time-critical code, but should be fast enough to sort several hundred short
368  * strings (like filenames) with a reasonable delay.
369  *
370  * @param {string} str1 The string to compare in a numerically sensitive way.
371  * @param {string} str2 The string to compare {@code str1} to.
372  * @return {number} less than 0 if str1 < str2, 0 if str1 == str2, greater than
373  *     0 if str1 > str2.
374  */
375 goog.string.numerateCompare = function(str1, str2) {
376   if (str1 == str2) {
377     return 0;
378   }
379   if (!str1) {
380     return -1;
381   }
382   if (!str2) {
383     return 1;
384   }
385 
386   // Using match to split the entire string ahead of time turns out to be faster
387   // for most inputs than using RegExp.exec or iterating over each character.
388   var tokens1 = str1.toLowerCase().match(goog.string.numerateCompareRegExp_);
389   var tokens2 = str2.toLowerCase().match(goog.string.numerateCompareRegExp_);
390 
391   var count = Math.min(tokens1.length, tokens2.length);
392 
393   for (var i = 0; i < count; i++) {
394     var a = tokens1[i];
395     var b = tokens2[i];
396 
397     // Compare pairs of tokens, returning if one token sorts before the other.
398     if (a != b) {
399 
400       // Only if both tokens are integers is a special comparison required.
401       // Decimal numbers are sorted as strings (e.g., '.09' < '.1').
402       var num1 = parseInt(a, 10);
403       if (!isNaN(num1)) {
404         var num2 = parseInt(b, 10);
405         if (!isNaN(num2) && num1 - num2) {
406           return num1 - num2;
407         }
408       }
409       return a < b ? -1 : 1;
410     }
411   }
412 
413   // If one string is a substring of the other, the shorter string sorts first.
414   if (tokens1.length != tokens2.length) {
415     return tokens1.length - tokens2.length;
416   }
417 
418   // The two strings must be equivalent except for case (perfect equality is
419   // tested at the head of the function.) Revert to default ASCII-betical string
420   // comparison to stablize the sort.
421   return str1 < str2 ? -1 : 1;
422 };
423 
424 
425 /**
426  * URL-encodes a string
427  * @param {*} str The string to url-encode.
428  * @return {string} An encoded copy of {@code str} that is safe for urls.
429  *     Note that '#', ':', and other characters used to delimit portions
430  *     of URLs *will* be encoded.
431  */
432 goog.string.urlEncode = function(str) {
433   return encodeURIComponent(String(str));
434 };
435 
436 
437 /**
438  * URL-decodes the string. We need to specially handle '+'s because
439  * the javascript library doesn't convert them to spaces.
440  * @param {string} str The string to url decode.
441  * @return {string} The decoded {@code str}.
442  */
443 goog.string.urlDecode = function(str) {
444   return decodeURIComponent(str.replace(/\+/g, ' '));
445 };
446 
447 
448 /**
449  * Converts \n to <br>s or <br />s.
450  * @param {string} str The string in which to convert newlines.
451  * @param {boolean=} opt_xml Whether to use XML compatible tags.
452  * @return {string} A copy of {@code str} with converted newlines.
453  */
454 goog.string.newLineToBr = function(str, opt_xml) {
455   return str.replace(/(\r\n|\r|\n)/g, opt_xml ? '<br />' : '<br>');
456 };
457 
458 
459 /**
460  * Escapes double quote '"' and single quote '\'' characters in addition to
461  * '&', '<', and '>' so that a string can be included in an HTML tag attribute
462  * value within double or single quotes.
463  *
464  * It should be noted that > doesn't need to be escaped for the HTML or XML to
465  * be valid, but it has been decided to escape it for consistency with other
466  * implementations.
467  *
468  * With goog.string.DETECT_DOUBLE_ESCAPING, this function escapes also the
469  * lowercase letter "e".
470  *
471  * NOTE(user):
472  * HtmlEscape is often called during the generation of large blocks of HTML.
473  * Using statics for the regular expressions and strings is an optimization
474  * that can more than half the amount of time IE spends in this function for
475  * large apps, since strings and regexes both contribute to GC allocations.
476  *
477  * Testing for the presence of a character before escaping increases the number
478  * of function calls, but actually provides a speed increase for the average
479  * case -- since the average case often doesn't require the escaping of all 4
480  * characters and indexOf() is much cheaper than replace().
481  * The worst case does suffer slightly from the additional calls, therefore the
482  * opt_isLikelyToContainHtmlChars option has been included for situations
483  * where all 4 HTML entities are very likely to be present and need escaping.
484  *
485  * Some benchmarks (times tended to fluctuate +-0.05ms):
486  *                                     FireFox                     IE6
487  * (no chars / average (mix of cases) / all 4 chars)
488  * no checks                     0.13 / 0.22 / 0.22         0.23 / 0.53 / 0.80
489  * indexOf                       0.08 / 0.17 / 0.26         0.22 / 0.54 / 0.84
490  * indexOf + re test             0.07 / 0.17 / 0.28         0.19 / 0.50 / 0.85
491  *
492  * An additional advantage of checking if replace actually needs to be called
493  * is a reduction in the number of object allocations, so as the size of the
494  * application grows the difference between the various methods would increase.
495  *
496  * @param {string} str string to be escaped.
497  * @param {boolean=} opt_isLikelyToContainHtmlChars Don't perform a check to see
498  *     if the character needs replacing - use this option if you expect each of
499  *     the characters to appear often. Leave false if you expect few html
500  *     characters to occur in your strings, such as if you are escaping HTML.
501  * @return {string} An escaped copy of {@code str}.
502  */
503 goog.string.htmlEscape = function(str, opt_isLikelyToContainHtmlChars) {
504 
505   if (opt_isLikelyToContainHtmlChars) {
506     str = str.replace(goog.string.AMP_RE_, '&amp;')
507           .replace(goog.string.LT_RE_, '&lt;')
508           .replace(goog.string.GT_RE_, '&gt;')
509           .replace(goog.string.QUOT_RE_, '&quot;')
510           .replace(goog.string.SINGLE_QUOTE_RE_, '&#39;')
511           .replace(goog.string.NULL_RE_, '&#0;');
512     if (goog.string.DETECT_DOUBLE_ESCAPING) {
513       str = str.replace(goog.string.E_RE_, '&#101;');
514     }
515     return str;
516 
517   } else {
518     // quick test helps in the case when there are no chars to replace, in
519     // worst case this makes barely a difference to the time taken
520     if (!goog.string.ALL_RE_.test(str)) return str;
521 
522     // str.indexOf is faster than regex.test in this case
523     if (str.indexOf('&') != -1) {
524       str = str.replace(goog.string.AMP_RE_, '&amp;');
525     }
526     if (str.indexOf('<') != -1) {
527       str = str.replace(goog.string.LT_RE_, '&lt;');
528     }
529     if (str.indexOf('>') != -1) {
530       str = str.replace(goog.string.GT_RE_, '&gt;');
531     }
532     if (str.indexOf('"') != -1) {
533       str = str.replace(goog.string.QUOT_RE_, '&quot;');
534     }
535     if (str.indexOf('\'') != -1) {
536       str = str.replace(goog.string.SINGLE_QUOTE_RE_, '&#39;');
537     }
538     if (str.indexOf('\x00') != -1) {
539       str = str.replace(goog.string.NULL_RE_, '&#0;');
540     }
541     if (goog.string.DETECT_DOUBLE_ESCAPING && str.indexOf('e') != -1) {
542       str = str.replace(goog.string.E_RE_, '&#101;');
543     }
544     return str;
545   }
546 };
547 
548 
549 /**
550  * Regular expression that matches an ampersand, for use in escaping.
551  * @const {!RegExp}
552  * @private
553  */
554 goog.string.AMP_RE_ = /&/g;
555 
556 
557 /**
558  * Regular expression that matches a less than sign, for use in escaping.
559  * @const {!RegExp}
560  * @private
561  */
562 goog.string.LT_RE_ = /</g;
563 
564 
565 /**
566  * Regular expression that matches a greater than sign, for use in escaping.
567  * @const {!RegExp}
568  * @private
569  */
570 goog.string.GT_RE_ = />/g;
571 
572 
573 /**
574  * Regular expression that matches a double quote, for use in escaping.
575  * @const {!RegExp}
576  * @private
577  */
578 goog.string.QUOT_RE_ = /"/g;
579 
580 
581 /**
582  * Regular expression that matches a single quote, for use in escaping.
583  * @const {!RegExp}
584  * @private
585  */
586 goog.string.SINGLE_QUOTE_RE_ = /'/g;
587 
588 
589 /**
590  * Regular expression that matches null character, for use in escaping.
591  * @const {!RegExp}
592  * @private
593  */
594 goog.string.NULL_RE_ = /\x00/g;
595 
596 
597 /**
598  * Regular expression that matches a lowercase letter "e", for use in escaping.
599  * @const {!RegExp}
600  * @private
601  */
602 goog.string.E_RE_ = /e/g;
603 
604 
605 /**
606  * Regular expression that matches any character that needs to be escaped.
607  * @const {!RegExp}
608  * @private
609  */
610 goog.string.ALL_RE_ = (goog.string.DETECT_DOUBLE_ESCAPING ?
611     /[\x00&<>"'e]/ :
612     /[\x00&<>"']/);
613 
614 
615 /**
616  * Unescapes an HTML string.
617  *
618  * @param {string} str The string to unescape.
619  * @return {string} An unescaped copy of {@code str}.
620  */
621 goog.string.unescapeEntities = function(str) {
622   if (goog.string.contains(str, '&')) {
623     // We are careful not to use a DOM if we do not have one. We use the []
624     // notation so that the JSCompiler will not complain about these objects and
625     // fields in the case where we have no DOM.
626     if ('document' in goog.global) {
627       return goog.string.unescapeEntitiesUsingDom_(str);
628     } else {
629       // Fall back on pure XML entities
630       return goog.string.unescapePureXmlEntities_(str);
631     }
632   }
633   return str;
634 };
635 
636 
637 /**
638  * Unescapes a HTML string using the provided document.
639  *
640  * @param {string} str The string to unescape.
641  * @param {!Document} document A document to use in escaping the string.
642  * @return {string} An unescaped copy of {@code str}.
643  */
644 goog.string.unescapeEntitiesWithDocument = function(str, document) {
645   if (goog.string.contains(str, '&')) {
646     return goog.string.unescapeEntitiesUsingDom_(str, document);
647   }
648   return str;
649 };
650 
651 
652 /**
653  * Unescapes an HTML string using a DOM to resolve non-XML, non-numeric
654  * entities. This function is XSS-safe and whitespace-preserving.
655  * @private
656  * @param {string} str The string to unescape.
657  * @param {Document=} opt_document An optional document to use for creating
658  *     elements. If this is not specified then the default window.document
659  *     will be used.
660  * @return {string} The unescaped {@code str} string.
661  */
662 goog.string.unescapeEntitiesUsingDom_ = function(str, opt_document) {
663   var seen = {'&amp;': '&', '&lt;': '<', '&gt;': '>', '&quot;': '"'};
664   var div;
665   if (opt_document) {
666     div = opt_document.createElement('div');
667   } else {
668     div = goog.global.document.createElement('div');
669   }
670   // Match as many valid entity characters as possible. If the actual entity
671   // happens to be shorter, it will still work as innerHTML will return the
672   // trailing characters unchanged. Since the entity characters do not include
673   // open angle bracket, there is no chance of XSS from the innerHTML use.
674   // Since no whitespace is passed to innerHTML, whitespace is preserved.
675   return str.replace(goog.string.HTML_ENTITY_PATTERN_, function(s, entity) {
676     // Check for cached entity.
677     var value = seen[s];
678     if (value) {
679       return value;
680     }
681     // Check for numeric entity.
682     if (entity.charAt(0) == '#') {
683       // Prefix with 0 so that hex entities (e.g. &#x10) parse as hex numbers.
684       var n = Number('0' + entity.substr(1));
685       if (!isNaN(n)) {
686         value = String.fromCharCode(n);
687       }
688     }
689     // Fall back to innerHTML otherwise.
690     if (!value) {
691       // Append a non-entity character to avoid a bug in Webkit that parses
692       // an invalid entity at the end of innerHTML text as the empty string.
693       div.innerHTML = s + ' ';
694       // Then remove the trailing character from the result.
695       value = div.firstChild.nodeValue.slice(0, -1);
696     }
697     // Cache and return.
698     return seen[s] = value;
699   });
700 };
701 
702 
703 /**
704  * Unescapes XML entities.
705  * @private
706  * @param {string} str The string to unescape.
707  * @return {string} An unescaped copy of {@code str}.
708  */
709 goog.string.unescapePureXmlEntities_ = function(str) {
710   return str.replace(/&([^;]+);/g, function(s, entity) {
711     switch (entity) {
712       case 'amp':
713         return '&';
714       case 'lt':
715         return '<';
716       case 'gt':
717         return '>';
718       case 'quot':
719         return '"';
720       default:
721         if (entity.charAt(0) == '#') {
722           // Prefix with 0 so that hex entities (e.g. &#x10) parse as hex.
723           var n = Number('0' + entity.substr(1));
724           if (!isNaN(n)) {
725             return String.fromCharCode(n);
726           }
727         }
728         // For invalid entities we just return the entity
729         return s;
730     }
731   });
732 };
733 
734 
735 /**
736  * Regular expression that matches an HTML entity.
737  * See also HTML5: Tokenization / Tokenizing character references.
738  * @private
739  * @type {!RegExp}
740  */
741 goog.string.HTML_ENTITY_PATTERN_ = /&([^;\s<&]+);?/g;
742 
743 
744 /**
745  * Do escaping of whitespace to preserve spatial formatting. We use character
746  * entity #160 to make it safer for xml.
747  * @param {string} str The string in which to escape whitespace.
748  * @param {boolean=} opt_xml Whether to use XML compatible tags.
749  * @return {string} An escaped copy of {@code str}.
750  */
751 goog.string.whitespaceEscape = function(str, opt_xml) {
752   // This doesn't use goog.string.preserveSpaces for backwards compatibility.
753   return goog.string.newLineToBr(str.replace(/  /g, ' &#160;'), opt_xml);
754 };
755 
756 
757 /**
758  * Preserve spaces that would be otherwise collapsed in HTML by replacing them
759  * with non-breaking space Unicode characters.
760  * @param {string} str The string in which to preserve whitespace.
761  * @return {string} A copy of {@code str} with preserved whitespace.
762  */
763 goog.string.preserveSpaces = function(str) {
764   return str.replace(/(^|[\n ]) /g, '$1' + goog.string.Unicode.NBSP);
765 };
766 
767 
768 /**
769  * Strip quote characters around a string.  The second argument is a string of
770  * characters to treat as quotes.  This can be a single character or a string of
771  * multiple character and in that case each of those are treated as possible
772  * quote characters. For example:
773  *
774  * <pre>
775  * goog.string.stripQuotes('"abc"', '"`') --> 'abc'
776  * goog.string.stripQuotes('`abc`', '"`') --> 'abc'
777  * </pre>
778  *
779  * @param {string} str The string to strip.
780  * @param {string} quoteChars The quote characters to strip.
781  * @return {string} A copy of {@code str} without the quotes.
782  */
783 goog.string.stripQuotes = function(str, quoteChars) {
784   var length = quoteChars.length;
785   for (var i = 0; i < length; i++) {
786     var quoteChar = length == 1 ? quoteChars : quoteChars.charAt(i);
787     if (str.charAt(0) == quoteChar && str.charAt(str.length - 1) == quoteChar) {
788       return str.substring(1, str.length - 1);
789     }
790   }
791   return str;
792 };
793 
794 
795 /**
796  * Truncates a string to a certain length and adds '...' if necessary.  The
797  * length also accounts for the ellipsis, so a maximum length of 10 and a string
798  * 'Hello World!' produces 'Hello W...'.
799  * @param {string} str The string to truncate.
800  * @param {number} chars Max number of characters.
801  * @param {boolean=} opt_protectEscapedCharacters Whether to protect escaped
802  *     characters from being cut off in the middle.
803  * @return {string} The truncated {@code str} string.
804  */
805 goog.string.truncate = function(str, chars, opt_protectEscapedCharacters) {
806   if (opt_protectEscapedCharacters) {
807     str = goog.string.unescapeEntities(str);
808   }
809 
810   if (str.length > chars) {
811     str = str.substring(0, chars - 3) + '...';
812   }
813 
814   if (opt_protectEscapedCharacters) {
815     str = goog.string.htmlEscape(str);
816   }
817 
818   return str;
819 };
820 
821 
822 /**
823  * Truncate a string in the middle, adding "..." if necessary,
824  * and favoring the beginning of the string.
825  * @param {string} str The string to truncate the middle of.
826  * @param {number} chars Max number of characters.
827  * @param {boolean=} opt_protectEscapedCharacters Whether to protect escaped
828  *     characters from being cutoff in the middle.
829  * @param {number=} opt_trailingChars Optional number of trailing characters to
830  *     leave at the end of the string, instead of truncating as close to the
831  *     middle as possible.
832  * @return {string} A truncated copy of {@code str}.
833  */
834 goog.string.truncateMiddle = function(str, chars,
835     opt_protectEscapedCharacters, opt_trailingChars) {
836   if (opt_protectEscapedCharacters) {
837     str = goog.string.unescapeEntities(str);
838   }
839 
840   if (opt_trailingChars && str.length > chars) {
841     if (opt_trailingChars > chars) {
842       opt_trailingChars = chars;
843     }
844     var endPoint = str.length - opt_trailingChars;
845     var startPoint = chars - opt_trailingChars;
846     str = str.substring(0, startPoint) + '...' + str.substring(endPoint);
847   } else if (str.length > chars) {
848     // Favor the beginning of the string:
849     var half = Math.floor(chars / 2);
850     var endPos = str.length - half;
851     half += chars % 2;
852     str = str.substring(0, half) + '...' + str.substring(endPos);
853   }
854 
855   if (opt_protectEscapedCharacters) {
856     str = goog.string.htmlEscape(str);
857   }
858 
859   return str;
860 };
861 
862 
863 /**
864  * Special chars that need to be escaped for goog.string.quote.
865  * @private
866  * @type {Object}
867  */
868 goog.string.specialEscapeChars_ = {
869   '\0': '\\0',
870   '\b': '\\b',
871   '\f': '\\f',
872   '\n': '\\n',
873   '\r': '\\r',
874   '\t': '\\t',
875   '\x0B': '\\x0B', // '\v' is not supported in JScript
876   '"': '\\"',
877   '\\': '\\\\'
878 };
879 
880 
881 /**
882  * Character mappings used internally for goog.string.escapeChar.
883  * @private
884  * @type {Object}
885  */
886 goog.string.jsEscapeCache_ = {
887   '\'': '\\\''
888 };
889 
890 
891 /**
892  * Encloses a string in double quotes and escapes characters so that the
893  * string is a valid JS string.
894  * @param {string} s The string to quote.
895  * @return {string} A copy of {@code s} surrounded by double quotes.
896  */
897 goog.string.quote = function(s) {
898   s = String(s);
899   if (s.quote) {
900     return s.quote();
901   } else {
902     var sb = ['"'];
903     for (var i = 0; i < s.length; i++) {
904       var ch = s.charAt(i);
905       var cc = ch.charCodeAt(0);
906       sb[i + 1] = goog.string.specialEscapeChars_[ch] ||
907           ((cc > 31 && cc < 127) ? ch : goog.string.escapeChar(ch));
908     }
909     sb.push('"');
910     return sb.join('');
911   }
912 };
913 
914 
915 /**
916  * Takes a string and returns the escaped string for that character.
917  * @param {string} str The string to escape.
918  * @return {string} An escaped string representing {@code str}.
919  */
920 goog.string.escapeString = function(str) {
921   var sb = [];
922   for (var i = 0; i < str.length; i++) {
923     sb[i] = goog.string.escapeChar(str.charAt(i));
924   }
925   return sb.join('');
926 };
927 
928 
929 /**
930  * Takes a character and returns the escaped string for that character. For
931  * example escapeChar(String.fromCharCode(15)) -> "\\x0E".
932  * @param {string} c The character to escape.
933  * @return {string} An escaped string representing {@code c}.
934  */
935 goog.string.escapeChar = function(c) {
936   if (c in goog.string.jsEscapeCache_) {
937     return goog.string.jsEscapeCache_[c];
938   }
939 
940   if (c in goog.string.specialEscapeChars_) {
941     return goog.string.jsEscapeCache_[c] = goog.string.specialEscapeChars_[c];
942   }
943 
944   var rv = c;
945   var cc = c.charCodeAt(0);
946   if (cc > 31 && cc < 127) {
947     rv = c;
948   } else {
949     // tab is 9 but handled above
950     if (cc < 256) {
951       rv = '\\x';
952       if (cc < 16 || cc > 256) {
953         rv += '0';
954       }
955     } else {
956       rv = '\\u';
957       if (cc < 4096) { // \u1000
958         rv += '0';
959       }
960     }
961     rv += cc.toString(16).toUpperCase();
962   }
963 
964   return goog.string.jsEscapeCache_[c] = rv;
965 };
966 
967 
968 /**
969  * Takes a string and creates a map (Object) in which the keys are the
970  * characters in the string. The value for the key is set to true. You can
971  * then use goog.object.map or goog.array.map to change the values.
972  * @param {string} s The string to build the map from.
973  * @return {!Object} The map of characters used.
974  */
975 // TODO(arv): It seems like we should have a generic goog.array.toMap. But do
976 //            we want a dependency on goog.array in goog.string?
977 goog.string.toMap = function(s) {
978   var rv = {};
979   for (var i = 0; i < s.length; i++) {
980     rv[s.charAt(i)] = true;
981   }
982   return rv;
983 };
984 
985 
986 /**
987  * Determines whether a string contains a substring.
988  * @param {string} str The string to search.
989  * @param {string} subString The substring to search for.
990  * @return {boolean} Whether {@code str} contains {@code subString}.
991  */
992 goog.string.contains = function(str, subString) {
993   return str.indexOf(subString) != -1;
994 };
995 
996 
997 /**
998  * Determines whether a string contains a substring, ignoring case.
999  * @param {string} str The string to search.
1000  * @param {string} subString The substring to search for.
1001  * @return {boolean} Whether {@code str} contains {@code subString}.
1002  */
1003 goog.string.caseInsensitiveContains = function(str, subString) {
1004   return goog.string.contains(str.toLowerCase(), subString.toLowerCase());
1005 };
1006 
1007 
1008 /**
1009  * Returns the non-overlapping occurrences of ss in s.
1010  * If either s or ss evalutes to false, then returns zero.
1011  * @param {string} s The string to look in.
1012  * @param {string} ss The string to look for.
1013  * @return {number} Number of occurrences of ss in s.
1014  */
1015 goog.string.countOf = function(s, ss) {
1016   return s && ss ? s.split(ss).length - 1 : 0;
1017 };
1018 
1019 
1020 /**
1021  * Removes a substring of a specified length at a specific
1022  * index in a string.
1023  * @param {string} s The base string from which to remove.
1024  * @param {number} index The index at which to remove the substring.
1025  * @param {number} stringLength The length of the substring to remove.
1026  * @return {string} A copy of {@code s} with the substring removed or the full
1027  *     string if nothing is removed or the input is invalid.
1028  */
1029 goog.string.removeAt = function(s, index, stringLength) {
1030   var resultStr = s;
1031   // If the index is greater or equal to 0 then remove substring
1032   if (index >= 0 && index < s.length && stringLength > 0) {
1033     resultStr = s.substr(0, index) +
1034         s.substr(index + stringLength, s.length - index - stringLength);
1035   }
1036   return resultStr;
1037 };
1038 
1039 
1040 /**
1041  *  Removes the first occurrence of a substring from a string.
1042  *  @param {string} s The base string from which to remove.
1043  *  @param {string} ss The string to remove.
1044  *  @return {string} A copy of {@code s} with {@code ss} removed or the full
1045  *      string if nothing is removed.
1046  */
1047 goog.string.remove = function(s, ss) {
1048   var re = new RegExp(goog.string.regExpEscape(ss), '');
1049   return s.replace(re, '');
1050 };
1051 
1052 
1053 /**
1054  *  Removes all occurrences of a substring from a string.
1055  *  @param {string} s The base string from which to remove.
1056  *  @param {string} ss The string to remove.
1057  *  @return {string} A copy of {@code s} with {@code ss} removed or the full
1058  *      string if nothing is removed.
1059  */
1060 goog.string.removeAll = function(s, ss) {
1061   var re = new RegExp(goog.string.regExpEscape(ss), 'g');
1062   return s.replace(re, '');
1063 };
1064 
1065 
1066 /**
1067  * Escapes characters in the string that are not safe to use in a RegExp.
1068  * @param {*} s The string to escape. If not a string, it will be casted
1069  *     to one.
1070  * @return {string} A RegExp safe, escaped copy of {@code s}.
1071  */
1072 goog.string.regExpEscape = function(s) {
1073   return String(s).replace(/([-()\[\]{}+?*.$\^|,:#<!\\])/g, '\\$1').
1074       replace(/\x08/g, '\\x08');
1075 };
1076 
1077 
1078 /**
1079  * Repeats a string n times.
1080  * @param {string} string The string to repeat.
1081  * @param {number} length The number of times to repeat.
1082  * @return {string} A string containing {@code length} repetitions of
1083  *     {@code string}.
1084  */
1085 goog.string.repeat = function(string, length) {
1086   return new Array(length + 1).join(string);
1087 };
1088 
1089 
1090 /**
1091  * Pads number to given length and optionally rounds it to a given precision.
1092  * For example:
1093  * <pre>padNumber(1.25, 2, 3) -> '01.250'
1094  * padNumber(1.25, 2) -> '01.25'
1095  * padNumber(1.25, 2, 1) -> '01.3'
1096  * padNumber(1.25, 0) -> '1.25'</pre>
1097  *
1098  * @param {number} num The number to pad.
1099  * @param {number} length The desired length.
1100  * @param {number=} opt_precision The desired precision.
1101  * @return {string} {@code num} as a string with the given options.
1102  */
1103 goog.string.padNumber = function(num, length, opt_precision) {
1104   var s = goog.isDef(opt_precision) ? num.toFixed(opt_precision) : String(num);
1105   var index = s.indexOf('.');
1106   if (index == -1) {
1107     index = s.length;
1108   }
1109   return goog.string.repeat('0', Math.max(0, length - index)) + s;
1110 };
1111 
1112 
1113 /**
1114  * Returns a string representation of the given object, with
1115  * null and undefined being returned as the empty string.
1116  *
1117  * @param {*} obj The object to convert.
1118  * @return {string} A string representation of the {@code obj}.
1119  */
1120 goog.string.makeSafe = function(obj) {
1121   return obj == null ? '' : String(obj);
1122 };
1123 
1124 
1125 /**
1126  * Concatenates string expressions. This is useful
1127  * since some browsers are very inefficient when it comes to using plus to
1128  * concat strings. Be careful when using null and undefined here since
1129  * these will not be included in the result. If you need to represent these
1130  * be sure to cast the argument to a String first.
1131  * For example:
1132  * <pre>buildString('a', 'b', 'c', 'd') -> 'abcd'
1133  * buildString(null, undefined) -> ''
1134  * </pre>
1135  * @param {...*} var_args A list of strings to concatenate. If not a string,
1136  *     it will be casted to one.
1137  * @return {string} The concatenation of {@code var_args}.
1138  */
1139 goog.string.buildString = function(var_args) {
1140   return Array.prototype.join.call(arguments, '');
1141 };
1142 
1143 
1144 /**
1145  * Returns a string with at least 64-bits of randomness.
1146  *
1147  * Doesn't trust Javascript's random function entirely. Uses a combination of
1148  * random and current timestamp, and then encodes the string in base-36 to
1149  * make it shorter.
1150  *
1151  * @return {string} A random string, e.g. sn1s7vb4gcic.
1152  */
1153 goog.string.getRandomString = function() {
1154   var x = 2147483648;
1155   return Math.floor(Math.random() * x).toString(36) +
1156          Math.abs(Math.floor(Math.random() * x) ^ goog.now()).toString(36);
1157 };
1158 
1159 
1160 /**
1161  * Compares two version numbers.
1162  *
1163  * @param {string|number} version1 Version of first item.
1164  * @param {string|number} version2 Version of second item.
1165  *
1166  * @return {number}  1 if {@code version1} is higher.
1167  *                   0 if arguments are equal.
1168  *                  -1 if {@code version2} is higher.
1169  */
1170 goog.string.compareVersions = function(version1, version2) {
1171   var order = 0;
1172   // Trim leading and trailing whitespace and split the versions into
1173   // subversions.
1174   var v1Subs = goog.string.trim(String(version1)).split('.');
1175   var v2Subs = goog.string.trim(String(version2)).split('.');
1176   var subCount = Math.max(v1Subs.length, v2Subs.length);
1177 
1178   // Iterate over the subversions, as long as they appear to be equivalent.
1179   for (var subIdx = 0; order == 0 && subIdx < subCount; subIdx++) {
1180     var v1Sub = v1Subs[subIdx] || '';
1181     var v2Sub = v2Subs[subIdx] || '';
1182 
1183     // Split the subversions into pairs of numbers and qualifiers (like 'b').
1184     // Two different RegExp objects are needed because they are both using
1185     // the 'g' flag.
1186     var v1CompParser = new RegExp('(\\d*)(\\D*)', 'g');
1187     var v2CompParser = new RegExp('(\\d*)(\\D*)', 'g');
1188     do {
1189       var v1Comp = v1CompParser.exec(v1Sub) || ['', '', ''];
1190       var v2Comp = v2CompParser.exec(v2Sub) || ['', '', ''];
1191       // Break if there are no more matches.
1192       if (v1Comp[0].length == 0 && v2Comp[0].length == 0) {
1193         break;
1194       }
1195 
1196       // Parse the numeric part of the subversion. A missing number is
1197       // equivalent to 0.
1198       var v1CompNum = v1Comp[1].length == 0 ? 0 : parseInt(v1Comp[1], 10);
1199       var v2CompNum = v2Comp[1].length == 0 ? 0 : parseInt(v2Comp[1], 10);
1200 
1201       // Compare the subversion components. The number has the highest
1202       // precedence. Next, if the numbers are equal, a subversion without any
1203       // qualifier is always higher than a subversion with any qualifier. Next,
1204       // the qualifiers are compared as strings.
1205       order = goog.string.compareElements_(v1CompNum, v2CompNum) ||
1206           goog.string.compareElements_(v1Comp[2].length == 0,
1207               v2Comp[2].length == 0) ||
1208           goog.string.compareElements_(v1Comp[2], v2Comp[2]);
1209       // Stop as soon as an inequality is discovered.
1210     } while (order == 0);
1211   }
1212 
1213   return order;
1214 };
1215 
1216 
1217 /**
1218  * Compares elements of a version number.
1219  *
1220  * @param {string|number|boolean} left An element from a version number.
1221  * @param {string|number|boolean} right An element from a version number.
1222  *
1223  * @return {number}  1 if {@code left} is higher.
1224  *                   0 if arguments are equal.
1225  *                  -1 if {@code right} is higher.
1226  * @private
1227  */
1228 goog.string.compareElements_ = function(left, right) {
1229   if (left < right) {
1230     return -1;
1231   } else if (left > right) {
1232     return 1;
1233   }
1234   return 0;
1235 };
1236 
1237 
1238 /**
1239  * Maximum value of #goog.string.hashCode, exclusive. 2^32.
1240  * @type {number}
1241  * @private
1242  */
1243 goog.string.HASHCODE_MAX_ = 0x100000000;
1244 
1245 
1246 /**
1247  * String hash function similar to java.lang.String.hashCode().
1248  * The hash code for a string is computed as
1249  * s[0] * 31 ^ (n - 1) + s[1] * 31 ^ (n - 2) + ... + s[n - 1],
1250  * where s[i] is the ith character of the string and n is the length of
1251  * the string. We mod the result to make it between 0 (inclusive) and 2^32
1252  * (exclusive).
1253  * @param {string} str A string.
1254  * @return {number} Hash value for {@code str}, between 0 (inclusive) and 2^32
1255  *  (exclusive). The empty string returns 0.
1256  */
1257 goog.string.hashCode = function(str) {
1258   var result = 0;
1259   for (var i = 0; i < str.length; ++i) {
1260     result = 31 * result + str.charCodeAt(i);
1261     // Normalize to 4 byte range, 0 ... 2^32.
1262     result %= goog.string.HASHCODE_MAX_;
1263   }
1264   return result;
1265 };
1266 
1267 
1268 /**
1269  * The most recent unique ID. |0 is equivalent to Math.floor in this case.
1270  * @type {number}
1271  * @private
1272  */
1273 goog.string.uniqueStringCounter_ = Math.random() * 0x80000000 | 0;
1274 
1275 
1276 /**
1277  * Generates and returns a string which is unique in the current document.
1278  * This is useful, for example, to create unique IDs for DOM elements.
1279  * @return {string} A unique id.
1280  */
1281 goog.string.createUniqueString = function() {
1282   return 'goog_' + goog.string.uniqueStringCounter_++;
1283 };
1284 
1285 
1286 /**
1287  * Converts the supplied string to a number, which may be Infinity or NaN.
1288  * This function strips whitespace: (toNumber(' 123') === 123)
1289  * This function accepts scientific notation: (toNumber('1e1') === 10)
1290  *
1291  * This is better than Javascript's built-in conversions because, sadly:
1292  *     (Number(' ') === 0) and (parseFloat('123a') === 123)
1293  *
1294  * @param {string} str The string to convert.
1295  * @return {number} The number the supplied string represents, or NaN.
1296  */
1297 goog.string.toNumber = function(str) {
1298   var num = Number(str);
1299   if (num == 0 && goog.string.isEmpty(str)) {
1300     return NaN;
1301   }
1302   return num;
1303 };
1304 
1305 
1306 /**
1307  * Returns whether the given string is lower camel case (e.g. "isFooBar").
1308  *
1309  * Note that this assumes the string is entirely letters.
1310  * @see http://en.wikipedia.org/wiki/CamelCase#Variations_and_synonyms
1311  *
1312  * @param {string} str String to test.
1313  * @return {boolean} Whether the string is lower camel case.
1314  */
1315 goog.string.isLowerCamelCase = function(str) {
1316   return /^[a-z]+([A-Z][a-z]*)*$/.test(str);
1317 };
1318 
1319 
1320 /**
1321  * Returns whether the given string is upper camel case (e.g. "FooBarBaz").
1322  *
1323  * Note that this assumes the string is entirely letters.
1324  * @see http://en.wikipedia.org/wiki/CamelCase#Variations_and_synonyms
1325  *
1326  * @param {string} str String to test.
1327  * @return {boolean} Whether the string is upper camel case.
1328  */
1329 goog.string.isUpperCamelCase = function(str) {
1330   return /^([A-Z][a-z]*)+$/.test(str);
1331 };
1332 
1333 
1334 /**
1335  * Converts a string from selector-case to camelCase (e.g. from
1336  * "multi-part-string" to "multiPartString"), useful for converting
1337  * CSS selectors and HTML dataset keys to their equivalent JS properties.
1338  * @param {string} str The string in selector-case form.
1339  * @return {string} The string in camelCase form.
1340  */
1341 goog.string.toCamelCase = function(str) {
1342   return String(str).replace(/\-([a-z])/g, function(all, match) {
1343     return match.toUpperCase();
1344   });
1345 };
1346 
1347 
1348 /**
1349  * Converts a string from camelCase to selector-case (e.g. from
1350  * "multiPartString" to "multi-part-string"), useful for converting JS
1351  * style and dataset properties to equivalent CSS selectors and HTML keys.
1352  * @param {string} str The string in camelCase form.
1353  * @return {string} The string in selector-case form.
1354  */
1355 goog.string.toSelectorCase = function(str) {
1356   return String(str).replace(/([A-Z])/g, '-$1').toLowerCase();
1357 };
1358 
1359 
1360 /**
1361  * Converts a string into TitleCase. First character of the string is always
1362  * capitalized in addition to the first letter of every subsequent word.
1363  * Words are delimited by one or more whitespaces by default. Custom delimiters
1364  * can optionally be specified to replace the default, which doesn't preserve
1365  * whitespace delimiters and instead must be explicitly included if needed.
1366  *
1367  * Default delimiter => " ":
1368  *    goog.string.toTitleCase('oneTwoThree')    => 'OneTwoThree'
1369  *    goog.string.toTitleCase('one two three')  => 'One Two Three'
1370  *    goog.string.toTitleCase('  one   two   ') => '  One   Two   '
1371  *    goog.string.toTitleCase('one_two_three')  => 'One_two_three'
1372  *    goog.string.toTitleCase('one-two-three')  => 'One-two-three'
1373  *
1374  * Custom delimiter => "_-.":
1375  *    goog.string.toTitleCase('oneTwoThree', '_-.')       => 'OneTwoThree'
1376  *    goog.string.toTitleCase('one two three', '_-.')     => 'One two three'
1377  *    goog.string.toTitleCase('  one   two   ', '_-.')    => '  one   two   '
1378  *    goog.string.toTitleCase('one_two_three', '_-.')     => 'One_Two_Three'
1379  *    goog.string.toTitleCase('one-two-three', '_-.')     => 'One-Two-Three'
1380  *    goog.string.toTitleCase('one...two...three', '_-.') => 'One...Two...Three'
1381  *    goog.string.toTitleCase('one. two. three', '_-.')   => 'One. two. three'
1382  *    goog.string.toTitleCase('one-two.three', '_-.')     => 'One-Two.Three'
1383  *
1384  * @param {string} str String value in camelCase form.
1385  * @param {string=} opt_delimiters Custom delimiter character set used to
1386  *      distinguish words in the string value. Each character represents a
1387  *      single delimiter. When provided, default whitespace delimiter is
1388  *      overridden and must be explicitly included if needed.
1389  * @return {string} String value in TitleCase form.
1390  */
1391 goog.string.toTitleCase = function(str, opt_delimiters) {
1392   var delimiters = goog.isString(opt_delimiters) ?
1393       goog.string.regExpEscape(opt_delimiters) : '\\s';
1394 
1395   // For IE8, we need to prevent using an empty character set. Otherwise,
1396   // incorrect matching will occur.
1397   delimiters = delimiters ? '|[' + delimiters + ']+' : '';
1398 
1399   var regexp = new RegExp('(^' + delimiters + ')([a-z])', 'g');
1400   return str.replace(regexp, function(all, p1, p2) {
1401     return p1 + p2.toUpperCase();
1402   });
1403 };
1404 
1405 
1406 /**
1407  * Parse a string in decimal or hexidecimal ('0xFFFF') form.
1408  *
1409  * To parse a particular radix, please use parseInt(string, radix) directly. See
1410  * https://developer.mozilla.org/en/JavaScript/Reference/Global_Objects/parseInt
1411  *
1412  * This is a wrapper for the built-in parseInt function that will only parse
1413  * numbers as base 10 or base 16.  Some JS implementations assume strings
1414  * starting with "0" are intended to be octal. ES3 allowed but discouraged
1415  * this behavior. ES5 forbids it.  This function emulates the ES5 behavior.
1416  *
1417  * For more information, see Mozilla JS Reference: http://goo.gl/8RiFj
1418  *
1419  * @param {string|number|null|undefined} value The value to be parsed.
1420  * @return {number} The number, parsed. If the string failed to parse, this
1421  *     will be NaN.
1422  */
1423 goog.string.parseInt = function(value) {
1424   // Force finite numbers to strings.
1425   if (isFinite(value)) {
1426     value = String(value);
1427   }
1428 
1429   if (goog.isString(value)) {
1430     // If the string starts with '0x' or '-0x', parse as hex.
1431     return /^\s*-?0x/i.test(value) ?
1432         parseInt(value, 16) : parseInt(value, 10);
1433   }
1434 
1435   return NaN;
1436 };
1437 
1438 
1439 /**
1440  * Splits a string on a separator a limited number of times.
1441  *
1442  * This implementation is more similar to Python or Java, where the limit
1443  * parameter specifies the maximum number of splits rather than truncating
1444  * the number of results.
1445  *
1446  * See http://docs.python.org/2/library/stdtypes.html#str.split
1447  * See JavaDoc: http://goo.gl/F2AsY
1448  * See Mozilla reference: http://goo.gl/dZdZs
1449  *
1450  * @param {string} str String to split.
1451  * @param {string} separator The separator.
1452  * @param {number} limit The limit to the number of splits. The resulting array
1453  *     will have a maximum length of limit+1.  Negative numbers are the same
1454  *     as zero.
1455  * @return {!Array.<string>} The string, split.
1456  */
1457 
1458 goog.string.splitLimit = function(str, separator, limit) {
1459   var parts = str.split(separator);
1460   var returnVal = [];
1461 
1462   // Only continue doing this while we haven't hit the limit and we have
1463   // parts left.
1464   while (limit > 0 && parts.length) {
1465     returnVal.push(parts.shift());
1466     limit--;
1467   }
1468 
1469   // If there are remaining parts, append them to the end.
1470   if (parts.length) {
1471     returnVal.push(parts.join(separator));
1472   }
1473 
1474   return returnVal;
1475 };
1476