zcommon/src/main/java/org/zkoss/lang/JavaScriptEscape.java
/*
* =============================================================================
*
* Copyright (c) 2014, The UNBESCAPE team (http://www.unbescape.org)
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
* =============================================================================
*/
package org.zkoss.lang;
import java.io.IOException;
import java.io.Writer;
/**
* <p>
* Utility class for performing JavaScript escape/unescape operations.
* </p>
*
* <strong><u>Configuration of escape/unescape operations</u></strong>
*
* <p>
* <strong>Escape</strong> operations can be (optionally) configured by means of:
* </p>
* <ul>
* <li><em>Level</em>, which defines how deep the escape operation must be (what
* chars are to be considered eligible for escaping, depending on the specific
* needs of the scenario). Its values are defined by the {@link org.unbescape.javascript.JavaScriptEscapeLevel}
* enum.</li>
* <li><em>Type</em>, which defines whether escaping should be performed by means of SECs
* (Single Escape Characters like <tt>\n</tt>) or additionally by means of x-based or u-based
* hexadecimal escapes (<tt>\xE1</tt> or <tt>\u00E1</tt>).
* Its values are defined by the {@link org.unbescape.javascript.JavaScriptEscapeType} enum.</li>
* </ul>
* <p>
* <strong>Unescape</strong> operations need no configuration parameters. Unescape operations
* will always perform <em>complete</em> unescape of SECs (<tt>\n</tt>), x-based (<tt>\xE1</tt>)
* and u-based (<tt>\u00E1</tt>) hexadecimal escapes, and even octal escapes (<tt>\057</tt>, which
* are deprecated since ECMAScript v5 and therefore not used for escaping).
* </p>
*
* <strong><u>Features</u></strong>
*
* <p>
* Specific features of the JavaScript escape/unescape operations performed by means of this class:
* </p>
* <ul>
* <li>The JavaScript basic escape set is supported. This <em>basic set</em> consists of:
* <ul>
* <li>The <em>Single Escape Characters</em>:
* <tt>\0</tt> (<tt>U+0000</tt>),
* <tt>\b</tt> (<tt>U+0008</tt>),
* <tt>\t</tt> (<tt>U+0009</tt>),
* <tt>\n</tt> (<tt>U+000A</tt>),
* <tt>\v</tt> (<tt>U+000B</tt>),
* <tt>\f</tt> (<tt>U+000C</tt>),
* <tt>\r</tt> (<tt>U+000D</tt>),
* <tt>\"</tt> (<tt>U+0022</tt>),
* <tt>\'</tt> (<tt>U+0027</tt>),
* <tt>\\</tt> (<tt>U+005C</tt>) and
* <tt>\/</tt> (<tt>U+002F</tt>).
* Note that <tt>\/</tt> is optional, and will only be used when the <tt>/</tt>
* symbol appears after <tt><</tt>, as in <tt></</tt>. This is to avoid accidentally
* closing <tt><script></tt> tags in HTML. Also, note that <tt>\v</tt>
* (<tt>U+000B</tt>) is actually included as a Single Escape
* Character in the JavaScript (ECMAScript) specification, but will not be used as it
* is not supported by Microsoft Internet Explorer versions < 9.
* </li>
* <li>
* Two ranges of non-displayable, control characters (some of which are already part of the
* <em>single escape characters</em> list): <tt>U+0001</tt> to <tt>U+001F</tt> and
* <tt>U+007F</tt> to <tt>U+009F</tt>.
* </li>
* </ul>
* </li>
* <li>X-based hexadecimal escapes (a.k.a. <em>hexadecimal escapes</em>) are supported both in escape
* and unescape operations: <tt>\xE1</tt>.</li>
* <li>U-based hexadecimal escapes (a.k.a. <em>unicode escapes</em>) are supported both in escape
* and unescape operations: <tt>\u00E1</tt>.</li>
* <li>Octal escapes are supported, though only in unescape operations: <tt>\071</tt>. These are not supported
* in escape operations because octal escapes were deprecated in version 5 of the ECMAScript
* specification.</li>
* <li>Support for the whole Unicode character set: <tt>\u0000</tt> to <tt>\u10FFFF</tt>, including
* characters not representable by only one <tt>char</tt> in Java (<tt>>\uFFFF</tt>).</li>
* </ul>
*
* <strong><u>Input/Output</u></strong>
*
* <p>
* There are two different input/output modes that can be used in escape/unescape operations:
* </p>
* <ul>
* <li><em><tt>String</tt> input, <tt>String</tt> output</em>: Input is specified as a <tt>String</tt> object
* and output is returned as another. In order to improve memory performance, all escape and unescape
* operations <u>will return the exact same input object as output if no escape/unescape modifications
* are required</u>.</li>
* <li><em><tt>char[]</tt> input, <tt>java.io.Writer</tt> output</em>: Input will be read from a char array
* (<tt>char[]</tt>) and output will be written into the specified <tt>java.io.Writer</tt>.
* Two <tt>int</tt> arguments called <tt>offset</tt> and <tt>len</tt> will be
* used for specifying the part of the <tt>char[]</tt> that should be escaped/unescaped. These methods
* should be called with <tt>offset = 0</tt> and <tt>len = text.length</tt> in order to process
* the whole <tt>char[]</tt>.</li>
* </ul>
*
* <strong><u>Glossary</u></strong>
*
* <dl>
* <dt>SEC</dt>
* <dd>Single Escape Character:
* <tt>\0</tt> (<tt>U+0000</tt>),
* <tt>\b</tt> (<tt>U+0008</tt>),
* <tt>\t</tt> (<tt>U+0009</tt>),
* <tt>\n</tt> (<tt>U+000A</tt>),
* <tt>\v</tt> (<tt>U+000B</tt>),
* <tt>\f</tt> (<tt>U+000C</tt>),
* <tt>\r</tt> (<tt>U+000D</tt>),
* <tt>\"</tt> (<tt>U+0022</tt>),
* <tt>\'</tt> (<tt>U+0027</tt>),
* <tt>\\</tt> (<tt>U+005C</tt>) and
* <tt>\/</tt> (<tt>U+002F</tt>) (optional, only in <tt></</tt>).
* </dd>
* <dt>XHEXA escapes</dt>
* <dd>Also called <em>x-based hexadecimal escapes</em> or simply <em>hexadecimal escapes</em>:
* compact representation of unicode codepoints up to <tt>U+00FF</tt>, with <tt>\x</tt>
* followed by exactly two hexadecimal figures: <tt>\xE1</tt>. XHEXA is many times used
* instead of UHEXA (when possible) in order to obtain shorter escaped strings.</dd>
* <dt>UHEXA escapes</dt>
* <dd>Also called <em>u-based hexadecimal escapes</em> or simply <em>unicode escapes</em>:
* complete representation of unicode codepoints up to <tt>U+FFFF</tt>, with <tt>\u</tt>
* followed by exactly four hexadecimal figures: <tt>\u00E1</tt>. Unicode codepoints >
* <tt>U+FFFF</tt> can be represented in JavaScript by mean of two UHEXA escapes (a
* <em>surrogate pair</em>).</dd>
* <dt>Octal escapes</dt>
* <dd>Octal representation of unicode codepoints up to <tt>U+00FF</tt>, with <tt>\</tt>
* followed by up to three octal figures: <tt>\071</tt>. Though up to three octal figures
* are allowed, octal numbers > <tt>377</tt> (<tt>0xFF</tt>) are not supported. Note
* <u>octal escapes have been deprecated as of version 5 of the ECMAScript specification</u>.</dd>
* <dt>Unicode Codepoint</dt>
* <dd>Each of the <tt>int</tt> values conforming the Unicode code space.
* Normally corresponding to a Java <tt>char</tt> primitive value (codepoint <= <tt>\uFFFF</tt>),
* but might be two <tt>char</tt>s for codepoints <tt>\u10000</tt> to <tt>\u10FFFF</tt> if the
* first <tt>char</tt> is a high surrogate (<tt>\uD800</tt> to <tt>\uDBFF</tt>) and the
* second is a low surrogate (<tt>\uDC00</tt> to <tt>\uDFFF</tt>).</dd>
* </dl>
*
* <strong><u>References</u></strong>
*
* <p>
* The following references apply:
* </p>
* <ul>
* <li><a href="http://www.ecmascript.org/docs.php" target="_blank">The ECMAScript Specification</a>
* [ecmascript.org]</li>
* <li><a href="http://mathiasbynens.be/notes/javascript-escapes" target="_blank">JavaScript
* character escape sequences</a> [mathiasbynens.be]</li>
* </ul>
*
*
* @author Daniel Fernández
*
* @since 1.0.0
*
*/
/**package*/ final class JavaScriptEscape {
/**
* <p>
* Perform a JavaScript level 1 (only basic set) <strong>escape</strong> operation
* on a <tt>String</tt> input.
* </p>
* <p>
* <em>Level 1</em> means this method will only escape the JavaScript basic escape set:
* </p>
* <ul>
* <li>The <em>Single Escape Characters</em>:
* <tt>\0</tt> (<tt>U+0000</tt>),
* <tt>\b</tt> (<tt>U+0008</tt>),
* <tt>\t</tt> (<tt>U+0009</tt>),
* <tt>\n</tt> (<tt>U+000A</tt>),
* <tt>\v</tt> (<tt>U+000B</tt>),
* <tt>\f</tt> (<tt>U+000C</tt>),
* <tt>\r</tt> (<tt>U+000D</tt>),
* <tt>\"</tt> (<tt>U+0022</tt>),
* <tt>\'</tt> (<tt>U+0027</tt>),
* <tt>\\</tt> (<tt>U+005C</tt>) and
* <tt>\/</tt> (<tt>U+002F</tt>).
* Note that <tt>\/</tt> is optional, and will only be used when the <tt>/</tt>
* symbol appears after <tt><</tt>, as in <tt></</tt>. This is to avoid accidentally
* closing <tt><script></tt> tags in HTML. Also, note that <tt>\v</tt>
* (<tt>U+000B</tt>) is actually included as a Single Escape
* Character in the JavaScript (ECMAScript) specification, but will not be used as it
* is not supported by Microsoft Internet Explorer versions < 9.
* </li>
* <li>
* Two ranges of non-displayable, control characters (some of which are already part of the
* <em>single escape characters</em> list): <tt>U+0001</tt> to <tt>U+001F</tt> and
* <tt>U+007F</tt> to <tt>U+009F</tt>.
* </li>
* </ul>
* <p>
* This method calls {@link #escapeJavaScript(String, JavaScriptEscapeType, JavaScriptEscapeLevel)}
* with the following preconfigured values:
* </p>
* <ul>
* <li><tt>type</tt>:
* {@link JavaScriptEscapeType#SINGLE_ESCAPE_CHARS_DEFAULT_TO_XHEXA_AND_UHEXA}</li>
* <li><tt>level</tt>:
* {@link JavaScriptEscapeLevel#LEVEL_1_BASIC_ESCAPE_SET}</li>
* </ul>
* <p>
* This method is <strong>thread-safe</strong>.
* </p>
*
* @param text the <tt>String</tt> to be escaped.
* @return The escaped result <tt>String</tt>. As a memory-performance improvement, will return the exact
* same object as the <tt>text</tt> input argument if no escaping modifications were required (and
* no additional <tt>String</tt> objects will be created during processing). Will
* return <tt>null</tt> if <tt>text</tt> is <tt>null</tt>.
*/
public static String escapeJavaScriptMinimal(final String text) {
return escapeJavaScript(text,
JavaScriptEscapeType.SINGLE_ESCAPE_CHARS_DEFAULT_TO_XHEXA_AND_UHEXA,
JavaScriptEscapeLevel.LEVEL_1_BASIC_ESCAPE_SET);
}
/**
* <p>
* Perform a JavaScript level 2 (basic set and all non-ASCII chars) <strong>escape</strong> operation
* on a <tt>String</tt> input.
* </p>
* <p>
* <em>Level 2</em> means this method will escape:
* </p>
* <ul>
* <li>The JavaScript basic escape set:
* <ul>
* <li>The <em>Single Escape Characters</em>:
* <tt>\0</tt> (<tt>U+0000</tt>),
* <tt>\b</tt> (<tt>U+0008</tt>),
* <tt>\t</tt> (<tt>U+0009</tt>),
* <tt>\n</tt> (<tt>U+000A</tt>),
* <tt>\v</tt> (<tt>U+000B</tt>),
* <tt>\f</tt> (<tt>U+000C</tt>),
* <tt>\r</tt> (<tt>U+000D</tt>),
* <tt>\"</tt> (<tt>U+0022</tt>),
* <tt>\'</tt> (<tt>U+0027</tt>),
* <tt>\\</tt> (<tt>U+005C</tt>) and
* <tt>\/</tt> (<tt>U+002F</tt>).
* Note that <tt>\/</tt> is optional, and will only be used when the <tt>/</tt>
* symbol appears after <tt><</tt>, as in <tt></</tt>. This is to avoid accidentally
* closing <tt><script></tt> tags in HTML. Also, note that <tt>\v</tt>
* (<tt>U+000B</tt>) is actually included as a Single Escape
* Character in the JavaScript (ECMAScript) specification, but will not be used as it
* is not supported by Microsoft Internet Explorer versions < 9.
* </li>
* <li>
* Two ranges of non-displayable, control characters (some of which are already part of the
* <em>single escape characters</em> list): <tt>U+0001</tt> to <tt>U+001F</tt> and
* <tt>U+007F</tt> to <tt>U+009F</tt>.
* </li>
* </ul>
* </li>
* <li>All non ASCII characters.</li>
* </ul>
* <p>
* This escape will be performed by using the Single Escape Chars whenever possible. For escaped
* characters that do not have an associated SEC, default to using <tt>\xFF</tt> Hexadecimal Escapes
* if possible (characters <= <tt>U+00FF</tt>), then default to <tt>\uFFFF</tt>
* Hexadecimal Escapes. This type of escape <u>produces the smallest escaped string possible</u>.
* </p>
* <p>
* This method calls {@link #escapeJavaScript(String, JavaScriptEscapeType, JavaScriptEscapeLevel)}
* with the following preconfigured values:
* </p>
* <ul>
* <li><tt>type</tt>:
* {@link JavaScriptEscapeType#SINGLE_ESCAPE_CHARS_DEFAULT_TO_XHEXA_AND_UHEXA}</li>
* <li><tt>level</tt>:
* {@link JavaScriptEscapeLevel#LEVEL_2_ALL_NON_ASCII_PLUS_BASIC_ESCAPE_SET}</li>
* </ul>
* <p>
* This method is <strong>thread-safe</strong>.
* </p>
*
* @param text the <tt>String</tt> to be escaped.
* @return The escaped result <tt>String</tt>. As a memory-performance improvement, will return the exact
* same object as the <tt>text</tt> input argument if no escaping modifications were required (and
* no additional <tt>String</tt> objects will be created during processing). Will
* return <tt>null</tt> if <tt>text</tt> is <tt>null</tt>.
*/
public static String escapeJavaScript(final String text) {
return escapeJavaScript(text,
JavaScriptEscapeType.SINGLE_ESCAPE_CHARS_DEFAULT_TO_XHEXA_AND_UHEXA,
JavaScriptEscapeLevel.LEVEL_2_ALL_NON_ASCII_PLUS_BASIC_ESCAPE_SET);
}
/**
* <p>
* Perform a (configurable) JavaScript <strong>escape</strong> operation on a <tt>String</tt> input.
* </p>
* <p>
* This method will perform an escape operation according to the specified
* {@link JavaScriptEscapeType} and
* {@link JavaScriptEscapeLevel} argument values.
* </p>
* <p>
* All other <tt>String</tt>-based <tt>escapeJavaScript*(...)</tt> methods call this one with preconfigured
* <tt>type</tt> and <tt>level</tt> values.
* </p>
* <p>
* This method is <strong>thread-safe</strong>.
* </p>
*
* @param text the <tt>String</tt> to be escaped.
* @param type the type of escape operation to be performed, see
* {@link JavaScriptEscapeType}.
* @param level the escape level to be applied, see {@link JavaScriptEscapeLevel}.
* @return The escaped result <tt>String</tt>. As a memory-performance improvement, will return the exact
* same object as the <tt>text</tt> input argument if no escaping modifications were required (and
* no additional <tt>String</tt> objects will be created during processing). Will
* return <tt>null</tt> if <tt>text</tt> is <tt>null</tt>.
*/
public static String escapeJavaScript(final String text,
final JavaScriptEscapeType type, final JavaScriptEscapeLevel level) {
if (type == null) {
throw new IllegalArgumentException("The 'type' argument cannot be null");
}
if (level == null) {
throw new IllegalArgumentException("The 'level' argument cannot be null");
}
return JavaScriptEscapeUtil.escape(text, type, level);
}
/**
* <p>
* Perform a JavaScript level 1 (only basic set) <strong>escape</strong> operation
* on a <tt>char[]</tt> input.
* </p>
* <p>
* <em>Level 1</em> means this method will only escape the JavaScript basic escape set:
* </p>
* <ul>
* <li>The <em>Single Escape Characters</em>:
* <tt>\0</tt> (<tt>U+0000</tt>),
* <tt>\b</tt> (<tt>U+0008</tt>),
* <tt>\t</tt> (<tt>U+0009</tt>),
* <tt>\n</tt> (<tt>U+000A</tt>),
* <tt>\v</tt> (<tt>U+000B</tt>),
* <tt>\f</tt> (<tt>U+000C</tt>),
* <tt>\r</tt> (<tt>U+000D</tt>),
* <tt>\"</tt> (<tt>U+0022</tt>),
* <tt>\'</tt> (<tt>U+0027</tt>),
* <tt>\\</tt> (<tt>U+005C</tt>) and
* <tt>\/</tt> (<tt>U+002F</tt>).
* Note that <tt>\/</tt> is optional, and will only be used when the <tt>/</tt>
* symbol appears after <tt><</tt>, as in <tt></</tt>. This is to avoid accidentally
* closing <tt><script></tt> tags in HTML. Also, note that <tt>\v</tt>
* (<tt>U+000B</tt>) is actually included as a Single Escape
* Character in the JavaScript (ECMAScript) specification, but will not be used as it
* is not supported by Microsoft Internet Explorer versions < 9.
* </li>
* <li>
* Two ranges of non-displayable, control characters (some of which are already part of the
* <em>single escape characters</em> list): <tt>U+0001</tt> to <tt>U+001F</tt> and
* <tt>U+007F</tt> to <tt>U+009F</tt>.
* </li>
* </ul>
* <p>
* This method calls
* {@link #escapeJavaScript(char[], int, int, Writer, JavaScriptEscapeType, JavaScriptEscapeLevel)}
* with the following preconfigured values:
* </p>
* <ul>
* <li><tt>type</tt>:
* {@link JavaScriptEscapeType#SINGLE_ESCAPE_CHARS_DEFAULT_TO_XHEXA_AND_UHEXA}</li>
* <li><tt>level</tt>:
* {@link JavaScriptEscapeLevel#LEVEL_1_BASIC_ESCAPE_SET}</li>
* </ul>
* <p>
* This method is <strong>thread-safe</strong>.
* </p>
*
* @param text the <tt>char[]</tt> to be escaped.
* @param offset the position in <tt>text</tt> at which the escape operation should start.
* @param len the number of characters in <tt>text</tt> that should be escaped.
* @param writer the <tt>java.io.Writer</tt> to which the escaped result will be written. Nothing will
* be written at all to this writer if <tt>text</tt> is <tt>null</tt>.
* @throws IOException if an input/output exception occurs
*/
public static void escapeJavaScriptMinimal(final char[] text, final int offset, final int len, final Writer writer)
throws IOException {
escapeJavaScript(text, offset, len, writer,
JavaScriptEscapeType.SINGLE_ESCAPE_CHARS_DEFAULT_TO_XHEXA_AND_UHEXA,
JavaScriptEscapeLevel.LEVEL_1_BASIC_ESCAPE_SET);
}
/**
* <p>
* Perform a JavaScript level 2 (basic set and all non-ASCII chars) <strong>escape</strong> operation
* on a <tt>char[]</tt> input.
* </p>
* <p>
* <em>Level 2</em> means this method will escape:
* </p>
* <ul>
* <li>The JavaScript basic escape set:
* <ul>
* <li>The <em>Single Escape Characters</em>:
* <tt>\0</tt> (<tt>U+0000</tt>),
* <tt>\b</tt> (<tt>U+0008</tt>),
* <tt>\t</tt> (<tt>U+0009</tt>),
* <tt>\n</tt> (<tt>U+000A</tt>),
* <tt>\v</tt> (<tt>U+000B</tt>),
* <tt>\f</tt> (<tt>U+000C</tt>),
* <tt>\r</tt> (<tt>U+000D</tt>),
* <tt>\"</tt> (<tt>U+0022</tt>),
* <tt>\'</tt> (<tt>U+0027</tt>),
* <tt>\\</tt> (<tt>U+005C</tt>) and
* <tt>\/</tt> (<tt>U+002F</tt>).
* Note that <tt>\/</tt> is optional, and will only be used when the <tt>/</tt>
* symbol appears after <tt><</tt>, as in <tt></</tt>. This is to avoid accidentally
* closing <tt><script></tt> tags in HTML. Also, note that <tt>\v</tt>
* (<tt>U+000B</tt>) is actually included as a Single Escape
* Character in the JavaScript (ECMAScript) specification, but will not be used as it
* is not supported by Microsoft Internet Explorer versions < 9.
* </li>
* <li>
* Two ranges of non-displayable, control characters (some of which are already part of the
* <em>single escape characters</em> list): <tt>U+0001</tt> to <tt>U+001F</tt> and
* <tt>U+007F</tt> to <tt>U+009F</tt>.
* </li>
* </ul>
* </li>
* <li>All non ASCII characters.</li>
* </ul>
* <p>
* This escape will be performed by using the Single Escape Chars whenever possible. For escaped
* characters that do not have an associated SEC, default to using <tt>\xFF</tt> Hexadecimal Escapes
* if possible (characters <= <tt>U+00FF</tt>), then default to <tt>\uFFFF</tt>
* Hexadecimal Escapes. This type of escape <u>produces the smallest escaped string possible</u>.
* </p>
* <p>
* This method calls
* {@link #escapeJavaScript(char[], int, int, Writer, JavaScriptEscapeType, JavaScriptEscapeLevel)}
* with the following preconfigured values:
* </p>
* <ul>
* <li><tt>type</tt>:
* {@link JavaScriptEscapeType#SINGLE_ESCAPE_CHARS_DEFAULT_TO_XHEXA_AND_UHEXA}</li>
* <li><tt>level</tt>:
* {@link JavaScriptEscapeLevel#LEVEL_2_ALL_NON_ASCII_PLUS_BASIC_ESCAPE_SET}</li>
* </ul>
* <p>
* This method is <strong>thread-safe</strong>.
* </p>
*
* @param text the <tt>char[]</tt> to be escaped.
* @param offset the position in <tt>text</tt> at which the escape operation should start.
* @param len the number of characters in <tt>text</tt> that should be escaped.
* @param writer the <tt>java.io.Writer</tt> to which the escaped result will be written. Nothing will
* be written at all to this writer if <tt>text</tt> is <tt>null</tt>.
* @throws IOException if an input/output exception occurs
*/
public static void escapeJavaScript(final char[] text, final int offset, final int len, final Writer writer)
throws IOException {
escapeJavaScript(text, offset, len, writer,
JavaScriptEscapeType.SINGLE_ESCAPE_CHARS_DEFAULT_TO_XHEXA_AND_UHEXA,
JavaScriptEscapeLevel.LEVEL_2_ALL_NON_ASCII_PLUS_BASIC_ESCAPE_SET);
}
/**
* <p>
* Perform a (configurable) JavaScript <strong>escape</strong> operation on a <tt>char[]</tt> input.
* </p>
* <p>
* This method will perform an escape operation according to the specified
* {@link JavaScriptEscapeType} and
* {@link JavaScriptEscapeLevel} argument values.
* </p>
* <p>
* All other <tt>char[]</tt>-based <tt>escapeJavaScript*(...)</tt> methods call this one with preconfigured
* <tt>type</tt> and <tt>level</tt> values.
* </p>
* <p>
* This method is <strong>thread-safe</strong>.
* </p>
*
* @param text the <tt>char[]</tt> to be escaped.
* @param offset the position in <tt>text</tt> at which the escape operation should start.
* @param len the number of characters in <tt>text</tt> that should be escaped.
* @param writer the <tt>java.io.Writer</tt> to which the escaped result will be written. Nothing will
* be written at all to this writer if <tt>text</tt> is <tt>null</tt>.
* @param type the type of escape operation to be performed, see
* {@link JavaScriptEscapeType}.
* @param level the escape level to be applied, see {@link JavaScriptEscapeLevel}.
* @throws IOException if an input/output exception occurs
*/
public static void escapeJavaScript(final char[] text, final int offset, final int len, final Writer writer,
final JavaScriptEscapeType type, final JavaScriptEscapeLevel level)
throws IOException {
if (writer == null) {
throw new IllegalArgumentException("Argument 'writer' cannot be null");
}
if (type == null) {
throw new IllegalArgumentException("The 'type' argument cannot be null");
}
if (level == null) {
throw new IllegalArgumentException("The 'level' argument cannot be null");
}
final int textLen = (text == null? 0 : text.length);
if (offset < 0 || offset > textLen) {
throw new IllegalArgumentException(
"Invalid (offset, len). offset=" + offset + ", len=" + len + ", text.length=" + textLen);
}
if (len < 0 || (offset + len) > textLen) {
throw new IllegalArgumentException(
"Invalid (offset, len). offset=" + offset + ", len=" + len + ", text.length=" + textLen);
}
JavaScriptEscapeUtil.escape(text, offset, len, writer, type, level);
}
/**
* <p>
* Perform a JavaScript <strong>unescape</strong> operation on a <tt>String</tt> input.
* </p>
* <p>
* No additional configuration arguments are required. Unescape operations
* will always perform <em>complete</em> JavaScript unescape of SECs, x-based, u-based
* and octal escapes.
* </p>
* <p>
* This method is <strong>thread-safe</strong>.
* </p>
*
* @param text the <tt>String</tt> to be unescaped.
* @return The unescaped result <tt>String</tt>. As a memory-performance improvement, will return the exact
* same object as the <tt>text</tt> input argument if no unescaping modifications were required (and
* no additional <tt>String</tt> objects will be created during processing). Will
* return <tt>null</tt> if <tt>text</tt> is <tt>null</tt>.
*/
public static String unescapeJavaScript(final String text) {
return JavaScriptEscapeUtil.unescape(text);
}
/**
* <p>
* Perform a JavaScript <strong>unescape</strong> operation on a <tt>char[]</tt> input.
* </p>
* <p>
* No additional configuration arguments are required. Unescape operations
* will always perform <em>complete</em> JavaScript unescape of SECs, x-based, u-based
* and octal escapes.
* </p>
* <p>
* This method is <strong>thread-safe</strong>.
* </p>
*
* @param text the <tt>char[]</tt> to be unescaped.
* @param offset the position in <tt>text</tt> at which the unescape operation should start.
* @param len the number of characters in <tt>text</tt> that should be unescaped.
* @param writer the <tt>java.io.Writer</tt> to which the unescaped result will be written. Nothing will
* be written at all to this writer if <tt>text</tt> is <tt>null</tt>.
* @throws IOException if an input/output exception occurs
*/
public static void unescapeJavaScript(final char[] text, final int offset, final int len, final Writer writer)
throws IOException{
if (writer == null) {
throw new IllegalArgumentException("Argument 'writer' cannot be null");
}
final int textLen = (text == null? 0 : text.length);
if (offset < 0 || offset > textLen) {
throw new IllegalArgumentException(
"Invalid (offset, len). offset=" + offset + ", len=" + len + ", text.length=" + textLen);
}
if (len < 0 || (offset + len) > textLen) {
throw new IllegalArgumentException(
"Invalid (offset, len). offset=" + offset + ", len=" + len + ", text.length=" + textLen);
}
JavaScriptEscapeUtil.unescape(text, offset, len, writer);
}
private JavaScriptEscape() {
super();
}
}