// Apple

package com.tos;

import java.io.UnsupportedEncodingException;

import java.net.URLEncoder;

import java.net.URLDecoder;

import java.text.StringCharacterIterator;

/**
 * Convenience methods for altering special characters related to URLs,
 * regular expressions, and HTML tags.
 *
 * <p>All methods are static and keep no state between calls.
 */
public final class EscapeCharacters {

    /**
     * Characters that {@link #forRegex(String)} prefixes with a backslash.
     * The leading {@code \\} in the Java literal is a single backslash character.
     */
    private static final String REGEX_SPECIAL_CHARACTERS = ".\\?*+&:{}[]()^$";

    /**
     * Synonym for {@code URLEncoder.encode(String, "UTF-8")}.
     *
     * <p>Used to ensure that HTTP query strings are in proper form, by escaping
     * special characters such as spaces.
     *
     * <p>An example use case for this method is a login scheme in which, after
     * successful login, the user is redirected to the "original" target
     * destination. Such a target might be passed around as a request parameter.
     * Such a request parameter will have a URL as its value, as in
     * {@code LoginTarget=Blah.jsp?this=that&blah=boo}, and would need to be
     * URL-encoded in order to escape its special characters.
     *
     * <p>It is important to note that if a query string appears in an
     * {@code HREF} attribute, then there are two issues: ensuring the query
     * string is valid HTTP (it is URL-encoded), and ensuring it is valid HTML
     * (ensuring the ampersand is escaped, see {@link #forHTMLTag(String)}).
     *
     * @param aURLFragment the text to encode
     * @return the URL-encoded form of {@code aURLFragment}
     * @throws RuntimeException if the platform reports that UTF-8 is unsupported
     */
    public static String forURL(String aURLFragment) {
        try {
            return URLEncoder.encode(aURLFragment, "UTF-8");
        } catch (UnsupportedEncodingException ex) {
            // Rethrown unchecked so callers do not have to handle a checked exception.
            throw new RuntimeException("UTF-8 not supported", ex);
        }
    }

    /**
     * Synonym for {@code URLDecoder.decode(String, "UTF-8")}; the inverse of
     * {@link #forURL(String)}.
     *
     * @param aURLFragment the URL-encoded text to decode
     * @return the decoded form of {@code aURLFragment}
     * @throws RuntimeException if the platform reports that UTF-8 is unsupported
     */
    public static String fromURL(String aURLFragment) {
        try {
            return URLDecoder.decode(aURLFragment, "UTF-8");
        } catch (UnsupportedEncodingException ex) {
            // Rethrown unchecked so callers do not have to handle a checked exception.
            throw new RuntimeException("UTF-8 not supported", ex);
        }
    }

    /**
     * Replace characters having special meaning inside HTML tags with their
     * escaped equivalents, using character entities such as {@code &amp;}.
     *
     * <p>The escaped characters are:
     * <ul>
     * <li>{@code <} becomes {@code &lt;}</li>
     * <li>{@code >} becomes {@code &gt;}</li>
     * <li>{@code "} becomes {@code &quot;}</li>
     * <li>{@code '} becomes {@code &#039;}</li>
     * <li>{@code \} becomes {@code &#092;}</li>
     * <li>{@code &} becomes {@code &amp;}</li>
     * </ul>
     *
     * <p>Use cases for this method include:
     * <ul>
     * <li>render ineffective all HTML present in arbitrary text input by a
     * user (in a message board, for example)</li>
     * <li>ensure that arbitrary text appearing inside a tag does not "confuse"
     * the tag. For example, {@code HREF='Blah.do?Page=1&Sort=ASC'} does not
     * comply with strict HTML because of the ampersand, and should be changed
     * to {@code HREF='Blah.do?Page=1&amp;Sort=ASC'}. This is commonly seen in
     * building query strings. (In JSTL, the c:url tag performs this task
     * automatically.)</li>
     * </ul>
     *
     * @param aTagFragment the text to escape
     * @return {@code aTagFragment} with each special character replaced by its entity
     * @throws NullPointerException if {@code aTagFragment} is {@code null}
     */
    public static String forHTMLTag(String aTagFragment) {
        final int length = aTagFragment.length();
        final StringBuilder result = new StringBuilder(length + 16);
        // Index-based loop: a CharacterIterator would stop early at an embedded
        // U+FFFF char, because that value doubles as its DONE sentinel.
        for (int index = 0; index < length; index++) {
            final char character = aTagFragment.charAt(index);
            switch (character) {
                case '<':
                    result.append("&lt;");
                    break;
                case '>':
                    result.append("&gt;");
                    break;
                case '"':
                    result.append("&quot;");
                    break;
                case '\'':
                    result.append("&#039;");
                    break;
                case '\\':
                    result.append("&#092;");
                    break;
                case '&':
                    result.append("&amp;");
                    break;
                default:
                    // Not a special character: copy it through unchanged.
                    result.append(character);
                    break;
            }
        }
        return result.toString();
    }

    /**
     * Replace characters having special meaning in regular expressions with
     * their escaped equivalents, by placing a backslash in front of each one.
     *
     * <p>The escaped characters are:
     * <ul>
     * <li>{@code .}</li>
     * <li>{@code \}</li>
     * <li>{@code ?}, {@code *} and {@code +}</li>
     * <li>{@code &}</li>
     * <li>{@code :}</li>
     * <li>curly braces {@code {}}</li>
     * <li>square brackets {@code []}</li>
     * <li>parentheses {@code ()}</li>
     * <li>{@code ^} and {@code $}</li>
     * </ul>
     *
     * @param aRegexFragment the text to escape
     * @return {@code aRegexFragment} with each listed character preceded by a backslash
     * @throws NullPointerException if {@code aRegexFragment} is {@code null}
     */
    public static String forRegex(String aRegexFragment) {
        final int length = aRegexFragment.length();
        final StringBuilder result = new StringBuilder(length + 16);
        // Index-based loop: a CharacterIterator would stop early at an embedded
        // U+FFFF char, because that value doubles as its DONE sentinel.
        for (int index = 0; index < length; index++) {
            final char character = aRegexFragment.charAt(index);
            if (REGEX_SPECIAL_CHARACTERS.indexOf(character) >= 0) {
                // A single backslash in the output; doubled only because this
                // is a Java character literal.
                result.append('\\');
            }
            result.append(character);
        }
        return result.toString();
    }

}

// References:
// 	>toHTMLString (From: Dev WO <email@hidden>)