Author: scottbw
Date: Thu Sep 27 13:46:59 2012
New Revision: 1391011
URL: http://svn.apache.org/viewvc?rev=1391011&view=rev
Log:
Handle special HTML entities correctly - see WOOKIE-380
Modified:
incubator/wookie/trunk/src/org/apache/wookie/util/html/HtmlCleaner.java
Modified:
incubator/wookie/trunk/src/org/apache/wookie/util/html/HtmlCleaner.java
URL:
http://svn.apache.org/viewvc/incubator/wookie/trunk/src/org/apache/wookie/util/html/HtmlCleaner.java?rev=1391011&r1=1391010&r2=1391011&view=diff
==============================================================================
--- incubator/wookie/trunk/src/org/apache/wookie/util/html/HtmlCleaner.java (original)
+++ incubator/wookie/trunk/src/org/apache/wookie/util/html/HtmlCleaner.java Thu Sep 27 13:46:59 2012
@@ -57,6 +57,13 @@ public class HtmlCleaner implements IHtm
properties.setOmitXmlDeclaration(true);
properties.setUseCdataForScriptAndStyle(true);
properties.setUseEmptyElementTags(false);
+ //
+ // Ensure special HTML entities (e.g. &copy;) are translated, and emitted
+ // as numeric character references. See WOOKIE-380.
+ //
+ properties.setTranslateSpecialEntities(true);
+ properties.setTransSpecialEntitiesToNCR(true);
+
}
/* (non-Javadoc)