Author: scottbw
Date: Sun Oct 7 11:56:41 2012
New Revision: 1395279
URL: http://svn.apache.org/viewvc?rev=1395279&view=rev
Log:
Altered the HtmlCleaner config to recognise Unicode decimal numeric characters.
This *almost* fixes WOOKIE-380; however, hex Unicode characters still don't
work properly.
Modified:
incubator/wookie/trunk/src/org/apache/wookie/util/html/HtmlCleaner.java
Modified:
incubator/wookie/trunk/src/org/apache/wookie/util/html/HtmlCleaner.java
URL:
http://svn.apache.org/viewvc/incubator/wookie/trunk/src/org/apache/wookie/util/html/HtmlCleaner.java?rev=1395279&r1=1395278&r2=1395279&view=diff
==============================================================================
--- incubator/wookie/trunk/src/org/apache/wookie/util/html/HtmlCleaner.java (original)
+++ incubator/wookie/trunk/src/org/apache/wookie/util/html/HtmlCleaner.java Sun Oct 7 11:56:41 2012
@@ -63,6 +63,8 @@ public class HtmlCleaner implements IHtm
//
properties.setTranslateSpecialEntities(true);
properties.setTransSpecialEntitiesToNCR(true);
+ properties.setAdvancedXmlEscape(true);
+ properties.setRecognizeUnicodeChars(false);
}