Merge pull request #529 from k9mail/ignore_meta_refresh
Sanitize HTML to remove meta refresh
This commit is contained in:
commit
4db57dfc85
3 changed files with 153 additions and 1 deletions
54
k9mail/src/main/java/com/fsck/k9/helper/HtmlSanitizer.java
Normal file
54
k9mail/src/main/java/com/fsck/k9/helper/HtmlSanitizer.java
Normal file
|
@ -0,0 +1,54 @@
|
|||
package com.fsck.k9.helper;
|
||||
|
||||
|
||||
import org.htmlcleaner.CleanerProperties;
|
||||
import org.htmlcleaner.HtmlCleaner;
|
||||
import org.htmlcleaner.HtmlSerializer;
|
||||
import org.htmlcleaner.SimpleHtmlSerializer;
|
||||
import org.htmlcleaner.TagNode;
|
||||
|
||||
|
||||
public class HtmlSanitizer {
|
||||
private static final HtmlCleaner HTML_CLEANER;
|
||||
private static final HtmlSerializer HTML_SERIALIZER;
|
||||
|
||||
static {
|
||||
CleanerProperties properties = createCleanerProperties();
|
||||
HTML_CLEANER = new HtmlCleaner(properties);
|
||||
HTML_SERIALIZER = new SimpleHtmlSerializer(properties);
|
||||
}
|
||||
|
||||
|
||||
private HtmlSanitizer() {}
|
||||
|
||||
public static String sanitize(String html) {
|
||||
TagNode rootNode = HTML_CLEANER.clean(html);
|
||||
|
||||
removeMetaRefresh(rootNode);
|
||||
|
||||
return HTML_SERIALIZER.getAsString(rootNode, "UTF8");
|
||||
}
|
||||
|
||||
private static CleanerProperties createCleanerProperties() {
|
||||
CleanerProperties properties = new CleanerProperties();
|
||||
|
||||
// See http://htmlcleaner.sourceforge.net/parameters.php for descriptions
|
||||
properties.setNamespacesAware(false);
|
||||
properties.setAdvancedXmlEscape(false);
|
||||
properties.setOmitXmlDeclaration(true);
|
||||
properties.setOmitDoctypeDeclaration(false);
|
||||
properties.setTranslateSpecialEntities(false);
|
||||
properties.setRecognizeUnicodeChars(false);
|
||||
|
||||
return properties;
|
||||
}
|
||||
|
||||
private static void removeMetaRefresh(TagNode rootNode) {
|
||||
for (TagNode element : rootNode.getElementListByName("meta", true)) {
|
||||
String httpEquiv = element.getAttributeByName("http-equiv");
|
||||
if (httpEquiv != null && httpEquiv.trim().equalsIgnoreCase("refresh")) {
|
||||
element.removeFromTree();
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
|
@ -11,6 +11,8 @@ import android.widget.Toast;
|
|||
import com.fsck.k9.K9;
|
||||
import com.fsck.k9.R;
|
||||
import com.fsck.k9.helper.HtmlConverter;
|
||||
import com.fsck.k9.helper.HtmlSanitizer;
|
||||
|
||||
|
||||
public class MessageWebView extends RigidWebView {
|
||||
|
||||
|
@ -123,7 +125,9 @@ public class MessageWebView extends RigidWebView {
|
|||
}
|
||||
content += HtmlConverter.cssStylePre();
|
||||
content += "</head><body>" + text + "</body></html>";
|
||||
loadDataWithBaseURL("http://", content, "text/html", "utf-8", null);
|
||||
|
||||
String sanitizedContent = HtmlSanitizer.sanitize(content);
|
||||
loadDataWithBaseURL("http://", sanitizedContent, "text/html", "utf-8", null);
|
||||
resumeTimers();
|
||||
}
|
||||
|
||||
|
|
|
@ -0,0 +1,94 @@
|
|||
package com.fsck.k9.helper;
|
||||
|
||||
|
||||
import org.junit.Test;
|
||||
|
||||
import static org.junit.Assert.assertEquals;
|
||||
|
||||
|
||||
public class HtmlSanitizerTest {
|
||||
@Test
|
||||
public void shouldRemoveMetaRefreshInHead() {
|
||||
String html = "<html>" +
|
||||
"<head><meta http-equiv=\"refresh\" content=\"1; URL=http://example.com/\"></head>" +
|
||||
"<body>Message</body>" +
|
||||
"</html>";
|
||||
assertEquals("<html><head></head><body>Message</body></html>", HtmlSanitizer.sanitize(html));
|
||||
}
|
||||
|
||||
@Test
|
||||
public void shouldRemoveMetaRefreshBetweenHeadAndBody() {
|
||||
String html = "<html>" +
|
||||
"<head></head><meta http-equiv=\"refresh\" content=\"1; URL=http://example.com/\">" +
|
||||
"<body>Message</body>" +
|
||||
"</html>";
|
||||
assertEquals("<html><head></head><body>Message</body></html>", HtmlSanitizer.sanitize(html));
|
||||
}
|
||||
|
||||
@Test
|
||||
public void shouldRemoveMetaRefreshInBody() {
|
||||
String html = "<html>" +
|
||||
"<head></head>" +
|
||||
"<body><meta http-equiv=\"refresh\" content=\"1; URL=http://example.com/\">Message</body>" +
|
||||
"</html>";
|
||||
assertEquals("<html><head></head><body>Message</body></html>", HtmlSanitizer.sanitize(html));
|
||||
}
|
||||
|
||||
@Test
|
||||
public void shouldRemoveMetaRefreshWithUpperCaseAttributeValue() {
|
||||
String html = "<html>" +
|
||||
"<head><meta http-equiv=\"REFRESH\" content=\"1; URL=http://example.com/\"></head>" +
|
||||
"<body>Message</body>" +
|
||||
"</html>";
|
||||
assertEquals("<html><head></head><body>Message</body></html>", HtmlSanitizer.sanitize(html));
|
||||
}
|
||||
|
||||
@Test
|
||||
public void shouldRemoveMetaRefreshWithMixedCaseAttributeValue() {
|
||||
String html = "<html>" +
|
||||
"<head><meta http-equiv=\"Refresh\" content=\"1; URL=http://example.com/\"></head>" +
|
||||
"<body>Message</body>" +
|
||||
"</html>";
|
||||
assertEquals("<html><head></head><body>Message</body></html>", HtmlSanitizer.sanitize(html));
|
||||
}
|
||||
|
||||
@Test
|
||||
public void shouldRemoveMetaRefreshWithoutQuotesAroundAttributeValue() {
|
||||
String html = "<html>" +
|
||||
"<head><meta http-equiv=refresh content=\"1; URL=http://example.com/\"></head>" +
|
||||
"<body>Message</body>" +
|
||||
"</html>";
|
||||
assertEquals("<html><head></head><body>Message</body></html>", HtmlSanitizer.sanitize(html));
|
||||
}
|
||||
|
||||
@Test
|
||||
public void shouldRemoveMetaRefreshWithSpacesInAttributeValue() {
|
||||
String html = "<html>" +
|
||||
"<head><meta http-equiv=\"refresh \" content=\"1; URL=http://example.com/\"></head>" +
|
||||
"<body>Message</body>" +
|
||||
"</html>";
|
||||
assertEquals("<html><head></head><body>Message</body></html>", HtmlSanitizer.sanitize(html));
|
||||
}
|
||||
|
||||
@Test
|
||||
public void shouldRemoveMultipleMetaRefreshTags() {
|
||||
String html = "<html>" +
|
||||
"<head><meta http-equiv=\"refresh\" content=\"1; URL=http://example.com/\"></head>" +
|
||||
"<body><meta http-equiv=\"refresh\" content=\"1; URL=http://example.com/\">Message</body>" +
|
||||
"</html>";
|
||||
assertEquals("<html><head></head><body>Message</body></html>", HtmlSanitizer.sanitize(html));
|
||||
}
|
||||
|
||||
@Test
|
||||
public void shouldRemoveMetaRefreshButKeepOtherMetaTags() {
|
||||
String html = "<html>" +
|
||||
"<head>" +
|
||||
"<meta http-equiv=\"content-type\" content=\"text/html; charset=UTF-8\">" +
|
||||
"<meta http-equiv=\"refresh\" content=\"1; URL=http://example.com/\">" +
|
||||
"</head>" +
|
||||
"<body>Message</body>" +
|
||||
"</html>";
|
||||
assertEquals("<html><head><meta http-equiv=\"content-type\" content=\"text/html; charset=UTF-8\" /></head>" +
|
||||
"<body>Message</body></html>", HtmlSanitizer.sanitize(html));
|
||||
}
|
||||
}
|
Loading…
Reference in a new issue