Popular Posts
Read exif using metadata extraction metadata extraction version : 2.3.1 metadata extraction import java.io.File; import java.io.FileNotFoundException; import java.util.Iterato... Chrome Extension: Easy Cookie A simple cookie viewer/editor : Easy Cookie It's easy to view cookies at a web site Simply add a new cookie ... pushState & ajax page loading Index.cshtml <html> <head>     <title></title>     <link href="//netdna.bootstrapcdn.com/twitter-bootstrap/...
Blog Archive
Stats
HtmlCleaner
HtmlCleaner version: 2.1
import java.io.IOException;

import org.htmlcleaner.CleanerProperties;
import org.htmlcleaner.HtmlCleaner;
import org.htmlcleaner.TagNode;

public class Test {

    private String refactory(String htmlSource) {
        HtmlCleaner cleaner = new HtmlCleaner();
        // 設定清除選項
        CleanerProperties p = cleaner.getProperties();
        p.setOmitComments(false); // 不清除註解(有bug, 造成結構與原本不同)
        p.setPruneTags("style,script"); // 去掉style, script標籤

        TagNode node = null;
        try {
            node = cleaner.clean(htmlSource);
        } catch (IOException e) {
            e.printStackTrace();
        }
        // 重整結構
        return cleaner.getInnerHtml(node);
    }
}