Popular Posts
Add file to google drive: using Google.Apis.Auth.OAuth2; using Google.Apis.Drive.v2; using Google.Apis.Drive.v2.Data; using Google.Apis.Services; using Google.Apis.Ut...
Enable SSL connection for Jsoup: import org.jsoup.Connection; import org.jsoup.Jsoup; import javax.net.ssl.*; import java.io.IOException; import java.security.KeyManagement...
JavaMail sample: import java.io.File; import java.io.UnsupportedEncodingException; import java.util.Date; import java.util.Properties; import javax.activati...
Blog Archive
Stats
HtmlCleaner
HtmlCleaner version: 2.1
import java.io.IOException;

import org.htmlcleaner.CleanerProperties;
import org.htmlcleaner.HtmlCleaner;
import org.htmlcleaner.TagNode;

public class Test {

    private String refactory(String htmlSource) {
        HtmlCleaner cleaner = new HtmlCleaner();
        // 設定清除選項
        CleanerProperties p = cleaner.getProperties();
        p.setOmitComments(false); // 不清除註解(有bug, 造成結構與原本不同)
        p.setPruneTags("style,script"); // 去掉style, script標籤

        TagNode node = null;
        try {
            node = cleaner.clean(htmlSource);
        } catch (IOException e) {
            e.printStackTrace();
        }
        // 重整結構
        return cleaner.getInnerHtml(node);
    }
}