Clean and fix HTML with the HtmlCleaner Java library

package com.origami.sgm.util;

import java.util.regex.Pattern;
import org.htmlcleaner.CleanerProperties;
import org.htmlcleaner.HtmlCleaner;
import org.htmlcleaner.SimpleHtmlSerializer;
import org.htmlcleaner.TagNode;

/**
 * Static helpers for tidying HTML markup with the HtmlCleaner library.
 *
 * @author Fernando
 */
public abstract class HtmlUtil {

    /**
     * Matches an {@code <?xml ... ?>} declaration that sits on a single line
     * ({@code .} does not match line terminators). Compiled once so the
     * expression is not re-parsed on every call.
     */
    private static final Pattern XML_DECLARATION = Pattern.compile("\\<\\?xml(.+?)\\?\\>");

    /**
     * Parses the given markup with an {@link HtmlCleaner} using its default
     * {@link CleanerProperties}, serializes the resulting tree back to text
     * with a {@link SimpleHtmlSerializer}, removes every
     * {@code <?xml ... ?>} declaration from that text and trims surrounding
     * whitespace.
     *
     * @param htmlText the markup to clean; {@code null} is treated as empty
     *                 markup instead of being handed to the cleaner
     * @return the serialized, trimmed markup without XML declarations
     */
    public static String cleanHtml(String htmlText) {
        HtmlCleaner cleaner = new HtmlCleaner();
        CleanerProperties props = cleaner.getProperties();

        // Guard against null: the cleaner reads its input as a character
        // stream, which cannot be built from a null string.
        String markup = (htmlText == null) ? "" : htmlText;
        TagNode root = cleaner.clean(markup);

        String serialized = new SimpleHtmlSerializer(props).getAsString(root);

        // The serializer may prepend an <?xml ...?> declaration; strip it.
        return XML_DECLARATION.matcher(serialized).replaceAll("").trim();
    }

}