/*
* Copyright (C) 2000 - 2009 TagServlet Ltd
*
* This file is part of Open BlueDragon (OpenBD) CFML Server Engine.
*
* OpenBD is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* Free Software Foundation,version 3.
*
* OpenBD is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with OpenBD. If not, see http://www.gnu.org/licenses/
*
* Additional permission under GNU GPL version 3 section 7
*
* If you modify this Program, or any covered work, by linking or combining
* it with any of the JARS listed in the README.txt (or a modified version of
* (that library), containing parts covered by the terms of that JAR, the
* licensors of this Program grant you additional permission to convey the
* resulting work.
* README.txt @ http://www.openbluedragon.org/license/README.txt
*
* http://www.openbluedragon.org/
*/
package com.naryx.tagfusion.expression.function.ext;
import java.io.StringReader;
import java.io.StringWriter;
import org.w3c.tidy.Tidy;
import org.w3c.tidy.TidyMessage;
import org.w3c.tidy.TidyMessageListener;
import com.naryx.tagfusion.cfm.engine.cfArgStructData;
import com.naryx.tagfusion.cfm.engine.cfData;
import com.naryx.tagfusion.cfm.engine.cfSession;
import com.naryx.tagfusion.cfm.engine.cfStringData;
import com.naryx.tagfusion.cfm.engine.cfmRunTimeException;
import com.naryx.tagfusion.expression.function.functionBase;
/*
* Provides a wrapper to the JTidy release
*/
public class HtmlCleanUp extends functionBase {
private static final long serialVersionUID = 1L;
public HtmlCleanUp(){
min = 1; max = 1;
setNamedParams( new String[]{ "string" } );
}
public String[] getParamInfo(){
return new String[]{
"html block",
};
}
public java.util.Map getInfo(){
return makeInfo(
"string",
"Runs the W3 Tidy utility against the passed in HTML, performing a series of cleanup and HTML repair routines",
ReturnType.STRING );
}
public cfData execute(cfSession _session, cfArgStructData argStruct ) throws cfmRunTimeException {
try{
Tidy tidy = new Tidy();
final StringBuilder errors = new StringBuilder(32);
tidy.setMessageListener( new TidyMessageListener(){
public void messageReceived(TidyMessage mess) {
errors.append( "Line: " + mess.getLine() + "." + mess.getColumn() + "; " + mess.getMessage() + "\r\n" );
}
});
tidy.setSmartIndent( false );
tidy.setSpaces( 2 );
tidy.setTabsize( 2 );
tidy.setWraplen( 0 );
tidy.setLogicalEmphasis( true );
tidy.setMakeClean( true );
tidy.setQuiet( true );
tidy.setDropEmptyParas( true );
tidy.setXHTML( true );
tidy.setXmlSpace( true );
tidy.setTrimEmptyElements( true );
tidy.setBreakBeforeBR( false );
tidy.setUpperCaseTags( false );
tidy.setUpperCaseAttrs( false );
tidy.setWord2000( true );
tidy.setFixUri(false);
tidy.setFixBackslash( false );
tidy.setIndentAttributes( false );
tidy.setShowWarnings( false );
tidy.setShowErrors( 1 );
tidy.setOnlyErrors( false );
tidy.setPrintBodyOnly( false );
tidy.setJoinClasses( true );
tidy.setJoinStyles( true );
String inHtml = getNamedStringParam(argStruct,"string","");
StringReader reader = new StringReader( inHtml );
StringWriter writer = new StringWriter();
tidy.parse( reader, writer );
if ( errors.length() != 0 ){
throwException( _session, errors.toString() );
return null;
}else{
String outHtml = writer.toString();
int c1 = outHtml.indexOf("<body>");
if ( c1 >= 0 ){
outHtml = outHtml.substring( c1 + 6 );
c1 = outHtml.lastIndexOf("</body>");
if ( c1 >= 0 ){
outHtml = outHtml.substring( 0, c1 );
}
}
return new cfStringData( outHtml );
}
}catch( Exception e ){
throwException( _session, e.getMessage() );
return null;
}
}
}