DocumentConverterHelper.java example

Explorer
infoglue-master
- src
  - java
- test
  - java
    - org
      - infoglue
        cms
        applications
        contenttool
        ContentCategoryActionTest.java
        managementtool
        CategoryActionTest.java
        InstallationValidatorAction.java
        RepositoryTester.java
        ViewContentTypeDefinitionActionTest.java
        mydesktoptool
        actions
        ViewMyDesktopToolStartPageActionTest.java
        controllers
        CategoryControllerTest.java
        ContentCategoryControllerTest.java
        ContentStateControllerTest.java
        ContentTypeDefinitionControllerTest.java
        MysqlJDBCServiceTest.java
        PublicationControllerTest.java
        SiteNodeVersionControllerTest.java
        WorkflowControllerTest.java
        entities
        ValidationTestCase.java
        management
        CategoryTest.java
        ValidationItem.java
        mydesktop
        WorkflowVOTest.java
        publishing
        EditionBrowserTest.java
        util
        FakeFilterConfig.java
        FakeHttpServletRequest.java
        FakeHttpServletResponse.java
        FakeHttpSession.java
        FakeServletContext.java
        InfoGlueTestCase.java
        WebWorkTestCase.java
        WorkflowTestCase.java
        workflow
        OwnerStepFilterTest.java
        workflow
        CreateNewsTest.java
        NewsWorkflowTestCase.java
        deliver
        controllers
        ContentDeliveryControllerTest.java
/* ===============================================================================
 *
 * Part of the InfoGlue Content Management Platform (www.infoglue.org)
 *
 * ===============================================================================
 *
 *  Copyright (C)
 * 
 * This program is free software; you can redistribute it and/or modify it under
 * the terms of the GNU General Public License version 2, as published by the
 * Free Software Foundation. See the file LICENSE.html for more information.
 * 
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY, including the implied warranty of MERCHANTABILITY or FITNESS
 * FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
 * 
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc. / 59 Temple
 * Place, Suite 330 / Boston, MA 02111-1307 / USA.
 *
 * ===============================================================================
 */

package org.infoglue.cms.util;

import java.io.BufferedOutputStream;
import java.io.BufferedReader;
import java.io.BufferedWriter;
import java.io.File;
import java.io.FileNotFoundException;
import java.io.FileOutputStream;
import java.io.FileReader;
import java.io.FileWriter;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.io.Writer;
import java.util.Enumeration;
import java.util.Iterator;
import java.util.List;
import java.util.StringTokenizer;
import java.util.zip.ZipEntry;
import java.util.zip.ZipException;
import java.util.zip.ZipFile;

import javax.servlet.http.HttpServletRequest;

import org.apache.log4j.Logger;
import org.infoglue.deliver.applications.databeans.ConvertedDocumentBean;
import org.jdom.Document;
import org.jdom.Element;
import org.jdom.Namespace;
import org.jdom.input.SAXBuilder;
import org.jdom.xpath.XPath;

import com.artofsolving.jodconverter.DocumentConverter;
import com.artofsolving.jodconverter.openoffice.connection.OpenOfficeConnection;
import com.artofsolving.jodconverter.openoffice.connection.SocketOpenOfficeConnection;
import com.artofsolving.jodconverter.openoffice.converter.OpenOfficeDocumentConverter;

public class DocumentConverterHelper 
{
	private final static Logger logger 	= Logger.getLogger(DocumentConverterHelper.class.getName());
	private static Namespace officeNs 	= Namespace.getNamespace("office", "urn:oasis:names:tc:opendocument:xmlns:office:1.0");
	private static Namespace textNs 	= Namespace.getNamespace("text", "urn:oasis:names:tc:opendocument:xmlns:text:1.0");
	
	public ConvertedDocumentBean convert(HttpServletRequest request, File aDocFile, String aTitle, String aMenuTextLength, List aCssList, String rewrite, String keepMenuExpanded) 
	{
		ConvertedDocumentBean convertedDocument = new ConvertedDocumentBean();
		int menuMaxLength						= 20;
		
		logger.info("-----------------------------------------------");
		logger.info("Doc file: " + aDocFile.getAbsolutePath());
		logger.info("Title: " + aTitle);
		logger.info("Menu text length: " + aMenuTextLength);
		logger.info("CSS list: " + aCssList);
		logger.info("Rewrite: " + rewrite);
		logger.info("-----------------------------------------------");
		
		try
		{			
			if (aTitle == null || aTitle.trim().equals(""))
			{
				aTitle = "Inneh�llsf�rteckning";
			}
			
			if (aMenuTextLength == null || aMenuTextLength.trim().equals(""))
			{
				aMenuTextLength = "20";
			}
			
			try
			{
				menuMaxLength = new Integer(aMenuTextLength).intValue();
			}
			catch(NumberFormatException nfe)
			{
				// Do nothing. Use the default value of 20 instead.
			}
			
			OpenOfficeConnection connection = new SocketOpenOfficeConnection(8100);			
			
			//------------------------
			// Setup the output files
			//------------------------
			
			String fileName 		= aDocFile.getName().substring(0, aDocFile.getName().indexOf("."));
			int idIndex 			= fileName.indexOf("_");
			String digitalAssetPath = CmsPropertyHandler.getDigitalAssetPath();
			String folderName		= "";
			
			if(idIndex > -1)
			{
				String fileIdString = fileName.substring(0, idIndex);
				int fileId 			= Integer.parseInt(fileIdString);
				folderName 	= "" + (fileId / 1000);
				digitalAssetPath	= digitalAssetPath + File.separator + folderName;
			}
								
			//----------------------------------------
			// Add the name of the folder to the path
			//----------------------------------------
			
			digitalAssetPath 		= digitalAssetPath + File.separator + fileName;
			
			logger.info("Directory to write files to: " + digitalAssetPath);			
			
			//-------------------------------------------------
			// Add a folder where the files are to be written.
			//-------------------------------------------------
			
			String newFilePath 		= digitalAssetPath + File.separator + fileName;
						
			File pdfFile 			= new File(newFilePath + ".pdf");
			File odtFile 			= new File(newFilePath + ".odt");
			File htmlFile 			= new File(newFilePath + ".html");
			File contentXmlFile 	= new File(digitalAssetPath + File.separator + "content.xml");;
			
			//----------------------------------------------
			// Check if the doc has already been converted.
			// If it has, we don't need another conversion.
			//----------------------------------------------
			
			File documentDir = new File(digitalAssetPath);
			if (!documentDir.exists() || rewrite.equals("true"))
			{
				logger.info("The directory " + digitalAssetPath + " does not exist. Creating it.");
				
				documentDir.mkdir();
				
				logger.info("The directory " + digitalAssetPath + " was successfully created.");
				
				logger.info("Connecting to server...");								
				
				connection.connect();
				
				logger.info("Connection ok");
				
				logger.info("Conversion START");
					
				convertDocument(aDocFile, htmlFile, connection);
				if(!aDocFile.getName().substring(aDocFile.getName().indexOf(".") + 1).equalsIgnoreCase("odt"))
				{
					convertDocument(aDocFile, odtFile, connection);
				}
				else
				{
					odtFile = aDocFile;
				}

				convertDocument(aDocFile, pdfFile, connection);
				connection.disconnect();
				
				logger.info("Conversion END");			
				
				//------------------------------------------------
				// Extract the content.xml file from the ODT file
				// so we can parse the XML and generate the TOC
				//------------------------------------------------
				
				logger.info("Extracting content.xml...");
				
				logger.info("odtFile: " + odtFile.getPath());
				
				logger.info("target path: : " + digitalAssetPath);
				
				contentXmlFile = extractContentXml(odtFile, digitalAssetPath);
				
				logger.info("Done extracting content.xml");
				
				//--------------------------------------------------------
				// Insert the anchors, remove the TOC, remove CSS styles
				// and add a link to the CMS-CSS to the the HTML handbook
				// (Since we've just generated a new nav above)
				//--------------------------------------------------------
				
				logger.info("Updating handbook with extra info");
				
				adaptHandbook(htmlFile, aCssList);
				
				logger.info("Done updating handbook with extra info");
			}
			//--------------------------------
			// Get the URL:s to the resources
			//--------------------------------
			
			logger.info("Extracting URL:s to resources.");
			
			String digitalAssetUrl = CmsPropertyHandler.getDigitalAssetBaseUrl();
			
			//----------------------------------------------------------------
			// Add the contextPath to the URL to avoid problems with niceURIs.
			//-----------------------------------------------------------------
			
			String contextPath = request.getContextPath();
			
			digitalAssetUrl = contextPath + "/" + digitalAssetUrl;
			
			//--------------------------------
			// Add the folder name to the URL
			//--------------------------------
			
			if (!folderName.equals(""))
			{
				digitalAssetUrl = digitalAssetUrl + "/" + folderName;
			}
						
			String htmlFileUrl 	= digitalAssetUrl + "/" + fileName + "/" + htmlFile.getName();
			String pdfFileUrl	= digitalAssetUrl + "/" + fileName + "/" + pdfFile.getName();
			String odtFileUrl	= digitalAssetUrl + "/" + fileName + "/" + odtFile.getName();
			
			logger.info("htmlFileUrl: " + htmlFileUrl);
			logger.info("pdfFileUrl: " + pdfFileUrl);
			logger.info("odtFileUrl: " + odtFileUrl);
			
			//--------------------------
			// Generate HTML TOC string
			//--------------------------
			
			logger.info("Generating TOC...");
			
			String tocString 	= generateHtmlToc(contentXmlFile, htmlFileUrl, aTitle, menuMaxLength, keepMenuExpanded);

			logger.info("Done generating TOC");
			
			convertedDocument.setHtmlFileUrl(htmlFileUrl);
			convertedDocument.setPdfFileUrl(pdfFileUrl);
			convertedDocument.setOdtFileUrl(odtFileUrl);
			convertedDocument.setTocString(tocString);
		}
		catch(Exception e)
		{
			logger.error("An error occurred when converting document:" + e.getMessage(), e);
		}
		
		logger.info("END");
		
		return convertedDocument;
	}
	
	private static String generateHtmlToc(File aContentXmlFile, String aHtmlFileUrl, String aTitle, int aMenuMaxLength, String keepMenuExpanded) throws Exception 
	{		
		logger.info("Start generating HTML TOC: xmlFile: " + aContentXmlFile.getPath() + ", htmlFileUrl: " + aHtmlFileUrl);
		
		SAXBuilder builder 	= new SAXBuilder();
		Document doc 		= builder.build(aContentXmlFile);
		List tocElements	= null;
		
		//--------------------------------------------------------------
		// Find the element in the XML containing the Table Of Contents
		//--------------------------------------------------------------
		
		try
		{
			XPath xpath 					= XPath.newInstance("/descendant::text:index-body[1]");
			xpath.addNamespace(officeNs);
			xpath.addNamespace(textNs);
			
			Object temp						= xpath.selectSingleNode(doc);
			
			if (temp != null)
			{
				Element textIndexBodyElement 	= (Element)temp;
				tocElements						= textIndexBodyElement.getChildren();
			}			
		}
		catch(Exception e)
		{
			throw new Exception("The document structure is incorrect. Please create a document containing a table of contents. " + e.getMessage());
		}
		
		//------------------------------------
		// Generate the HTML for the TOC menu
		//------------------------------------
		
		if (tocElements != null)
		{
			logger.info("Found TOC elements, generating TOC.");
			StringBuffer htmlMenuSb = new StringBuffer();			
			generateHtml(tocElements.toArray(), htmlMenuSb, aHtmlFileUrl, aTitle, aMenuMaxLength, keepMenuExpanded);		
			return htmlMenuSb.toString();
		}
		else
		{
			throw new Exception ("The list of TOC elements was null.");
		}
	}

	private static StringBuffer generateHtml(Object[] aTocElements, StringBuffer aReturnSb, String aHtmlFileUrl, String aTitle, int aMenuMaxLength, String keepMenuExpanded) throws Exception 
	{				
		Element child 					= null;
		Element grandChild				= null;
		String elementText				= "";		
		String headingNumber			= "";
		int startPosition 				= 0;
		String previousHeadingNumber 	= ""; 
		int level						= 0;
		int previousLevel				= 0;
		int numberOfEndUls 				= 0;
		StringTokenizer st				= null;
		int linkCounter					= 0;		
		String croppedElementText		= "";
		int cropCounter					= 0;
		boolean willCrop				= false;
		
		boolean keepMenuExpandedBoolean = "true".equalsIgnoreCase(keepMenuExpanded);
		
		String javaScriptToExpandAndCollapse;
		StringBuilder headingIds = new StringBuilder();
		
		if(keepMenuExpandedBoolean)
		{
			javaScriptToExpandAndCollapse = "\n<script type='text/javascript'> \n" +
			"function expandOrCollapse(id, eventHandle){ \n" +
			"if (!eventHandle) var eventHandle = window.event; \n" +
			"if (eventHandle) eventHandle.cancelBubble = true; \n" +
			"if (eventHandle.stopPropagation) eventHandle.stopPropagation();\n" +
			"var theElement = document.getElementById(id); \n" +
			"if ( theElement == null ) \n" +
			"{return;} \n" +
			"var listElementStyle=theElement.style; \n" +
			"if (listElementStyle.display!='none') \n" +
			"{listElementStyle.display='none';} \n" +
			"else \n" +
			"{listElementStyle.display='block';} \n" +
			"} \n" +
			"</script>\n";
		}
		else
		{		
			for(Object tmpChild : aTocElements)
			{
				if(tmpChild != null && !((Element)tmpChild).getText().equals(""))
				{
					String tmp = ((Element)tmpChild).getText().substring(0, ((Element)tmpChild).getText().indexOf(" ")).replace(".", "");
					
					headingIds.append(tmp);
					headingIds.append(",");
				}
				else if (((Element)tmpChild).getText() == null || ((Element)tmpChild).getText().equals(""))
				{
					grandChild = ((Element)tmpChild).getChild("a", textNs);
					
					if (grandChild != null && grandChild.getText().indexOf(" ") != -1)
					{
						String tmp = grandChild.getText().substring(0, grandChild.getText().indexOf(" ")).replace(".", "");
						headingIds.append(tmp);
						headingIds.append(",");
					}
				}
			}
			
			javaScriptToExpandAndCollapse =
			"\n<script type='text/javascript'> \n" +
			"String.prototype.startsWith = function(prefix) {return this.indexOf(prefix) === 0;}\n" +
			"function expandOrCollapse(id, eventHandle){ \n" +
			"if (!eventHandle) var eventHandle = window.event; \n" +
			"if (eventHandle) eventHandle.cancelBubble = true; \n" +
			"if (eventHandle.stopPropagation) eventHandle.stopPropagation();\n" +
			"var ids = '" + headingIds.toString() + "';\n" +
			"var myArray = ids.split(','); \n" +
			"for(var i=0;i<myArray.length; i++){ \n" +
			"	if(document.getElementById(myArray[i]) != null){\n" +
			"		if(id.startsWith(myArray[i])){\n" +
			"			document.getElementById(myArray[i]).style.display='block';}\n" +
			"		else{document.getElementById(myArray[i]).style.display='none';}\n" +
			"}\n}\n}\n" +
			"</script>\n";
		}
		
		aReturnSb.append(javaScriptToExpandAndCollapse);
		
		aReturnSb.append("<div id=\"submenu\">");
		aReturnSb.append("<div class=\"menuheader\">" + aTitle + "</div>");

		logger.info("TOC generation start. Number of TOC elements: " + aTocElements.length);
		
		while (startPosition < aTocElements.length)
		{		
			logger.info("");
			logger.info("-------------- New TOC element (startPosition: " + startPosition + ") ------------");
			
			child 			= (Element)aTocElements[startPosition];
			elementText 	= child.getText();	
			
			logger.info("Child name: " + elementText);
		
			//-----------------------------------------------------------------------------
			// If no text was found, check if there is a link-node below this node.
			// If so, use the text from the link node instead. This is necessary to handle 
			// TOCs generated by newer versions of Word.
			//-----------------------------------------------------------------------------
			
			if (elementText == null || elementText.equals(""))
			{
				logger.info("No text found on child, looking for link child instead.");
				
				grandChild = child.getChild("a", textNs);
				
				if (grandChild != null)
				{
					elementText = grandChild.getText();	
				
					logger.info("Grandchild text: " + elementText);
				}
				else
				{
					logger.info("No grandchild was found...");
				}
			}
			
			if (elementText != null && !elementText.equals("") && elementText.indexOf(" ") != -1)
			{
				headingNumber 	= elementText.substring(0, elementText.indexOf(" "));				
				st 				= new StringTokenizer(headingNumber, ".");
				level 			= st.countTokens();				
				
				logger.info("Heading number: " + headingNumber + ", level: " + level + ", text: " + elementText);
				
				if (level > previousLevel)
				{
					String attributes = previousHeadingNumber.equals("") ? "" : " id='" + previousHeadingNumber.replace(".", "") + "' style=\"display:none\"";
					aReturnSb.append("<ul" + attributes + ">");
				}
				else if(level < previousLevel)
				{
					aReturnSb.append("</li>");
					numberOfEndUls = previousLevel - level;

					for (int i = 0; i < numberOfEndUls; i ++)
					{
						aReturnSb.append("</ul></li>");					
					}
				}
				else
				{
					aReturnSb.append("</li>");
				}
				
				//-----------------------------------------------------------------
				// If there is a page number at the end of the line, get rid of it
				//-----------------------------------------------------------------
				
				cropCounter = elementText.length();
				char myChar = elementText.charAt(cropCounter - 1);
				
				while (cropCounter > 0 && Character.isDigit(myChar))
				{		
					cropCounter --;
					myChar = elementText.charAt(cropCounter);
					willCrop = true;
				}
				
				if (willCrop)
				{
					cropCounter ++;
					logger.info("Removing trailing line number.");
				}
				
				if (cropCounter < elementText.length())
				{
					elementText = elementText.substring(0, cropCounter);
				}
				else
				{
					logger.info("The cropCounter ended up outside the string (cropCounter: " + cropCounter + ", elementText.length: " + elementText.length() + ")");
				}
				//------------------------------------------------------------------------
				// Crop the text and add "..." if it's longer than the allowed max length
				//------------------------------------------------------------------------
				
				if (elementText.length() > aMenuMaxLength)
				{
					logger.info("Text too long, cropping");
					
					croppedElementText = elementText.substring(0, aMenuMaxLength) + "...";
				}
				else
				{
					croppedElementText = elementText;
				}
				
				logger.info("Adding TOC <li> element on level " + level + ": " + croppedElementText + ", linkCounter: " + linkCounter);				
				String onClickExpandOrCollapse = (startPosition + 1) <= aTocElements.length ?  " onclick=\"expandOrCollapse('" + headingNumber.replace(".", "") + "',event);\"" : "";
				String onClickScroll = " onclick=\"window.frames['handbookFrame'].scrollToAnchor('link" + linkCounter + "'); return false;\"";
				
				aReturnSb.append("\n<li" + onClickExpandOrCollapse + "><p><a target=\"handbookFrame\" href=\"" + aHtmlFileUrl + "#link" + linkCounter + "\" title=\"" + elementText + "\"" + onClickScroll + ">" + croppedElementText + "</a></p>");
				previousHeadingNumber 	= headingNumber;
				previousLevel 			= level;
				linkCounter ++;
			}
			else
			{
				logger.info("This node does not meet the requirements for a TOC element: " + elementText);				
			}
			startPosition = startPosition + 1;
		}
		
		aReturnSb.append("\n</li></ul>");
		logger.info("TOC generation end.");
		
		aReturnSb.append("\n</div>");

		return aReturnSb;		
	}
	
	public static void adaptHandbook(File aHandbookHtmlFile, List aCssList) throws Exception
	{
		String originalHtmlContent 		= readFileIntoString(aHandbookHtmlFile);
		String htmlContentWithoutToc	= removeTocFromHtml(originalHtmlContent);
		String htmlContentWithAnchors 	= insertAnchorsAndJavaScript(htmlContentWithoutToc);
		String htmlWithProperCss		= fixCss(htmlContentWithAnchors, aCssList);
		writeStringToFile(aHandbookHtmlFile, htmlWithProperCss);
	}
	
	private static String fixCss(String aHtmlContent, List aCssList)
	{		
		logger.info("About to add the CSS links to the page");
		
		StringBuffer sb 				= new StringBuffer();		
		int cssStartIndex 				= aHtmlContent.indexOf("<STYLE TYPE=\"text/css\">");	
		if (cssStartIndex >= 0)
		{
			String start 					= aHtmlContent.substring(0, cssStartIndex);
			String temp 					= aHtmlContent.substring(cssStartIndex + 1);
			String end 						= temp.substring(temp.indexOf("</STYLE>") + 8);		
			StringBuffer linkedCssString 	= new StringBuffer();
			Iterator it 					= aCssList.iterator();
			String cssString 				= "";
			
			while (it.hasNext())
			{
				cssString = (String)it.next();
				
				logger.info("Adding CSS: " + cssString);
				
				cssString = "<link href=\"" + cssString + "\" rel=\"stylesheet\" type=\"text/css\" />" + '\n';
				linkedCssString.append(cssString);
			}
			
			sb.append(start);
			sb.append(linkedCssString.toString());
			sb.append(end);	
		}
		logger.info("Done adding CSS links.");
		
		return sb.toString();
	}
	
	private static String removeTocFromHtml(String aHtmlContent)
	{
		logger.info("About to remove TOC from HTML");
		
		StringBuffer sb 	= new StringBuffer();
		
		int tocStartIndex 	= -1;
		
		//--------------------------------------------------
		// Look for the start of the TOC if it's in English
		//--------------------------------------------------
		
		tocStartIndex		= aHtmlContent.indexOf("<DIV ID=\"Table of Contents1\" DIR=\"LTR\">");
		
		//--------------------------------------------------
		// Look for the start of the TOC if it's in Swedish
		//--------------------------------------------------
		
		if (tocStartIndex == -1)
		{
			tocStartIndex	= aHtmlContent.indexOf("<DIV ID=\"Innehållsförteckning1\" DIR=\"LTR\">");
		}
		
		if (tocStartIndex > -1)
		{		
			logger.info("The HTML string contains a TOC beginning at position " + tocStartIndex + ". Removing it.");
			
			String start 	= aHtmlContent.substring(0, tocStartIndex);
			String temp 	= aHtmlContent.substring(tocStartIndex + 1);
			String end 		= temp.substring(temp.indexOf("</DIV>") + 6);
			
			sb.append(start);
			sb.append(end);
			
			logger.info("The TOC was succesfully removed.");
		}
		else
		{
			logger.info("No TOC found in the HTML string.");
			
			sb.append(aHtmlContent);
		}
		return sb.toString();
	}

	private static String insertAnchorsAndJavaScript(String aOriginalHtmlContent) 
	{		
		StringBuffer modifiedHtmlContent 	= new StringBuffer();
		StringTokenizer st 					= new StringTokenizer(aOriginalHtmlContent, System.getProperty("line.separator"));
		String lineString					= "";
		int linkCounter						= 0;
		
		
		
		while (st.hasMoreTokens())
		{
			lineString = st.nextToken();
			
			if(lineString.indexOf("<HEAD>") > -1)
			{
				String str = "\n<script type='text/javascript'> \n" +
				"function scrollToAnchor(anchorID){ \n" +
				"if(anchorID!=null){ \n" +
				"anchorPos = document.getElementById(anchorID).offsetTop;\n" +
				"document.body.scrollTop = anchorPos;}}\n" +
				"</script>";
				
				lineString = lineString.concat(str);
			}
			
			if (lineString.indexOf("<H1") > -1)
			{			
				lineString = lineString.replaceAll("<H1", "<A NAME=\"link" + linkCounter + "\" ID=\"link" + linkCounter + "\"></A><H1");				
				linkCounter ++;	
			}
			else if (lineString.indexOf("<H2") > -1)
			{
				lineString = lineString.replaceAll("<H2", "<A NAME=\"link" + linkCounter + "\" ID=\"link" + linkCounter + "\"></A><H2");				
				linkCounter ++;	
			}
			else if (lineString.indexOf("<H3") > -1)
			{
				lineString = lineString.replaceAll("<H3", "<A NAME=\"link" + linkCounter + "\" ID=\"link" + linkCounter + "\"></A><H3");				
				linkCounter ++;	
			}
			else if (lineString.indexOf("<H4") > -1)
			{
				lineString = lineString.replaceAll("<H4", "<A NAME=\"link" + linkCounter + "\" ID=\"link" + linkCounter + "\"></A><H4");				
				linkCounter ++;	
			}
			
			modifiedHtmlContent.append(lineString + System.getProperty("line.separator"));		
		}		
		return modifiedHtmlContent.toString();
	}

	public static String readFileIntoString(File aFile) throws Exception
	{
		StringBuffer contents 	= new StringBuffer();
	    BufferedReader input 	= null;
	    try 
	    {	     
	    	input 				= new BufferedReader( new FileReader(aFile) );
	    	String line 		= null;
	      
	    	while (( line = input.readLine()) != null)
	    	{
	    		contents.append(line);
	    		contents.append(System.getProperty("line.separator"));
	    	}
	    }
	    catch (Exception e) 
	    {
	    	throw (e);
	    }	  
	    finally 
	    {
	    	if (input!= null) 
    		{	         
    			input.close();
    		}		   
	    }
	    return contents.toString();
	}
	
	public static void writeStringToFile(File aFile, String aContents) throws FileNotFoundException, IOException
	{		
		if (aFile == null) 
		{
			throw new IllegalArgumentException("File should not be null.");
		}
		if (!aFile.exists()) 
		{
			throw new FileNotFoundException ("File does not exist: " + aFile);
		}
		if (!aFile.isFile()) 
		{
			throw new IllegalArgumentException("Should not be a directory: " + aFile);
		}
		if (!aFile.canWrite()) 
		{
			throw new IllegalArgumentException("File cannot be written: " + aFile);
		}
		
		Writer output = null;
		
		try 
		{		
			output = new BufferedWriter( new FileWriter(aFile) );
			output.write( aContents );
		}
		finally 
		{		
			if (output != null)
			{
				output.close();
			}
		}		
	}
	
	public static void listChildren(Element aParentElement)
	{
		if (aParentElement == null)
		{
			logger.info("The supplied Element was null");
		}
		else
		{
			logger.info("Children to " + aParentElement.getNamespacePrefix() + ":" + aParentElement.getName() + ": ");
			logger.info("---------------------------------");
			List children 		= aParentElement.getChildren();		
			Iterator it 		= children.iterator();		
			while(it.hasNext())
			{
				Element child = (Element)it.next();
				logger.info(child.getNamespacePrefix() + ":" + child.getName() + "=" + child.getText());
			}
			logger.info("---------------------------------");
		}
	}

	public static void convertDocument(File aInputFile, File aOutputFile, OpenOfficeConnection aConnection)
	{							
		String fileType = "";
		fileType 		= aOutputFile.getAbsolutePath().substring(aOutputFile.getAbsolutePath().lastIndexOf(".") + 1);
		
		logger.info("Converting document to " + fileType + "...");

		//--------------------------------------------
		// Connect to server and create the converter
		//--------------------------------------------
		
		DocumentConverter converter = new OpenOfficeDocumentConverter(aConnection); 
				
		//---------------------------------------------
		// Convert the document to the selected format
		//---------------------------------------------
		
		logger.info("Converting from " + aInputFile.getPath() + " to " + aOutputFile.getPath());
		
		converter.convert(aInputFile, aOutputFile);
		
		logger.info("Conversion complete");
	}
	
	public static File extractContentXml(File aOdtFile, String aTargetDirectory) throws ZipException, IOException
	{
		logger.info("Target directory for content.xml: " + aTargetDirectory);
		
		File contentXmlFile = null;
		ZipFile  zipFile 	= new ZipFile(aOdtFile);		
		Enumeration entries = zipFile.entries();

		while(entries.hasMoreElements()) 
		{			
			ZipEntry entry = (ZipEntry)entries.nextElement();
			
			if (entry.getName().equals("content.xml"))
			{	
				logger.info("Found the content.xml file.");
				
				contentXmlFile = new File(aTargetDirectory + File.separator + entry.getName());
				
				logger.info("Copying entry " + entry.getName() + " from ODT file to " + contentXmlFile.getPath());
				
				copyInputStream(zipFile.getInputStream(entry), new BufferedOutputStream(new FileOutputStream(contentXmlFile)));
				
				logger.info("Success!");
				
				break;
			}			
		}	
		zipFile.close();
		
		logger.info("Content XML extraction successful.");
		
		return(contentXmlFile);
	}
	
	public static final void copyInputStream(InputStream in, OutputStream out) throws IOException
	{
		byte[] buffer = new byte[1024];
	    int len;

	    while((len = in.read(buffer)) >= 0)
	    {
	    	out.write(buffer, 0, len);
	    }
	    
	    in.close();
	    out.close();
	}
}