Source Code of org.infoglue.cms.util.DocumentConverterHelper

/* ===============================================================================
 *
 * Part of the InfoGlue Content Management Platform (www.infoglue.org)
 *
 * ===============================================================================
 *
 *  Copyright (C)
 * 
 * This program is free software; you can redistribute it and/or modify it under
 * the terms of the GNU General Public License version 2, as published by the
 * Free Software Foundation. See the file LICENSE.html for more information.
 * 
 * This program is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY, including the implied warranty of MERCHANTABILITY or FITNESS
 * FOR A PARTICULAR PURPOSE. See the GNU General Public License for more details.
 * 
 * You should have received a copy of the GNU General Public License along with
 * this program; if not, write to the Free Software Foundation, Inc. / 59 Temple
 * Place, Suite 330 / Boston, MA 02111-1307 / USA.
 *
 * ===============================================================================
 */


package org.infoglue.cms.util;


import java.io.BufferedOutputStream;
import java.io.BufferedReader;
import java.io.BufferedWriter;
import java.io.File;
import java.io.FileNotFoundException;
import java.io.FileOutputStream;
import java.io.FileReader;
import java.io.FileWriter;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.io.Writer;
import java.util.Enumeration;
import java.util.Iterator;
import java.util.List;
import java.util.StringTokenizer;
import java.util.zip.ZipEntry;
import java.util.zip.ZipException;
import java.util.zip.ZipFile;


import javax.servlet.http.HttpServletRequest;


import org.apache.log4j.Logger;
import org.infoglue.deliver.applications.databeans.ConvertedDocumentBean;
import org.jdom.Document;
import org.jdom.Element;
import org.jdom.Namespace;
import org.jdom.input.SAXBuilder;
import org.jdom.xpath.XPath;


import com.artofsolving.jodconverter.DocumentConverter;
import com.artofsolving.jodconverter.openoffice.connection.OpenOfficeConnection;
import com.artofsolving.jodconverter.openoffice.connection.SocketOpenOfficeConnection;
import com.artofsolving.jodconverter.openoffice.converter.OpenOfficeDocumentConverter;


public class DocumentConverterHelper 
{
  private final static Logger logger   = Logger.getLogger(DocumentConverterHelper.class.getName());
  private static Namespace officeNs   = Namespace.getNamespace("office", "urn:oasis:names:tc:opendocument:xmlns:office:1.0");
  private static Namespace textNs   = Namespace.getNamespace("text", "urn:oasis:names:tc:opendocument:xmlns:text:1.0");
  
  public ConvertedDocumentBean convert(HttpServletRequest request, File aDocFile, String aTitle, String aMenuTextLength, List aCssList, String rewrite, String keepMenuExpanded) 
  {
    ConvertedDocumentBean convertedDocument = new ConvertedDocumentBean();
    int menuMaxLength            = 20;
    
    logger.info("-----------------------------------------------");
    logger.info("Doc file: " + aDocFile.getAbsolutePath());
    logger.info("Title: " + aTitle);
    logger.info("Menu text length: " + aMenuTextLength);
    logger.info("CSS list: " + aCssList);
    logger.info("Rewrite: " + rewrite);
    logger.info("-----------------------------------------------");
    
    try
    {      
      if (aTitle == null || aTitle.trim().equals(""))
      {
        aTitle = "Inneh�llsf�rteckning";
      }
      
      if (aMenuTextLength == null || aMenuTextLength.trim().equals(""))
      {
        aMenuTextLength = "20";
      }
      
      try
      {
        menuMaxLength = new Integer(aMenuTextLength).intValue();
      }
      catch(NumberFormatException nfe)
      {
        // Do nothing. Use the default value of 20 instead.
      }
      
      OpenOfficeConnection connection = new SocketOpenOfficeConnection(8100);      
      
      //------------------------
      // Setup the output files
      //------------------------
      
      String fileName     = aDocFile.getName().substring(0, aDocFile.getName().indexOf("."));
      int idIndex       = fileName.indexOf("_");
      String digitalAssetPath = CmsPropertyHandler.getDigitalAssetPath();
      String folderName    = "";
      
      if(idIndex > -1)
      {
        String fileIdString = fileName.substring(0, idIndex);
        int fileId       = Integer.parseInt(fileIdString);
        folderName   = "" + (fileId / 1000);
        digitalAssetPath  = digitalAssetPath + File.separator + folderName;
      }
                
      //----------------------------------------
      // Add the name of the folder to the path
      //----------------------------------------
      
      digitalAssetPath     = digitalAssetPath + File.separator + fileName;
      
      logger.info("Directory to write files to: " + digitalAssetPath);      
      
      //-------------------------------------------------
      // Add a folder where the files are to be written.
      //-------------------------------------------------
      
      String newFilePath     = digitalAssetPath + File.separator + fileName;
            
      File pdfFile       = new File(newFilePath + ".pdf");
      File odtFile       = new File(newFilePath + ".odt");
      File htmlFile       = new File(newFilePath + ".html");
      File contentXmlFile   = new File(digitalAssetPath + File.separator + "content.xml");;
      
      //----------------------------------------------
      // Check if the doc has already been converted.
      // If it has, we don't need another conversion.
      //----------------------------------------------
      
      File documentDir = new File(digitalAssetPath);
      if (!documentDir.exists() || rewrite.equals("true"))
      {
        logger.info("The directory " + digitalAssetPath + " does not exist. Creating it.");
        
        documentDir.mkdir();
        
        logger.info("The directory " + digitalAssetPath + " was successfully created.");
        
        logger.info("Connecting to server...");                
        
        connection.connect();
        
        logger.info("Connection ok");
        
        logger.info("Conversion START");
          
        convertDocument(aDocFile, htmlFile, connection);
        if(!aDocFile.getName().substring(aDocFile.getName().indexOf(".") + 1).equalsIgnoreCase("odt"))
        {
          convertDocument(aDocFile, odtFile, connection);
        }
        else
        {
          odtFile = aDocFile;
        }


        convertDocument(aDocFile, pdfFile, connection);
        connection.disconnect();
        
        logger.info("Conversion END");      
        
        //------------------------------------------------
        // Extract the content.xml file from the ODT file
        // so we can parse the XML and generate the TOC
        //------------------------------------------------
        
        logger.info("Extracting content.xml...");
        
        logger.info("odtFile: " + odtFile.getPath());
        
        logger.info("target path: : " + digitalAssetPath);
        
        contentXmlFile = extractContentXml(odtFile, digitalAssetPath);
        
        logger.info("Done extracting content.xml");
        
        //--------------------------------------------------------
        // Insert the anchors, remove the TOC, remove CSS styles
        // and add a link to the CMS-CSS to the the HTML handbook
        // (Since we've just generated a new nav above)
        //--------------------------------------------------------
        
        logger.info("Updating handbook with extra info");
        
        adaptHandbook(htmlFile, aCssList);
        
        logger.info("Done updating handbook with extra info");
      }
      //--------------------------------
      // Get the URL:s to the resources
      //--------------------------------
      
      logger.info("Extracting URL:s to resources.");
      
      String digitalAssetUrl = CmsPropertyHandler.getDigitalAssetBaseUrl();
      
      //----------------------------------------------------------------
      // Add the contextPath to the URL to avoid problems with niceURIs.
      //-----------------------------------------------------------------
      
      String contextPath = request.getContextPath();
      
      digitalAssetUrl = contextPath + "/" + digitalAssetUrl;
      
      //--------------------------------
      // Add the folder name to the URL
      //--------------------------------
      
      if (!folderName.equals(""))
      {
        digitalAssetUrl = digitalAssetUrl + "/" + folderName;
      }
            
      String htmlFileUrl   = digitalAssetUrl + "/" + fileName + "/" + htmlFile.getName();
      String pdfFileUrl  = digitalAssetUrl + "/" + fileName + "/" + pdfFile.getName();
      String odtFileUrl  = digitalAssetUrl + "/" + fileName + "/" + odtFile.getName();
      
      logger.info("htmlFileUrl: " + htmlFileUrl);
      logger.info("pdfFileUrl: " + pdfFileUrl);
      logger.info("odtFileUrl: " + odtFileUrl);
      
      //--------------------------
      // Generate HTML TOC string
      //--------------------------
      
      logger.info("Generating TOC...");
      
      String tocString   = generateHtmlToc(contentXmlFile, htmlFileUrl, aTitle, menuMaxLength, keepMenuExpanded);


      logger.info("Done generating TOC");
      
      convertedDocument.setHtmlFileUrl(htmlFileUrl);
      convertedDocument.setPdfFileUrl(pdfFileUrl);
      convertedDocument.setOdtFileUrl(odtFileUrl);
      convertedDocument.setTocString(tocString);
    }
    catch(Exception e)
    {
      logger.error("An error occurred when converting document:" + e.getMessage(), e);
    }
    
    logger.info("END");
    
    return convertedDocument;
  }
  
  private static String generateHtmlToc(File aContentXmlFile, String aHtmlFileUrl, String aTitle, int aMenuMaxLength, String keepMenuExpanded) throws Exception 
  {    
    logger.info("Start generating HTML TOC: xmlFile: " + aContentXmlFile.getPath() + ", htmlFileUrl: " + aHtmlFileUrl);
    
    SAXBuilder builder   = new SAXBuilder();
    Document doc     = builder.build(aContentXmlFile);
    List tocElements  = null;
    
    //--------------------------------------------------------------
    // Find the element in the XML containing the Table Of Contents
    //--------------------------------------------------------------
    
    try
    {
      XPath xpath           = XPath.newInstance("/descendant::text:index-body[1]");
      xpath.addNamespace(officeNs);
      xpath.addNamespace(textNs);
      
      Object temp            = xpath.selectSingleNode(doc);
      
      if (temp != null)
      {
        Element textIndexBodyElement   = (Element)temp;
        tocElements            = textIndexBodyElement.getChildren();
      }      
    }
    catch(Exception e)
    {
      throw new Exception("The document structure is incorrect. Please create a document containing a table of contents. " + e.getMessage());
    }
    
    //------------------------------------
    // Generate the HTML for the TOC menu
    //------------------------------------
    
    if (tocElements != null)
    {
      logger.info("Found TOC elements, generating TOC.");
      StringBuffer htmlMenuSb = new StringBuffer();      
      generateHtml(tocElements.toArray(), htmlMenuSb, aHtmlFileUrl, aTitle, aMenuMaxLength, keepMenuExpanded);    
      return htmlMenuSb.toString();
    }
    else
    {
      throw new Exception ("The list of TOC elements was null.");
    }
  }


  private static StringBuffer generateHtml(Object[] aTocElements, StringBuffer aReturnSb, String aHtmlFileUrl, String aTitle, int aMenuMaxLength, String keepMenuExpanded) throws Exception 
  {        
    Element child           = null;
    Element grandChild        = null;
    String elementText        = "";    
    String headingNumber      = "";
    int startPosition         = 0;
    String previousHeadingNumber   = ""; 
    int level            = 0;
    int previousLevel        = 0;
    int numberOfEndUls         = 0;
    StringTokenizer st        = null;
    int linkCounter          = 0;    
    String croppedElementText    = "";
    int cropCounter          = 0;
    boolean willCrop        = false;
    
    boolean keepMenuExpandedBoolean = "true".equalsIgnoreCase(keepMenuExpanded);
    
    String javaScriptToExpandAndCollapse;
    StringBuilder headingIds = new StringBuilder();
    
    if(keepMenuExpandedBoolean)
    {
      javaScriptToExpandAndCollapse = "\n<script type='text/javascript'> \n" +
      "function expandOrCollapse(id, eventHandle){ \n" +
      "if (!eventHandle) var eventHandle = window.event; \n" +
      "if (eventHandle) eventHandle.cancelBubble = true; \n" +
      "if (eventHandle.stopPropagation) eventHandle.stopPropagation();\n" +
      "var theElement = document.getElementById(id); \n" +
      "if ( theElement == null ) \n" +
      "{return;} \n" +
      "var listElementStyle=theElement.style; \n" +
      "if (listElementStyle.display!='none') \n" +
      "{listElementStyle.display='none';} \n" +
      "else \n" +
      "{listElementStyle.display='block';} \n" +
      "} \n" +
      "</script>\n";
    }
    else
    {    
      for(Object tmpChild : aTocElements)
      {
        if(tmpChild != null && !((Element)tmpChild).getText().equals(""))
        {
          String tmp = ((Element)tmpChild).getText().substring(0, ((Element)tmpChild).getText().indexOf(" ")).replace(".", "");
          
          headingIds.append(tmp);
          headingIds.append(",");
        }
        else if (((Element)tmpChild).getText() == null || ((Element)tmpChild).getText().equals(""))
        {
          grandChild = ((Element)tmpChild).getChild("a", textNs);
          
          if (grandChild != null && grandChild.getText().indexOf(" ") != -1)
          {
            String tmp = grandChild.getText().substring(0, grandChild.getText().indexOf(" ")).replace(".", "");
            headingIds.append(tmp);
            headingIds.append(",");
          }
        }
      }
      
      javaScriptToExpandAndCollapse =
      "\n<script type='text/javascript'> \n" +
      "String.prototype.startsWith = function(prefix) {return this.indexOf(prefix) === 0;}\n" +
      "function expandOrCollapse(id, eventHandle){ \n" +
      "if (!eventHandle) var eventHandle = window.event; \n" +
      "if (eventHandle) eventHandle.cancelBubble = true; \n" +
      "if (eventHandle.stopPropagation) eventHandle.stopPropagation();\n" +
      "var ids = '" + headingIds.toString() + "';\n" +
      "var myArray = ids.split(','); \n" +
      "for(var i=0;i<myArray.length; i++){ \n" +
      "  if(document.getElementById(myArray[i]) != null){\n" +
      "    if(id.startsWith(myArray[i])){\n" +
      "      document.getElementById(myArray[i]).style.display='block';}\n" +
      "    else{document.getElementById(myArray[i]).style.display='none';}\n" +
      "}\n}\n}\n" +
      "</script>\n";
    }
    
    aReturnSb.append(javaScriptToExpandAndCollapse);
    
    aReturnSb.append("<div id=\"submenu\">");
    aReturnSb.append("<div class=\"menuheader\">" + aTitle + "</div>");


    logger.info("TOC generation start. Number of TOC elements: " + aTocElements.length);
    
    while (startPosition < aTocElements.length)
    {    
      logger.info("");
      logger.info("-------------- New TOC element (startPosition: " + startPosition + ") ------------");
      
      child       = (Element)aTocElements[startPosition];
      elementText   = child.getText();  
      
      logger.info("Child name: " + elementText);
    
      //-----------------------------------------------------------------------------
      // If no text was found, check if there is a link-node below this node.
      // If so, use the text from the link node instead. This is necessary to handle 
      // TOCs generated by newer versions of Word.
      //-----------------------------------------------------------------------------
      
      if (elementText == null || elementText.equals(""))
      {
        logger.info("No text found on child, looking for link child instead.");
        
        grandChild = child.getChild("a", textNs);
        
        if (grandChild != null)
        {
          elementText = grandChild.getText();  
        
          logger.info("Grandchild text: " + elementText);
        }
        else
        {
          logger.info("No grandchild was found...");
        }
      }
      
      if (elementText != null && !elementText.equals("") && elementText.indexOf(" ") != -1)
      {
        headingNumber   = elementText.substring(0, elementText.indexOf(" "));        
        st         = new StringTokenizer(headingNumber, ".");
        level       = st.countTokens();        
        
        logger.info("Heading number: " + headingNumber + ", level: " + level + ", text: " + elementText);
        
        if (level > previousLevel)
        {
          String attributes = previousHeadingNumber.equals("") ? "" : " id='" + previousHeadingNumber.replace(".", "") + "' style=\"display:none\"";
          aReturnSb.append("<ul" + attributes + ">");
        }
        else if(level < previousLevel)
        {
          aReturnSb.append("</li>");
          numberOfEndUls = previousLevel - level;


          for (int i = 0; i < numberOfEndUls; i ++)
          {
            aReturnSb.append("</ul></li>");          
          }
        }
        else
        {
          aReturnSb.append("</li>");
        }
        
        //-----------------------------------------------------------------
        // If there is a page number at the end of the line, get rid of it
        //-----------------------------------------------------------------
        
        cropCounter = elementText.length();
        char myChar = elementText.charAt(cropCounter - 1);
        
        while (cropCounter > 0 && Character.isDigit(myChar))
        {    
          cropCounter --;
          myChar = elementText.charAt(cropCounter);
          willCrop = true;
        }
        
        if (willCrop)
        {
          cropCounter ++;
          logger.info("Removing trailing line number.");
        }
        
        if (cropCounter < elementText.length())
        {
          elementText = elementText.substring(0, cropCounter);
        }
        else
        {
          logger.info("The cropCounter ended up outside the string (cropCounter: " + cropCounter + ", elementText.length: " + elementText.length() + ")");
        }
        //------------------------------------------------------------------------
        // Crop the text and add "..." if it's longer than the allowed max length
        //------------------------------------------------------------------------
        
        if (elementText.length() > aMenuMaxLength)
        {
          logger.info("Text too long, cropping");
          
          croppedElementText = elementText.substring(0, aMenuMaxLength) + "...";
        }
        else
        {
          croppedElementText = elementText;
        }
        
        logger.info("Adding TOC <li> element on level " + level + ": " + croppedElementText + ", linkCounter: " + linkCounter);        
        String onClickExpandOrCollapse = (startPosition + 1) <= aTocElements.length ?  " onclick=\"expandOrCollapse('" + headingNumber.replace(".", "") + "',event);\"" : "";
        String onClickScroll = " onclick=\"window.frames['handbookFrame'].scrollToAnchor('link" + linkCounter + "'); return false;\"";
        
        aReturnSb.append("\n<li" + onClickExpandOrCollapse + "><p><a target=\"handbookFrame\" href=\"" + aHtmlFileUrl + "#link" + linkCounter + "\" title=\"" + elementText + "\"" + onClickScroll + ">" + croppedElementText + "</a></p>");
        previousHeadingNumber   = headingNumber;
        previousLevel       = level;
        linkCounter ++;
      }
      else
      {
        logger.info("This node does not meet the requirements for a TOC element: " + elementText);        
      }
      startPosition = startPosition + 1;
    }
    
    aReturnSb.append("\n</li></ul>");
    logger.info("TOC generation end.");
    
    aReturnSb.append("\n</div>");


    return aReturnSb;    
  }
  
  public static void adaptHandbook(File aHandbookHtmlFile, List aCssList) throws Exception
  {
    String originalHtmlContent     = readFileIntoString(aHandbookHtmlFile);
    String htmlContentWithoutToc  = removeTocFromHtml(originalHtmlContent);
    String htmlContentWithAnchors   = insertAnchorsAndJavaScript(htmlContentWithoutToc);
    String htmlWithProperCss    = fixCss(htmlContentWithAnchors, aCssList);
    writeStringToFile(aHandbookHtmlFile, htmlWithProperCss);
  }
  
  private static String fixCss(String aHtmlContent, List aCssList)
  {    
    logger.info("About to add the CSS links to the page");
    
    StringBuffer sb         = new StringBuffer();    
    int cssStartIndex         = aHtmlContent.indexOf("<STYLE TYPE=\"text/css\">");  
    if (cssStartIndex >= 0)
    {
      String start           = aHtmlContent.substring(0, cssStartIndex);
      String temp           = aHtmlContent.substring(cssStartIndex + 1);
      String end             = temp.substring(temp.indexOf("</STYLE>") + 8);    
      StringBuffer linkedCssString   = new StringBuffer();
      Iterator it           = aCssList.iterator();
      String cssString         = "";
      
      while (it.hasNext())
      {
        cssString = (String)it.next();
        
        logger.info("Adding CSS: " + cssString);
        
        cssString = "<link href=\"" + cssString + "\" rel=\"stylesheet\" type=\"text/css\" />" + '\n';
        linkedCssString.append(cssString);
      }
      
      sb.append(start);
      sb.append(linkedCssString.toString());
      sb.append(end);  
    }
    logger.info("Done adding CSS links.");
    
    return sb.toString();
  }
  
  private static String removeTocFromHtml(String aHtmlContent)
  {
    logger.info("About to remove TOC from HTML");
    
    StringBuffer sb   = new StringBuffer();
    
    int tocStartIndex   = -1;
    
    //--------------------------------------------------
    // Look for the start of the TOC if it's in English
    //--------------------------------------------------
    
    tocStartIndex    = aHtmlContent.indexOf("<DIV ID=\"Table of Contents1\" DIR=\"LTR\">");
    
    //--------------------------------------------------
    // Look for the start of the TOC if it's in Swedish
    //--------------------------------------------------
    
    if (tocStartIndex == -1)
    {
      tocStartIndex  = aHtmlContent.indexOf("<DIV ID=\"Inneh&aring;llsf&ouml;rteckning1\" DIR=\"LTR\">");
    }
    
    if (tocStartIndex > -1)
    {    
      logger.info("The HTML string contains a TOC beginning at position " + tocStartIndex + ". Removing it.");
      
      String start   = aHtmlContent.substring(0, tocStartIndex);
      String temp   = aHtmlContent.substring(tocStartIndex + 1);
      String end     = temp.substring(temp.indexOf("</DIV>") + 6);
      
      sb.append(start);
      sb.append(end);
      
      logger.info("The TOC was succesfully removed.");
    }
    else
    {
      logger.info("No TOC found in the HTML string.");
      
      sb.append(aHtmlContent);
    }
    return sb.toString();
  }


  private static String insertAnchorsAndJavaScript(String aOriginalHtmlContent) 
  {    
    StringBuffer modifiedHtmlContent   = new StringBuffer();
    StringTokenizer st           = new StringTokenizer(aOriginalHtmlContent, System.getProperty("line.separator"));
    String lineString          = "";
    int linkCounter            = 0;
    
    
    
    while (st.hasMoreTokens())
    {
      lineString = st.nextToken();
      
      if(lineString.indexOf("<HEAD>") > -1)
      {
        String str = "\n<script type='text/javascript'> \n" +
        "function scrollToAnchor(anchorID){ \n" +
        "if(anchorID!=null){ \n" +
        "anchorPos = document.getElementById(anchorID).offsetTop;\n" +
        "document.body.scrollTop = anchorPos;}}\n" +
        "</script>";
        
        lineString = lineString.concat(str);
      }
      
      if (lineString.indexOf("<H1") > -1)
      {      
        lineString = lineString.replaceAll("<H1", "<A NAME=\"link" + linkCounter + "\" ID=\"link" + linkCounter + "\"></A><H1");        
        linkCounter ++;  
      }
      else if (lineString.indexOf("<H2") > -1)
      {
        lineString = lineString.replaceAll("<H2", "<A NAME=\"link" + linkCounter + "\" ID=\"link" + linkCounter + "\"></A><H2");        
        linkCounter ++;  
      }
      else if (lineString.indexOf("<H3") > -1)
      {
        lineString = lineString.replaceAll("<H3", "<A NAME=\"link" + linkCounter + "\" ID=\"link" + linkCounter + "\"></A><H3");        
        linkCounter ++;  
      }
      else if (lineString.indexOf("<H4") > -1)
      {
        lineString = lineString.replaceAll("<H4", "<A NAME=\"link" + linkCounter + "\" ID=\"link" + linkCounter + "\"></A><H4");        
        linkCounter ++;  
      }
      
      modifiedHtmlContent.append(lineString + System.getProperty("line.separator"));    
    }    
    return modifiedHtmlContent.toString();
  }


  public static String readFileIntoString(File aFile) throws Exception
  {
    StringBuffer contents   = new StringBuffer();
      BufferedReader input   = null;
      try 
      {       
        input         = new BufferedReader( new FileReader(aFile) );
        String line     = null;
        
        while (( line = input.readLine()) != null)
        {
          contents.append(line);
          contents.append(System.getProperty("line.separator"));
        }
      }
      catch (Exception e) 
      {
        throw (e);
      }    
      finally 
      {
        if (input!= null) 
        {           
          input.close();
        }       
      }
      return contents.toString();
  }
  
  public static void writeStringToFile(File aFile, String aContents) throws FileNotFoundException, IOException
  {    
    if (aFile == null) 
    {
      throw new IllegalArgumentException("File should not be null.");
    }
    if (!aFile.exists()) 
    {
      throw new FileNotFoundException ("File does not exist: " + aFile);
    }
    if (!aFile.isFile()) 
    {
      throw new IllegalArgumentException("Should not be a directory: " + aFile);
    }
    if (!aFile.canWrite()) 
    {
      throw new IllegalArgumentException("File cannot be written: " + aFile);
    }
    
    Writer output = null;
    
    try 
    {    
      output = new BufferedWriter( new FileWriter(aFile) );
      output.write( aContents );
    }
    finally 
    {    
      if (output != null)
      {
        output.close();
      }
    }    
  }
  
  public static void listChildren(Element aParentElement)
  {
    if (aParentElement == null)
    {
      logger.info("The supplied Element was null");
    }
    else
    {
      logger.info("Children to " + aParentElement.getNamespacePrefix() + ":" + aParentElement.getName() + ": ");
      logger.info("---------------------------------");
      List children     = aParentElement.getChildren();    
      Iterator it     = children.iterator();    
      while(it.hasNext())
      {
        Element child = (Element)it.next();
        logger.info(child.getNamespacePrefix() + ":" + child.getName() + "=" + child.getText());
      }
      logger.info("---------------------------------");
    }
  }


  public static void convertDocument(File aInputFile, File aOutputFile, OpenOfficeConnection aConnection)
  {              
    String fileType = "";
    fileType     = aOutputFile.getAbsolutePath().substring(aOutputFile.getAbsolutePath().lastIndexOf(".") + 1);
    
    logger.info("Converting document to " + fileType + "...");


    //--------------------------------------------
    // Connect to server and create the converter
    //--------------------------------------------
    
    DocumentConverter converter = new OpenOfficeDocumentConverter(aConnection); 
        
    //---------------------------------------------
    // Convert the document to the selected format
    //---------------------------------------------
    
    logger.info("Converting from " + aInputFile.getPath() + " to " + aOutputFile.getPath());
    
    converter.convert(aInputFile, aOutputFile);
    
    logger.info("Conversion complete");
  }
  
  public static File extractContentXml(File aOdtFile, String aTargetDirectory) throws ZipException, IOException
  {
    logger.info("Target directory for content.xml: " + aTargetDirectory);
    
    File contentXmlFile = null;
    ZipFile  zipFile   = new ZipFile(aOdtFile);    
    Enumeration entries = zipFile.entries();


    while(entries.hasMoreElements()) 
    {      
      ZipEntry entry = (ZipEntry)entries.nextElement();
      
      if (entry.getName().equals("content.xml"))
      {  
        logger.info("Found the content.xml file.");
        
        contentXmlFile = new File(aTargetDirectory + File.separator + entry.getName());
        
        logger.info("Copying entry " + entry.getName() + " from ODT file to " + contentXmlFile.getPath());
        
        copyInputStream(zipFile.getInputStream(entry), new BufferedOutputStream(new FileOutputStream(contentXmlFile)));
        
        logger.info("Success!");
        
        break;
      }      
    }  
    zipFile.close();
    
    logger.info("Content XML extraction successful.");
    
    return(contentXmlFile);
  }
  
  public static final void copyInputStream(InputStream in, OutputStream out) throws IOException
  {
    byte[] buffer = new byte[1024];
      int len;


      while((len = in.read(buffer)) >= 0)
      {
        out.write(buffer, 0, len);
      }
      
      in.close();
      out.close();
  }
}
Source Code of org.infoglue.cms.util.DocumentConverterHelper

Related Classes of org.infoglue.cms.util.DocumentConverterHelper