/*
* Copyright (C) 2009 eXo Platform SAS.
*
* This is free software; you can redistribute it and/or modify it
* under the terms of the GNU Lesser General Public License as
* published by the Free Software Foundation; either version 2.1 of
* the License, or (at your option) any later version.
*
* This software is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Lesser General Public License for more details.
*
* You should have received a copy of the GNU Lesser General Public
* License along with this software; if not, write to the Free
* Software Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA
* 02110-1301 USA, or see the FSF site: http://www.fsf.org.
*/
package org.exoplatform.services.document.impl;
import org.exoplatform.commons.utils.QName;
import org.exoplatform.services.document.DCMetaData;
import org.exoplatform.services.document.DocumentReadException;
import org.xml.sax.Attributes;
import org.xml.sax.InputSource;
import org.xml.sax.SAXException;
import org.xml.sax.XMLReader;
import org.xml.sax.helpers.DefaultHandler;
import java.io.IOException;
import java.io.InputStream;
import java.util.Properties;
import java.util.zip.ZipEntry;
import java.util.zip.ZipInputStream;
import javax.xml.parsers.ParserConfigurationException;
import javax.xml.parsers.SAXParser;
import javax.xml.parsers.SAXParserFactory;
/**
 * Created by The eXo Platform SAS .
 *
 * Document reader for OpenDocument files. The input is treated as a ZIP archive:
 * text is extracted from the <code>content.xml</code> entry and Dublin Core
 * properties from the <code>meta.xml</code> entry.
 *
 * @author Gennady Azarenkov
 * @version $Id: $
 */
public class OpenOfficeDocumentReader extends BaseDocumentReader
{

   /** Name of the archive entry that holds the document body. */
   private static final String CONTENT_ENTRY = "content.xml";

   /** Name of the archive entry that holds the document metadata. */
   private static final String META_ENTRY = "meta.xml";

   /**
    * Returns the OpenDocument MIME types handled by this reader.
    *
    * @return a new array of MIME type strings
    * @see org.exoplatform.services.document.DocumentReader#getMimeTypes()
    */
   public String[] getMimeTypes()
   {
      return new String[]{"application/vnd.oasis.opendocument.database", "application/vnd.oasis.opendocument.formula",
         "application/vnd.oasis.opendocument.graphics", "application/vnd.oasis.opendocument.presentation",
         "application/vnd.oasis.opendocument.spreadsheet", "application/vnd.oasis.opendocument.text"};
   }

   /**
    * Extracts the text of the <code>content.xml</code> entry of the given archive.
    * The stream is always closed before this method returns.
    *
    * @param is the document stream
    * @return the extracted text, or an empty string when the archive contains no
    *         <code>content.xml</code> entry
    * @throws NullPointerException if <code>is</code> is null
    * @throws IOException if reading the stream fails
    * @throws DocumentReadException if the XML parser cannot be created or the
    *         entry cannot be parsed
    * @see org.exoplatform.services.document.DocumentReader#getContentAsText(java.
    *      io.InputStream)
    */
   public String getContentAsText(InputStream is) throws IOException, DocumentReadException
   {
      if (is == null)
      {
         throw new NullPointerException("InputStream is null.");
      }
      try
      {
         XMLReader xmlReader = newXmlReader();
         ZipInputStream zis = new ZipInputStream(is);
         try
         {
            if (!seekEntry(zis, CONTENT_ENTRY))
            {
               // Empty archive or no content entry: nothing to extract.
               return "";
            }
            OpenOfficeContentHandler contentHandler = new OpenOfficeContentHandler();
            xmlReader.setContentHandler(contentHandler);
            xmlReader.parse(new InputSource(zis));
            return contentHandler.getContent();
         }
         finally
         {
            closeQuietly(zis);
         }
      }
      catch (ParserConfigurationException e)
      {
         throw new DocumentReadException(e.getMessage(), e);
      }
      catch (SAXException e)
      {
         throw new DocumentReadException(e.getMessage(), e);
      }
      finally
      {
         closeQuietly(is);
      }
   }

   /**
    * Same as {@link #getContentAsText(InputStream)}; the encoding argument is ignored.
    *
    * @param is the document stream
    * @param encoding ignored
    * @return the extracted text
    * @throws IOException if reading the stream fails
    * @throws DocumentReadException if the document cannot be parsed
    */
   public String getContentAsText(InputStream is, String encoding) throws IOException, DocumentReadException
   {
      // Ignore encoding
      return getContentAsText(is);
   }

   /**
    * Reads the <code>dc:</code> elements of the <code>meta.xml</code> entry of the
    * given archive. The stream is always closed before this method returns.
    *
    * @param is the document stream
    * @return the collected properties, keyed by {@link QName} in the
    *         {@link DCMetaData#DC_NAMESPACE} namespace; empty when the archive
    *         contains no <code>meta.xml</code> entry
    * @throws IOException if reading the stream fails
    * @throws DocumentReadException if the XML parser cannot be created or the
    *         entry cannot be parsed
    * @see org.exoplatform.services.document.DocumentReader#getProperties(java.io.
    *      InputStream)
    */
   public Properties getProperties(InputStream is) throws IOException, DocumentReadException
   {
      try
      {
         XMLReader xmlReader = newXmlReader();
         ZipInputStream zis = new ZipInputStream(is);
         try
         {
            OpenOfficeMetaHandler metaHandler = new OpenOfficeMetaHandler();
            if (seekEntry(zis, META_ENTRY))
            {
               xmlReader.setContentHandler(metaHandler);
               xmlReader.parse(new InputSource(zis));
            }
            return metaHandler.getProperties();
         }
         finally
         {
            // Closed quietly so a failure here cannot mask an exception thrown while parsing.
            closeQuietly(zis);
         }
      }
      catch (ParserConfigurationException e)
      {
         throw new DocumentReadException(e.getMessage(), e);
      }
      catch (SAXException e)
      {
         throw new DocumentReadException(e.getMessage(), e);
      }
      finally
      {
         closeQuietly(is);
      }
   }

   /**
    * Creates a non-validating XML reader that neither loads external DTDs nor
    * resolves external entities.
    */
   private static XMLReader newXmlReader() throws ParserConfigurationException, SAXException
   {
      SAXParserFactory saxParserFactory = SAXParserFactory.newInstance();
      saxParserFactory.setValidating(false);
      SAXParser saxParser = saxParserFactory.newSAXParser();
      XMLReader xmlReader = saxParser.getXMLReader();
      xmlReader.setFeature("http://xml.org/sax/features/validation", false);
      xmlReader.setFeature("http://apache.org/xml/features/nonvalidating/load-external-dtd", false);
      // Documents come from outside: never let the parser fetch external entities.
      xmlReader.setFeature("http://xml.org/sax/features/external-general-entities", false);
      xmlReader.setFeature("http://xml.org/sax/features/external-parameter-entities", false);
      return xmlReader;
   }

   /**
    * Advances the archive stream to the entry with the given name.
    *
    * @return true if the stream is now positioned at that entry, false if the
    *         archive was exhausted without finding it
    */
   private static boolean seekEntry(ZipInputStream zis, String entryName) throws IOException
   {
      for (ZipEntry ze = zis.getNextEntry(); ze != null; ze = zis.getNextEntry())
      {
         if (entryName.equals(ze.getName()))
         {
            return true;
         }
      }
      return false;
   }

   /**
    * Closes the stream if it is not null, ignoring any failure.
    */
   private static void closeQuietly(InputStream stream)
   {
      if (stream != null)
      {
         try
         {
            stream.close();
         }
         catch (IOException ignored)
         {
            // Best-effort cleanup; the result or the primary exception matters more.
         }
      }
   }

   // --------------------------------------------< OpenOfficeContentHandler >

   /**
    * SAX handler that collects character data found inside elements whose
    * qualified name starts with <code>text:</code>.
    */
   private static class OpenOfficeContentHandler extends DefaultHandler
   {

      private final StringBuilder content = new StringBuilder();

      /**
       * Number of currently open <code>text:</code> elements. A counter is used
       * instead of a flag so that closing a nested or empty element (a span, a
       * tab, a line break) does not stop collection of the text that follows it
       * in the enclosing element.
       */
      private int textDepth;

      public OpenOfficeContentHandler()
      {
         textDepth = 0;
      }

      /**
       * Returns the text content extracted from parsed content.xml
       */
      public String getContent()
      {
         return content.toString();
      }

      @Override
      public void startElement(String namespaceURI, String localName, String rawName, Attributes atts)
         throws SAXException
      {
         if (rawName.startsWith("text:"))
         {
            textDepth++;
         }
      }

      @Override
      public void characters(char[] ch, int start, int length) throws SAXException
      {
         if (textDepth > 0)
         {
            // A single space follows every chunk delivered by the parser.
            content.append(ch, start, length).append(" ");
         }
      }

      @Override
      public void endElement(java.lang.String namespaceURI, java.lang.String localName, java.lang.String qName)
         throws SAXException
      {
         if (qName.startsWith("text:"))
         {
            textDepth--;
         }
      }
   }

   /**
    * SAX handler that stores the character data of every element whose
    * qualified name starts with <code>dc:</code> as a property.
    */
   private static class OpenOfficeMetaHandler extends DefaultHandler
   {

      private final Properties props = new Properties();

      /** Name of the property currently being read, or null outside a dc: element. */
      private QName curPropertyName;

      private final StringBuilder curPropertyValue = new StringBuilder();

      public OpenOfficeMetaHandler()
      {
      }

      /**
       * Returns the properties collected so far.
       */
      public Properties getProperties()
      {
         return props;
      }

      @Override
      public void startElement(String namespaceURI, String localName, String rawName, Attributes atts)
         throws SAXException
      {
         if (rawName.startsWith("dc:"))
         {
            // Strip the "dc:" prefix to obtain the local property name.
            curPropertyName = new QName(DCMetaData.DC_NAMESPACE, rawName.substring(3));
         }
      }

      @Override
      public void characters(char[] ch, int start, int length) throws SAXException
      {
         if (curPropertyName != null)
         {
            curPropertyValue.append(ch, start, length);
         }
      }

      @Override
      public void endElement(java.lang.String namespaceURI, java.lang.String localName, java.lang.String qName)
         throws SAXException
      {
         if (curPropertyName != null)
         {
            props.put(curPropertyName, curPropertyValue.toString());
            // Reset the accumulator for the next property.
            curPropertyValue.setLength(0);
            curPropertyName = null;
         }
      }
   }
}