/*
* $Header: /home/cvs/jakarta-commons-sandbox/jelly/src/java/org/apache/commons/jelly/tags/xml/ParseTag.java,v 1.9 2002/06/26 09:24:35 jstrachan Exp $
* $Revision: 1.9 $
* $Date: 2002/06/26 09:24:35 $
*
* ====================================================================
*
* The Apache Software License, Version 1.1
*
* Copyright (c) 1999-2002 The Apache Software Foundation. All rights
* reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
*
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
*
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in
* the documentation and/or other materials provided with the
* distribution.
*
* 3. The end-user documentation included with the redistribution, if
* any, must include the following acknowlegement:
* "This product includes software developed by the
* Apache Software Foundation (http://www.apache.org/)."
* Alternately, this acknowlegement may appear in the software itself,
* if and wherever such third-party acknowlegements normally appear.
*
* 4. The names "The Jakarta Project", "Commons", and "Apache Software
* Foundation" must not be used to endorse or promote products derived
* from this software without prior written permission. For written
* permission, please contact apache@apache.org.
*
* 5. Products derived from this software may not be called "Apache"
* nor may "Apache" appear in their names without prior written
* permission of the Apache Group.
*
* THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
* DISCLAIMED. IN NO EVENT SHALL THE APACHE SOFTWARE FOUNDATION OR
* ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
* USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
* ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
* OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
* SUCH DAMAGE.
* ====================================================================
*
* This software consists of voluntary contributions made by many
* individuals on behalf of the Apache Software Foundation. For more
* information on the Apache Software Foundation, please see
* <http://www.apache.org/>.
*
* $Id: ParseTag.java,v 1.9 2002/06/26 09:24:35 jstrachan Exp $
*/
package org.apache.commons.jelly.tags.html;
import org.apache.commons.jelly.XMLOutput;
import org.apache.commons.jelly.tags.xml.ParseTagSupport;
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.cyberneko.html.parsers.SAXParser;
import org.dom4j.Document;
import org.dom4j.io.SAXReader;
/**
 * Jelly tag that parses HTML into a dom4j {@link Document} and stores the
 * result in the context variable named by the <code>var</code> attribute.
 * <p>
 * When the <code>html</code> property has been set, its value is passed to
 * the inherited <code>parse(Object)</code> method; otherwise the body of the
 * tag is parsed via the inherited <code>parseBody(XMLOutput)</code> method.
 * The parsing itself is done by a NekoHTML SAX parser, see
 * {@link #createSAXReader()}.
 *
 * @author <a href="mailto:jstrachan@apache.org">James Strachan</a>
 * @version $Revision: 1.9 $
 */
public class ParseTag extends ParseTagSupport {

    /** The Log to which logging calls will be made. */
    private static final Log log = LogFactory.getLog(ParseTag.class);

    /**
     * NekoHTML property identifiers controlling the case of element and
     * attribute names; they are applied in this order.
     */
    private static final String[] NAME_CASE_PROPERTIES = {
        "http://cyberneko.org/html/properties/names/elems",
        "http://cyberneko.org/html/properties/names/attrs"
    };

    /**
     * Value assigned to every entry of {@link #NAME_CASE_PROPERTIES}. Per the
     * NekoHTML documentation, "match" leaves names in the case used by the
     * source document.
     */
    private static final String NAME_CASE_SETTING = "match";

    /**
     * The source of the HTML, e.g. a String URI, a Reader or an InputStream.
     * A <code>null</code> value means the tag body is parsed instead.
     */
    private Object html;

    /** Creates a tag with no explicit HTML source. */
    public ParseTag() {
        super();
    }

    // Tag interface
    //-------------------------------------------------------------------------

    /**
     * Parses the HTML and binds the resulting document to the variable named
     * by the <code>var</code> attribute.
     *
     * @param output the output handed to <code>parseBody</code> when no
     *        explicit <code>html</code> source has been set
     * @throws IllegalArgumentException if the <code>var</code> attribute is null
     * @throws Exception if the inherited parsing methods fail
     */
    public void doTag(XMLOutput output) throws Exception {
        // Fail before any parsing work when there is nowhere to store the result.
        if (getVar() == null) {
            throw new IllegalArgumentException("The var attribute cannot be null");
        }

        // An explicit source takes precedence over the tag body.
        Document parsed = (html != null) ? parse(html) : parseBody(output);

        context.setVariable(getVar(), parsed);
    }

    // Properties
    //-------------------------------------------------------------------------

    /**
     * Sets the source of the HTML, e.g. a String URI, Reader or InputStream.
     *
     * @param html the HTML source, or <code>null</code> to parse the tag body
     */
    public void setHtml(Object html) {
        this.html = html;
    }

    // Implementation methods
    //-------------------------------------------------------------------------

    /**
     * Factory method creating the {@link SAXReader} used for parsing. The
     * reader wraps a NekoHTML {@link SAXParser} whose element and attribute
     * name properties are both set to "match".
     *
     * @return a new SAXReader backed by the configured NekoHTML parser
     * @throws Exception if the parser rejects one of the properties
     */
    protected SAXReader createSAXReader() throws Exception {
        // installs the NekoHTML parser
        SAXParser nekoParser = new SAXParser();
        for (int i = 0; i < NAME_CASE_PROPERTIES.length; i++) {
            nekoParser.setProperty(NAME_CASE_PROPERTIES[i], NAME_CASE_SETTING);
        }
        return new SAXReader(nekoParser);
    }
}