1 /*
2 * $Header: /home/cvs/jakarta-commons-sandbox/jelly/src/java/org/apache/commons/jelly/tags/xml/ParseTag.java,v 1.9 2002/06/26 09:24:35 jstrachan Exp $
3 * $Revision: 1.9 $
4 * $Date: 2002/06/26 09:24:35 $
5 *
6 * ====================================================================
7 *
8 * The Apache Software License, Version 1.1
9 *
10 * Copyright (c) 1999-2002 The Apache Software Foundation. All rights
11 * reserved.
12 *
13 * Redistribution and use in source and binary forms, with or without
14 * modification, are permitted provided that the following conditions
15 * are met:
16 *
17 * 1. Redistributions of source code must retain the above copyright
18 * notice, this list of conditions and the following disclaimer.
19 *
20 * 2. Redistributions in binary form must reproduce the above copyright
21 * notice, this list of conditions and the following disclaimer in
22 * the documentation and/or other materials provided with the
23 * distribution.
24 *
25 * 3. The end-user documentation included with the redistribution, if
26 * any, must include the following acknowlegement:
27 * "This product includes software developed by the
28 * Apache Software Foundation (http://www.apache.org/)."
29 * Alternately, this acknowlegement may appear in the software itself,
30 * if and wherever such third-party acknowlegements normally appear.
31 *
32 * 4. The names "The Jakarta Project", "Commons", and "Apache Software
33 * Foundation" must not be used to endorse or promote products derived
34 * from this software without prior written permission. For written
35 * permission, please contact apache@apache.org.
36 *
37 * 5. Products derived from this software may not be called "Apache"
38 * nor may "Apache" appear in their names without prior written
39 * permission of the Apache Group.
40 *
41 * THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
42 * WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
43 * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
44 * DISCLAIMED. IN NO EVENT SHALL THE APACHE SOFTWARE FOUNDATION OR
45 * ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
46 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
47 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
48 * USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
49 * ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
50 * OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
51 * OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
52 * SUCH DAMAGE.
53 * ====================================================================
54 *
55 * This software consists of voluntary contributions made by many
56 * individuals on behalf of the Apache Software Foundation. For more
57 * information on the Apache Software Foundation, please see
58 * <http://www.apache.org/>.
59 *
60 * $Id: ParseTag.java,v 1.9 2002/06/26 09:24:35 jstrachan Exp $
61 */
62 package org.apache.commons.jelly.tags.html;
63
64 import org.apache.commons.jelly.XMLOutput;
65 import org.apache.commons.jelly.tags.xml.ParseTagSupport;
66
67 import org.apache.commons.logging.Log;
68 import org.apache.commons.logging.LogFactory;
69
70 import org.cyberneko.html.parsers.SAXParser;
71
72 import org.dom4j.Document;
73 import org.dom4j.io.SAXReader;
74
75
76 /*** A tag which parses some HTML and defines a variable with the parsed Document.
77 * The HTML can either be specified as its body or can be passed in via the
78 * html property which can be a Reader, InputStream, URL or String URI.
79 *
80 * @author <a href="mailto:jstrachan@apache.org">James Strachan</a>
81 * @version $Revision: 1.9 $
82 */
83 public class ParseTag extends ParseTagSupport {
84
85 /*** The Log to which logging calls will be made. */
86 private static final Log log = LogFactory.getLog(ParseTag.class);
87
88 /*** The HTML to parse, either a String URI, a Reader or InputStream */
89 private Object html;
90
91 public ParseTag() {
92 }
93
94 // Tag interface
95 //-------------------------------------------------------------------------
96 public void doTag(XMLOutput output) throws Exception {
97 if (getVar() == null) {
98 throw new IllegalArgumentException("The var attribute cannot be null");
99 }
100 Document document = null;
101 if (html == null) {
102 document = parseBody(output);
103 }
104 else {
105 document = parse(html);
106 }
107 context.setVariable(getVar(), document);
108 }
109
110 // Properties
111 //-------------------------------------------------------------------------
112 /*** Sets the source of the HTML which is either a String URI, Reader or InputStream */
113 public void setHtml(Object html) {
114 this.html = html;
115 }
116
117
118 // Implementation methods
119 //-------------------------------------------------------------------------
120
121 /***
122 * Factory method to create a new SAXReader
123 */
124 protected SAXReader createSAXReader() throws Exception {
125 // installs the NeckHTML parser
126 SAXParser parser = new SAXParser();
127 parser.setProperty(
128 "http://cyberneko.org/html/properties/names/elems",
129 "match"
130 );
131 parser.setProperty(
132 "http://cyberneko.org/html/properties/names/attrs",
133 "match"
134 );
135 return new SAXReader( parser );
136 }
137 }
This page was automatically generated by Maven