1 /*
2 * $Id: HtmlParser.java 3373 2008-05-12 16:21:24Z xlv $
3 *
4 * Copyright 2001, 2002 by Bruno Lowagie.
5 *
6 * The contents of this file are subject to the Mozilla Public License Version 1.1
7 * (the "License"); you may not use this file except in compliance with the License.
8 * You may obtain a copy of the License at http://www.mozilla.org/MPL/
9 *
10 * Software distributed under the License is distributed on an "AS IS" basis,
11 * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
12 * for the specific language governing rights and limitations under the License.
13 *
14 * The Original Code is 'iText, a free JAVA-PDF library'.
15 *
16 * The Initial Developer of the Original Code is Bruno Lowagie. Portions created by
17 * the Initial Developer are Copyright (C) 1999, 2000, 2001, 2002 by Bruno Lowagie.
18 * All Rights Reserved.
19 * Co-Developer of the code is Paulo Soares. Portions created by the Co-Developer
20 * are Copyright (C) 2000, 2001, 2002 by Paulo Soares. All Rights Reserved.
21 *
22 * Contributor(s): all the names of the contributors are added in the source code
23 * where applicable.
24 *
25 * Alternatively, the contents of this file may be used under the terms of the
26 * LGPL license (the "GNU LIBRARY GENERAL PUBLIC LICENSE"), in which case the
27 * provisions of LGPL are applicable instead of those above. If you wish to
28 * allow use of your version of this file only under the terms of the LGPL
29 * License and not to allow others to use your version of this file under
30 * the MPL, indicate your decision by deleting the provisions above and
31 * replace them with the notice and other provisions required by the LGPL.
32 * If you do not delete the provisions above, a recipient may use your version
33 * of this file under either the MPL or the GNU LIBRARY GENERAL PUBLIC LICENSE.
34 *
35 * This library is free software; you can redistribute it and/or modify it
36 * under the terms of the MPL as stated above or under the terms of the GNU
37 * Library General Public License as published by the Free Software Foundation;
38 * either version 2 of the License, or any later version.
39 *
40 * This library is distributed in the hope that it will be useful, but WITHOUT
41 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
42 * FOR A PARTICULAR PURPOSE. See the GNU Library general Public License for more
43 * details.
44 *
45 * If you didn't download this code from the following link, you should check if
46 * you aren't using an obsolete version:
47 * http://www.lowagie.com/iText/
48 */
49
50 package com.lowagie.text.html;
51
52 import java.io.IOException;
53 import java.io.InputStream;
54 import java.io.Reader;
55
56 import org.xml.sax.InputSource;
57 import org.xml.sax.SAXException;
58
59 import com.lowagie.text.DocListener;
60 import com.lowagie.text.ExceptionConverter;
61 import com.lowagie.text.xml.XmlParser;
62
63 /**
64 * This class can be used to parse some HTML files.
65 */
66
67 public class HtmlParser extends XmlParser {
68
69 /**
70 * Constructs an HtmlParser.
71 */
72
73 public HtmlParser() {
74 super();
75 }
76
77 /**
78 * Parses a given file.
79 * @param document the document the parser will write to
80 * @param is the InputSource with the content
81 */
82
83 public void go(DocListener document, InputSource is) {
84 try {
85 parser.parse(is, new SAXmyHtmlHandler(document));
86 }
87 catch(SAXException se) {
88 throw new ExceptionConverter(se);
89 }
90 catch(IOException ioe) {
91 throw new ExceptionConverter(ioe);
92 }
93 }
94
95 /**
96 * Parses a given file that validates with the iText DTD and writes the content to a document.
97 * @param document the document the parser will write to
98 * @param is the InputSource with the content
99 */
100
101 public static void parse(DocListener document, InputSource is) {
102 HtmlParser p = new HtmlParser();
103 p.go(document, is);
104 }
105
106 /**
107 * Parses a given file.
108 * @param document the document the parser will write to
109 * @param file the file with the content
110 */
111
112 public void go(DocListener document, String file) {
113 try {
114 parser.parse(file, new SAXmyHtmlHandler(document));
115 }
116 catch(SAXException se) {
117 throw new ExceptionConverter(se);
118 }
119 catch(IOException ioe) {
120 throw new ExceptionConverter(ioe);
121 }
122 }
123
124 /**
125 * Parses a given file that validates with the iText DTD and writes the content to a document.
126 * @param document the document the parser will write to
127 * @param file the file with the content
128 */
129
130 public static void parse(DocListener document, String file) {
131 HtmlParser p = new HtmlParser();
132 p.go(document, file);
133 }
134
135 /**
136 * Parses a given file.
137 * @param document the document the parser will write to
138 * @param is the InputStream with the content
139 */
140
141 public void go(DocListener document, InputStream is) {
142 try {
143 parser.parse(new InputSource(is), new SAXmyHtmlHandler(document));
144 }
145 catch(SAXException se) {
146 throw new ExceptionConverter(se);
147 }
148 catch(IOException ioe) {
149 throw new ExceptionConverter(ioe);
150 }
151 }
152
153 /**
154 * Parses a given file that validates with the iText DTD and writes the content to a document.
155 * @param document the document the parser will write to
156 * @param is the InputStream with the content
157 */
158
159 public static void parse(DocListener document, InputStream is) {
160 HtmlParser p = new HtmlParser();
161 p.go(document, new InputSource(is));
162 }
163
164 /**
165 * Parses a given file.
166 * @param document the document the parser will write to
167 * @param is the Reader with the content
168 */
169
170 public void go(DocListener document, Reader is) {
171 try {
172 parser.parse(new InputSource(is), new SAXmyHtmlHandler(document));
173 }
174 catch(SAXException se) {
175 throw new ExceptionConverter(se);
176 }
177 catch(IOException ioe) {
178 throw new ExceptionConverter(ioe);
179 }
180 }
181
182 /**
183 * Parses a given file that validates with the iText DTD and writes the content to a document.
184 * @param document the document the parser will write to
185 * @param is the Reader with the content
186 */
187
188 public static void parse(DocListener document, Reader is) {
189 HtmlParser p = new HtmlParser();
190 p.go(document, new InputSource(is));
191 }
192 }