| java.lang.Object com.caucho.xml.AbstractParser com.caucho.xml.XmlParser com.caucho.xml.LooseHtml
LooseHtml | public class LooseHtml extends XmlParser (Code) | | A forgiving HTML parser interface.
The forgiving HTML parser is useful for extracting information from
the web since many sites have not-quite-standard HTML.
To parse a file into a DOM Document, use:
Document doc = new LooseHtml().parseDocument("foo.html");
To parse a string into a DOM Document, use:
String html = "<h1>small test</h1>";
Document doc = new LooseHtml().parseDocumentString(html);
To parse a file using the SAX API, use:
LooseHtml html = new LooseHtml();
html.setContentHandler(myContentHandler);
html.parse("foo.html");
|
LooseHtml | public LooseHtml()(Code) | | Creates a new forgiving HTML parser.
|
Methods inherited from com.caucho.xml.AbstractParser | void clear()(Code)(Java Doc) public ContentHandler getContentHandler()(Code)(Java Doc) public DTDHandler getDTDHandler()(Code)(Java Doc) public String getDefaultEncoding()(Code)(Java Doc) public boolean getEntitiesAsText()(Code)(Java Doc) public EntityResolver getEntityResolver()(Code)(Java Doc) public ErrorHandler getErrorHandler()(Code)(Java Doc) public boolean getFeature(String name) throws SAXNotRecognizedException(Code)(Java Doc) public boolean getForgiving()(Code)(Java Doc) public boolean getJsp()(Code)(Java Doc) public Object getProperty(String name) throws SAXNotRecognizedException(Code)(Java Doc) public boolean getResinInclude()(Code)(Java Doc) public Path getSearchPath()(Code)(Java Doc) public boolean getSkipComments()(Code)(Java Doc) void init()(Code)(Java Doc) public boolean isCoalescing()(Code)(Java Doc) public boolean isNamespaceAware()(Code)(Java Doc) public boolean isNamespacePrefixes()(Code)(Java Doc) public boolean isSAXNamespaces()(Code)(Java Doc) public boolean isValidating()(Code)(Java Doc) protected InputStream openSource(InputSource source) throws IOException, SAXException(Code)(Java Doc) public InputStream openStream(String systemId, String publicId) throws IOException, SAXException(Code)(Java Doc) public InputStream openStream(String systemId, String publicId, EntityResolver entityResolver) throws IOException, SAXException(Code)(Java Doc) protected InputStream openStream(String systemId, String publicId, EntityResolver entityResolver, boolean isTop) throws IOException, SAXException(Code)(Java Doc) public InputStream openTopStream(String systemId, String publicId) throws IOException, SAXException(Code)(Java Doc) public void parse(InputSource source) throws IOException, SAXException(Code)(Java Doc) public void parse(InputStream is) throws IOException, SAXException(Code)(Java Doc) public void parse(InputStream is, String systemId) throws IOException, SAXException(Code)(Java Doc) public 
void parse(String systemId) throws IOException, SAXException(Code)(Java Doc) public void parse(Path path) throws IOException, SAXException(Code)(Java Doc) public Document parseDocument(InputSource source) throws IOException, SAXException(Code)(Java Doc) public Document parseDocument(String systemId) throws IOException, SAXException(Code)(Java Doc) public Document parseDocument(Path path) throws IOException, SAXException(Code)(Java Doc) public Document parseDocument(InputStream is) throws IOException, SAXException(Code)(Java Doc) public Document parseDocument(InputStream is, String systemId) throws IOException, SAXException(Code)(Java Doc) public void parseDocument(QDocument doc, InputStream is, String systemId) throws IOException, SAXException(Code)(Java Doc) public Document parseDocumentString(String string) throws IOException, SAXException(Code)(Java Doc) public void parseImpl(InputStream is, String systemId) throws IOException, SAXException(Code)(Java Doc) abstract Document parseInt(ReadStream is) throws IOException, SAXException(Code)(Java Doc) public void parseString(String string) throws IOException, SAXException(Code)(Java Doc) public void setAutodetectXml(boolean autodetectXml)(Code)(Java Doc) public void setCoalescing(boolean isCoalescing)(Code)(Java Doc) public void setConfig(DocumentBuilderFactory factory)(Code)(Java Doc) public void setContentHandler(ContentHandler handler)(Code)(Java Doc) public void setDTDHandler(DTDHandler handler)(Code)(Java Doc) public void setDefaultEncoding(String encoding)(Code)(Java Doc) public void setDocumentHandler(DocumentHandler handler)(Code)(Java Doc) public void setEntitiesAsText(boolean entitiesAsText)(Code)(Java Doc) public void setEntityResolver(EntityResolver resolver)(Code)(Java Doc) public void setErrorHandler(ErrorHandler handler)(Code)(Java Doc) public void setExpandEntities(boolean expandEntities)(Code)(Java Doc) public void setFeature(String name, boolean value) throws SAXNotSupportedException(Code)(Java Doc) 
public void setFilename(String filename)(Code)(Java Doc) public void setForgiving(boolean forgiving)(Code)(Java Doc) public void setJsp(boolean isJsp)(Code)(Java Doc) public void setLexicalHandler(LexicalHandler handler)(Code)(Java Doc) public void setLocale(Locale locale)(Code)(Java Doc) public void setNamespaceAware(boolean isNamespaceAware)(Code)(Java Doc) public void setNamespacePrefixes(boolean isNamespaces)(Code)(Java Doc) public void setOwner(QDocument doc)(Code)(Java Doc) public void setProperty(String name, Object obj) throws SAXNotSupportedException(Code)(Java Doc) public void setResinInclude(boolean doResinInclude)(Code)(Java Doc) public void setSAXNamespaces(boolean isNamespaces)(Code)(Java Doc) public void setSearchPath(Path path)(Code)(Java Doc) public void setSkipComments(boolean skipComments)(Code)(Java Doc) public void setSkipWhitespace(boolean skipWhitespace)(Code)(Java Doc) public void setToLower(boolean toLower)(Code)(Java Doc) public void setValidating(boolean isValidating)(Code)(Java Doc)
|
|
|