public final class CmsHtmlExtractor extends java.lang.Object
| Modifier and Type | Method and Description |
|---|---|
| static java.lang.String | extractText(java.io.InputStream in, java.lang.String encoding)<br>Extract the text from an HTML page. |
| static java.lang.String | extractText(java.lang.String content, java.lang.String encoding)<br>Extract the text from an HTML page. |
public static java.lang.String extractText(java.io.InputStream in, java.lang.String encoding) throws org.htmlparser.util.ParserException, java.io.UnsupportedEncodingException
Parameters:
- in - the HTML content input stream
- encoding - the encoding of the content

Throws:
- org.htmlparser.util.ParserException - if the parsing of the HTML failed
- java.io.UnsupportedEncodingException - if the given encoding is not supported

public static java.lang.String extractText(java.lang.String content, java.lang.String encoding) throws org.htmlparser.util.ParserException, java.io.UnsupportedEncodingException
Parameters:
- content - the HTML content
- encoding - the encoding of the content

Throws:
- org.htmlparser.util.ParserException - if the parsing of the HTML failed
- java.io.UnsupportedEncodingException - if the given encoding is not supported