public final class CmsHtmlExtractor
extends java.lang.Object
| 限定符和类型 | 方法和说明 |
|---|---|
| `static java.lang.String` | `extractText(java.io.InputStream in, java.lang.String encoding)` Extract the text from an HTML page. |
| `static java.lang.String` | `extractText(java.lang.String content, java.lang.String encoding)` Extract the text from an HTML page. |
public static java.lang.String extractText(java.io.InputStream in,
java.lang.String encoding)
throws org.htmlparser.util.ParserException,
java.io.UnsupportedEncodingException
Parameters:
in - the HTML content input stream
encoding - the encoding of the content
Throws:
org.htmlparser.util.ParserException - if the parsing of the HTML failed
java.io.UnsupportedEncodingException - if the given encoding is not supported

public static java.lang.String extractText(java.lang.String content,
java.lang.String encoding)
throws org.htmlparser.util.ParserException,
java.io.UnsupportedEncodingException
Parameters:
content - the HTML content
encoding - the encoding of the content
Throws:
org.htmlparser.util.ParserException - if the parsing of the HTML failed
java.io.UnsupportedEncodingException - if the given encoding is not supported