import net.htmlparser.jericho.*;

/**
 * Minimal Jericho HTML Parser example: parses an HTML document and extracts
 * the text of its first {@code <h1>} and first {@code <p>} elements.
 */
public class HTMLParserExample {

    /** Document parsed when no HTML is supplied on the command line. */
    private static final String SAMPLE_HTML =
            "<html><body><h1>Example title</h1><p>Example paragraph.</p></body></html>";

    /**
     * Parses the HTML given as the first command-line argument (or the
     * built-in sample when there is none) and prints the extracted heading
     * and paragraph text.
     *
     * @param args optional; {@code args[0]} is the HTML markup to parse
     * @throws Exception if parsing fails
     */
    public static void main(String[] args) throws Exception {
        // The original referenced an undeclared `html` variable; resolve it here.
        String html = (args != null && args.length > 0) ? args[0] : SAMPLE_HTML;

        Source source = new Source(html);
        // Parse every tag up front, in document order, before searching.
        source.fullSequentialParse();

        String title = firstElementText(source, HTMLElementName.H1);
        String text = firstElementText(source, HTMLElementName.P);

        System.out.println("title: " + title);
        System.out.println("text: " + text);
    }

    /**
     * Returns the text content of the first element with the given name.
     *
     * @param source      the parsed document to search
     * @param elementName the element name to look up, e.g. {@code HTMLElementName.H1}
     * @return the extracted text, or an empty string if the document has no such element
     */
    private static String firstElementText(Source source, String elementName) {
        Element element = source.getFirstElement(elementName);
        // getFirstElement yields null when nothing matches; avoid the NPE.
        if (element == null) {
            return "";
        }
        return element.getTextExtractor().toString();
    }
}


上一篇:
下一篇:
切换中文