import org.jsoup.Jsoup; import org.jsoup.nodes.Document; import org.jsoup.select.Elements; import org.semarglproject.rdf.ParseException; import org.semarglproject.rdf.rdfa.RdfaParser; import org.semarglproject.source.StreamProcessor; public class RDFaHtmlParserExample { public static void main(String[] args) { Document document = Jsoup.parse("<html><body><div vocab=\"http://schema.org/\" typeof=\"Person\"><span property=\"name\">John Doe</span></div></body></html>"); StreamProcessor streamProcessor = new StreamProcessor(RdfaParser.connect(RDFaParser.RDFaParserFactory.getInstance())); try { streamProcessor.process(document.html(), "http://example.com"); } catch (ParseException e) { e.printStackTrace(); } Elements elements = document.select("[property]"); for (org.jsoup.nodes.Element element : elements) { String property = element.attr("property"); String value = element.text(); System.out.println(property + ": " + value); } } }


上一篇:
下一篇:
切换中文