import org.ops4j.pax.carrot.api.Options; import org.ops4j.pax.carrot.html.HtmlParser; import org.ops4j.pax.carrot.html.HtmlParserImpl; import org.ops4j.pax.carrot.html.dom.HtmlDocument; public class HtmlParserExample { public static void main(String[] args) { HtmlParser parser = new HtmlParserImpl(); String html = "<html><body><h1>Hello, World!</h1></body></html>"; Options options = new Options(); HtmlDocument document = parser.parse(html, options); // ... } } import org.ops4j.pax.carrot.api.Options; import org.ops4j.pax.carrot.html.HtmlParser; import org.ops4j.pax.carrot.html.HtmlParserImpl; import org.ops4j.pax.carrot.html.dom.HtmlDocument; import org.ops4j.pax.carrot.html.dom.HtmlElement; import org.ops4j.pax.carrot.xpath.XPath; public class XPathExample { public static void main(String[] args) { HtmlParser parser = new HtmlParserImpl(); String html = "<html><body><h1>Hello, World!</h1></body></html>"; Options options = new Options(); HtmlDocument document = parser.parse(html, options); XPath xpath = new XPath("/html/body/h1"); HtmlElement element = xpath.evaluateFirst(document); System.out.println(element.getText()); } } import org.ops4j.pax.carrot.api.Options; import org.ops4j.pax.carrot.html.HtmlParser; import org.ops4j.pax.carrot.html.HtmlParserImpl; import org.ops4j.pax.carrot.html.dom.HtmlDocument; import org.ops4j.pax.carrot.html.transform.DefaultHtmlDocumentTransformer; import org.ops4j.pax.carrot.html.transform.HtmlDocumentTransformer; public class HtmlTransformationExample { public static void main(String[] args) { HtmlParser parser = new HtmlParserImpl(); String html = "<html><body><h1>Hello, World!</h1></body></html>"; Options options = new Options(); HtmlDocument document = parser.parse(html, options); HtmlDocumentTransformer transformer = new DefaultHtmlDocumentTransformer(); document = transformer.transform(document); System.out.println(document.serialize()); } }


上一篇:
下一篇:
切换中文