import org.ops4j.pax.carrot.api.Options;
import org.ops4j.pax.carrot.html.HtmlParser;
import org.ops4j.pax.carrot.html.HtmlParserImpl;
import org.ops4j.pax.carrot.html.dom.HtmlDocument;
/**
 * Minimal example that parses a hard-coded HTML snippet into an {@link HtmlDocument}.
 */
public class HtmlParserExample {

    /** Markup handed to the parser. */
    private static final String SAMPLE_HTML =
            "<html><body><h1>Hello, World!</h1></body></html>";

    /**
     * Creates an {@link HtmlParserImpl} and a new {@link Options} instance, then parses
     * {@link #SAMPLE_HTML} with them.
     *
     * @param args command-line arguments; not read
     */
    public static void main(String[] args) {
        final HtmlParser htmlParser = new HtmlParserImpl();
        final Options parseOptions = new Options();

        // The result is intentionally unused here; this is where code working
        // with the parsed document would go.
        final HtmlDocument parsed = htmlParser.parse(SAMPLE_HTML, parseOptions);
    }
}
import org.ops4j.pax.carrot.api.Options;
import org.ops4j.pax.carrot.html.HtmlParser;
import org.ops4j.pax.carrot.html.HtmlParserImpl;
import org.ops4j.pax.carrot.html.dom.HtmlDocument;
import org.ops4j.pax.carrot.html.dom.HtmlElement;
import org.ops4j.pax.carrot.xpath.XPath;
/**
 * Example that parses a hard-coded HTML snippet, evaluates an XPath expression against the
 * resulting document and prints the text of the first match.
 */
public class XPathExample {

    /** Markup handed to the parser. */
    private static final String SAMPLE_HTML =
            "<html><body><h1>Hello, World!</h1></body></html>";

    /** Expression evaluated against the parsed document. */
    private static final String HEADING_PATH = "/html/body/h1";

    /**
     * Parses {@link #SAMPLE_HTML}, evaluates {@link #HEADING_PATH} on the result and writes the
     * text of the first matching element to standard output.
     *
     * @param args command-line arguments; not read
     */
    public static void main(String[] args) {
        final HtmlDocument parsed = parseSample();

        final XPath headingQuery = new XPath(HEADING_PATH);
        final HtmlElement heading = headingQuery.evaluateFirst(parsed);

        // NOTE(review): the result of evaluateFirst is dereferenced without a check;
        // confirm against the XPath API whether it can be null when nothing matches.
        System.out.println(heading.getText());
    }

    /** Parses {@link #SAMPLE_HTML} with a new parser and a new {@link Options} instance. */
    private static HtmlDocument parseSample() {
        final HtmlParser htmlParser = new HtmlParserImpl();
        final Options parseOptions = new Options();
        return htmlParser.parse(SAMPLE_HTML, parseOptions);
    }
}
import org.ops4j.pax.carrot.api.Options;
import org.ops4j.pax.carrot.html.HtmlParser;
import org.ops4j.pax.carrot.html.HtmlParserImpl;
import org.ops4j.pax.carrot.html.dom.HtmlDocument;
import org.ops4j.pax.carrot.html.transform.DefaultHtmlDocumentTransformer;
import org.ops4j.pax.carrot.html.transform.HtmlDocumentTransformer;
/**
 * Example that parses a hard-coded HTML snippet, passes the document through a
 * {@link DefaultHtmlDocumentTransformer} and prints the serialized result.
 */
public class HtmlTransformationExample {

    /** Markup handed to the parser. */
    private static final String SAMPLE_HTML =
            "<html><body><h1>Hello, World!</h1></body></html>";

    /**
     * Parses {@link #SAMPLE_HTML}, transforms the parsed document and writes the output of
     * {@code serialize()} on the transformed document to standard output.
     *
     * @param args command-line arguments; not read
     */
    public static void main(String[] args) {
        // Step 1: parse the markup.
        final HtmlParser htmlParser = new HtmlParserImpl();
        final Options parseOptions = new Options();
        final HtmlDocument parsed = htmlParser.parse(SAMPLE_HTML, parseOptions);

        // Step 2: run the transformer over the parsed document.
        final HtmlDocumentTransformer documentTransformer = new DefaultHtmlDocumentTransformer();
        final HtmlDocument transformed = documentTransformer.transform(parsed);

        // Step 3: print the transformed document.
        System.out.println(transformed.serialize());
    }
}