Sample code for 30+ languages & platforms
Java

Download HTML from URL and Convert to XML

See more HTML-to-XML/Text Examples

Downloads an HTML page from a URL and converts it to XML.

Chilkat Java Downloads

Java
import com.chilkatsoft.*;

/**
 * Downloads an HTML page from a URL, converts it to XML, and saves the XML to a file.
 *
 * <p>Every step that can fail is checked; on failure the relevant object's last-error
 * text is printed and the program stops without printing "Finished.".
 */
public class ChilkatExample {

  // Load the native "chilkat" library once, when the class is initialized.
  // Without it none of the Ck* classes can be used, so exit on failure.
  static {
    try {
      System.loadLibrary("chilkat");
    } catch (UnsatisfiedLinkError e) {
      System.err.println("Native code library failed to load.\n" + e);
      System.exit(1);
    }
  }

  /**
   * Program entry point: fetches the page, converts it, and writes the result.
   *
   * @param argv command-line arguments (unused)
   */
  public static void main(String[] argv)
  {
    // Note: This example requires the Chilkat Bundle license.

    // Any string argument automatically begins the 30-day trial.
    CkGlobal glob = new CkGlobal();
    boolean success = glob.UnlockBundle("30-day trial");
    if (!success) {
      System.out.println(glob.lastErrorText());
      return;
    }

    CkHttp http = new CkHttp();

    String html = http.quickGetStr("http://www.intel.com/");
    if (!http.get_LastMethodSuccess()) {
      System.out.println(http.lastErrorText());
      return;
    }

    CkHtmlToXml htmlToXml = new CkHtmlToXml();

    // One charset value is used both for the XmlCharset property and for the
    // file write below, so the two can never drift apart.
    final String charset = "utf-8";

    // Indicate the charset of the output XML we'll want.
    htmlToXml.put_XmlCharset(charset);

    // Set the HTML:
    htmlToXml.put_Html(html);

    // Convert to XML, checking the result the same way the download is checked.
    String xml = htmlToXml.toXml();
    if (!htmlToXml.get_LastMethodSuccess()) {
      System.out.println(htmlToXml.lastErrorText());
      return;
    }

    // Save the XML to a file, and report a failed write instead of
    // claiming success.
    success = htmlToXml.WriteStringToFile(xml, "qa_output/out.xml", charset);
    if (!success) {
      System.out.println(htmlToXml.lastErrorText());
      return;
    }

    System.out.println("Finished.");
  }
}