Chilkat
HOME
Android™
ASP
Visual Basic
VB.NET
C#
iOS (iPhone)
Objective-C
C++
C
MFC
Delphi
FoxPro
Java
Perl
PHP Extension
PHP ActiveX
Python
PowerShell
Ruby
SQL Server
VBScript
|
Extract all HTML Objects from a Web Page
Demonstrates how to download a Web page (at a URL) and extract all of its HTML objects, e.g. images, links, CSS files, JavaScript files, etc.
import com.chilkatsoft.*; public class ChilkatExample { static { try { System.loadLibrary("chilkat"); } catch (UnsatisfiedLinkError e) { System.err.println("Native code library failed to load.\n" + e); System.exit(1); } } public static void main(String argv[]) { CkMht mht = new CkMht(); boolean success; success = mht.UnlockComponent("Anything for 30-day trial"); if (success != true) { System.out.println(mht.lastErrorText()); return; } // Download a URL into an in-memory MHT web archive contained // in a string variable: String mhtDoc; mhtDoc = mht.getMHT("http://www.gopackaging.com/"); if (mhtDoc == null ) { System.out.println(mht.lastErrorText()); return; } // Now extract the HTML and embedded objects: String unpackDir; unpackDir = "/Users/chilkat/temp/"; String htmlFilename; htmlFilename = "gopackaging.html"; String partsSubdir; partsSubdir = "objects"; // Extract to /Users/chilkat/temp/gopackaging.html. // images and other embedded objects are placed in // /Users/chilkat/temp/objects. Directories are automatically // created if they don't already exist. success = mht.UnpackMHTString(mhtDoc,unpackDir,htmlFilename,partsSubdir); if (success != true) { System.out.println(mht.lastErrorText()); } else { System.out.println("Unpacked!"); } } } |
© 2000-2010 Chilkat Software, Inc. All Rights Reserved.