# (CkPython) Download HTML from URL and Convert to XML
# Downloads an HTML page from a URL and converts it to XML.
import sys
import chilkat
# Note: This example requires the Chilkat Bundle license.
# Any string argument automatically begins the 30-day trial.
glob = chilkat.CkGlobal()
success = glob.UnlockBundle("30-day trial")
if not success:
    print(glob.lastErrorText())
    sys.exit()

# Fetch the page body as a string. Failure is reported through
# LastMethodSuccess rather than through the returned value.
http = chilkat.CkHttp()
html = http.quickGetStr("http://www.intel.com/")
if not http.get_LastMethodSuccess():
    print(http.lastErrorText())
    sys.exit()

htmlToXml = chilkat.CkHtmlToXml()
# Indicate the charset of the output XML we'll want.
htmlToXml.put_XmlCharset("utf-8")
# Set the HTML:
htmlToXml.put_Html(html)
# Convert to XML:
xml = htmlToXml.toXml()
if not htmlToXml.get_LastMethodSuccess():
    # Do not write an output file when the conversion itself failed.
    print(htmlToXml.lastErrorText())
    sys.exit()

# Save the XML to a file.
# Make sure your charset here matches the charset
# used for the XmlCharset property.
success = htmlToXml.WriteStringToFile(xml, "qa_output/out.xml", "utf-8")
if not success:
    # Report the write failure instead of claiming the run finished.
    print(htmlToXml.lastErrorText())
    sys.exit()

print("Finished.")
|