Chilkat2-Python
Chilkat2-Python
HTTP GET -- Read Response from Stream
See more REST Examples
Demonstrates how to send an HTTP GET for a web page, and then read the response from a Stream. The purpose is to fulfill a situation such as the following: "I have a URL and just want the <head> </head> portion of the HTML. This would avoid having to download a potentially enormous web page just to get at header information, such as the <styles>."Chilkat Chilkat2-Python Downloads
import sys
import chilkat2
success = False
# This example requires the Chilkat API to have been previously unlocked.
# See Global Unlock Sample for sample code.
rest = chilkat2.Rest()
# In this example, we'll get the web page at http://www.nytimes.com/pages/business/index.html
# The domain is "www.nytimes.com", and the path is "/pages/business/index.html"
# If we have only the full URL to begin with, it can be loaded into the Chilkat URL object to
# access the parts:
url = chilkat2.Url()
url.ParseUrl("http://www.nytimes.com/pages/business/index.html")
bAutoReconnect = True
success = rest.Connect(url.Host,url.Port,url.Ssl,bAutoReconnect)
# Send the GET request (This sends the GET request, but does not read the response.)
success = rest.SendReqNoBody("GET",url.Path)
if (success != True):
print(rest.LastErrorText)
sys.exit()
# Read the response header.
responseStatusCode = rest.ReadResponseHeader()
if (responseStatusCode < 0):
print(rest.LastErrorText)
sys.exit()
print("Response status code = " + str(responseStatusCode))
# We expect a 200 response status.
if (responseStatusCode != 200):
# If the response status code is not 200, we could check for a redirect status code and
# then follow it, read the entire response (as shown here), or just call rest.Disconnect
errResponse = rest.ReadRespBodyString()
if (rest.LastMethodSuccess != True):
print(rest.LastErrorText)
else:
print(errResponse)
sys.exit()
bodyStream = chilkat2.Stream()
# Set a 10 second read timeout for the stream.
# (Give up if no data arrives within 10 seconds after calling a read method.)
bodyStream.ReadTimeoutMs = 10000
# Create a background thread task to read the response body (which feeds
# it to the bodyStream object.)
# readResponseBodyTask is a CkTask
readResponseBodyTask = rest.ReadRespBodyStreamAsync(bodyStream,True)
# Start the task.
success = readResponseBodyTask.Run()
# Read the HTTP response body until the "</head>" is seen, or until
# the end-of-stream is reached.
sbBody = chilkat2.StringBuilder()
exitLoop = False
while not exitLoop and (bodyStream.EndOfStream != True) :
bodyText = bodyStream.ReadString()
if (bodyStream.LastMethodSuccess == True):
sbBody.Append(bodyText)
if (sbBody.Contains("</head>",False)):
exitLoop = True
else:
exitLoop = True
# Cancel the remainder of the task...
readResponseBodyTask.Cancel()
# Ensure we're disconnected from the server.
maxWaitMs = 50
rest.Disconnect(maxWaitMs)
print("----")
print(sbBody.GetAsString())
print("----")
print("Successfully received the body up to the desired point.")