Sample code for 30+ languages & platforms
Chilkat2-Python

HTTP GET -- Read Response from Stream

See more REST Examples

Demonstrates how to send an HTTP GET for a web page, and then read the response from a Stream. The purpose is to fulfill a situation such as the following: "I have a URL and just want the <head> </head> portion of the HTML. This would avoid having to download a potentially enormous web page just to get at header information, such as the <styles>."

Chilkat Chilkat2-Python Downloads

Chilkat2-Python
import sys
import chilkat2

success = False

# This example requires the Chilkat API to have been previously unlocked.
# See Global Unlock Sample for sample code.

rest = chilkat2.Rest()

# In this example, we'll get the web page at http://www.nytimes.com/pages/business/index.html
# The domain is "www.nytimes.com", and the path is "/pages/business/index.html"

# If we have only the full URL to begin with, it can be loaded into the Chilkat URL object to
# access the parts:
url = chilkat2.Url()
url.ParseUrl("http://www.nytimes.com/pages/business/index.html")

bAutoReconnect = True
success = rest.Connect(url.Host,url.Port,url.Ssl,bAutoReconnect)

# Send the GET request (This sends the GET request, but does not read the response.)
success = rest.SendReqNoBody("GET",url.Path)
if (success != True):
    print(rest.LastErrorText)
    sys.exit()

# Read the response header.
responseStatusCode = rest.ReadResponseHeader()
if (responseStatusCode < 0):
    print(rest.LastErrorText)
    sys.exit()

print("Response status code = " + str(responseStatusCode))

# We expect a 200 response status.
if (responseStatusCode != 200):

    # If the response status code is not 200, we could check for a redirect status code and 
    # then follow it, read the entire response (as shown here), or just call rest.Disconnect
    errResponse = rest.ReadRespBodyString()
    if (rest.LastMethodSuccess != True):
        print(rest.LastErrorText)
    else:
        print(errResponse)

    sys.exit()

bodyStream = chilkat2.Stream()
# Set a 10 second read timeout for the stream. 
# (Give up if no data arrives within 10 seconds after calling a read method.)
bodyStream.ReadTimeoutMs = 10000

# Create a background thread task to read the response body (which feeds
# it to the bodyStream object.)
# readResponseBodyTask is a CkTask
readResponseBodyTask = rest.ReadRespBodyStreamAsync(bodyStream,True)

# Start the task. 
success = readResponseBodyTask.Run()

# Read the HTTP response body until the "</head>" is seen, or until
# the end-of-stream is reached.

sbBody = chilkat2.StringBuilder()
exitLoop = False
while not exitLoop and (bodyStream.EndOfStream != True) :

    bodyText = bodyStream.ReadString()
    if (bodyStream.LastMethodSuccess == True):
        sbBody.Append(bodyText)
        if (sbBody.Contains("</head>",False)):
            exitLoop = True

    else:
        exitLoop = True

# Cancel the remainder of the task...
readResponseBodyTask.Cancel()

# Ensure we're disconnected from the server.
maxWaitMs = 50
rest.Disconnect(maxWaitMs)

print("----")
print(sbBody.GetAsString())
print("----")
print("Successfully received the body up to the desired point.")