Web crawler 01: commonly used urllib functions

from urllib import request
from urllib import parse
# 1. Fetch a page
url = "http://www.baidu.com"
resp = request.urlopen(url)
# NOTE: `resp` is never closed in this script; the connection stays open
# until the interpreter exits.
# Things to try on the response (uncomment one at a time, since the body
# is a stream and can only be consumed once):
# print(resp.getcode())       # HTTP status code of the response
# print(resp.read())          # the whole body, as bytes
# print(resp.readline())      # a single line of the body
# print(resp.readlines()[1])  # readlines() gives a list of lines; [1] is the second

# 2. Download resources straight to disk
# Save the Baidu home page as a local HTML file.
request.urlretrieve("http://www.baidu.com", filename="baidu.html")
# Save an image; the long URL is split across two adjacent string literals,
# which Python joins into a single string.
request.urlretrieve(
    "https://bkimg.cdn.bcebos.com/pic/38dbb6fd5266d0167927ca029b2bd40735fa35d9"
    "?x-bce-process=image/resize,m_lfit,w_268,limit_1/format,f_jpg",
    filename="Jay.jpg",
)

# 3. Encoding and decoding query strings
params = dict(wd="Jay")
# urlencode turns the mapping into a query string: "wd=Jay"
qs = parse.urlencode(params)
# parse_qs reverses it; every value comes back as a list: {'wd': ['Jay']}
sq = parse.parse_qs(qs)
print(sq)

# 4. Split a URL into its components with urlparse
# urlparse yields six components:
# scheme, netloc, path, params, query, fragment.
result = parse.urlparse(url)
print(result)  # the whole ParseResult
# One component per line, in the same order as the fields above.
print(
    result.scheme,
    result.netloc,
    result.path,
    result.params,
    result.query,
    result.fragment,
    sep="\n",
)

# urlsplit is the five-component variant of urlparse: it does not separate
# `params` from the path, so the result has no `.params` attribute
# (print(result2.params) would raise AttributeError).
result2 = parse.urlsplit(url)
print(result2)  # the whole SplitResult
# One component per line.
print(
    result2.scheme,
    result2.netloc,
    result2.path,
    result2.query,
    result2.fragment,
    sep="\n",
)

  

Guess you like

Origin www.cnblogs.com/wcyMiracle/p/12460626.html