urllib库
urllib库是Python自带的一个HTTP请求库(标准库,无需额外安装),包含以下几个常用模块:
-- urllib.request 请求模块
-- urllib.error 异常处理模块
-- urllib.parse url解析模块
1.urllib.request.urlopen(url)
>>>import urllib.request #导入模块
>>>response = urllib.request.urlopen('http://www.xlzweb.top') #请求打开网页
>>>print(response.read().decode('utf-8')) #read()读取响应内容(bytes),decode('utf-8')将其按utf-8解码为字符串
2.urllib.request.Request(url,data = None,headers={}) / urllib.parse
>>>from urllib import request,parse #导入request,parse模块
>>>
>>>url = 'http://www.xlzweb.top'
>>>dict = { 'name':'zhangsan' }
>>>headers = { 'User-Agent':'Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/60.0.3100.0 Safari/537.36','Host':'www.xlzweb.top' }
>>>data = bytes(parse.urlencode(dict),encoding='utf8') #将表单数据进行url编码并转换为bytes
>>>req = request.Request(url,data=data,headers=headers) #加入data参数和请求头,向页面发出请求
>>>response = request.urlopen(req) #打开页面
>>>print(response.read().decode('utf-8')) #读取页面
3.urllib.error
>>>from urllib import request,error
>>>
>>>try:
>>> response = request.urlopen('http://www.baidu.com')
>>>except error.URLError as e:
>>> print(e.reason)
>>>else:
>>> print('Request Successfully')