add python_spider

master
xianhu 2016-10-16 10:09:57 +08:00
parent 8ffd4d3258
commit 54a152483b
1 changed file with 5 additions and 5 deletions

View File

@ -23,7 +23,7 @@ response = urllib.request.urlopen(request, timeout=10)
# 发送数据即在urlopen()或者Request()中添加data参数 # 发送数据即在urlopen()或者Request()中添加data参数
url = "http://localhost/login.php" url = "http://localhost/login.php"
data = urllib.parse.urlencode({"act": "login", "email": "xianhu@qq.com", "password": "123456"}) data = urllib.parse.urlencode({"act": "login", "email": "xianhu@qq.com", "password": "123456"})
request1 = urllib.request.Request(url, data) # POST方法 request1 = urllib.request.Request(url, data) # POST方法
request2 = urllib.request.Request(url + "?%s" % data) # GET方法 request2 = urllib.request.Request(url + "?%s" % data) # GET方法
response = urllib.request.urlopen(request, timeout=10) response = urllib.request.urlopen(request, timeout=10)
@ -31,7 +31,7 @@ response = urllib.request.urlopen(request, timeout=10)
# 发送Header即在urlopen()或者Request()中添加headers参数 # 发送Header即在urlopen()或者Request()中添加headers参数
headers = {"User-Agent": "Mozilla/4.0 (compatible; MSIE 5.5; Windows NT)"} headers = {"User-Agent": "Mozilla/4.0 (compatible; MSIE 5.5; Windows NT)"}
request = urllib.request.Request(url, data=data, headers=headers) # 参数中添加header参数 request = urllib.request.Request(url, data=data, headers=headers) # 参数中添加header参数
request.add_header("Referer", "http://www.baidu.com") # add_header函数另一种添加header的方法 request.add_header("Referer", "http://www.baidu.com") # add_header函数另一种添加header的方法
response = urllib.request.urlopen(request, timeout=10) response = urllib.request.urlopen(request, timeout=10)
@ -49,10 +49,10 @@ except urllib.error.HTTPError as e:
# 使用代理以防止IP被封或IP次数受限 # 使用代理以防止IP被封或IP次数受限
proxy = urllib.request.ProxyHandler({"http": "111.123.76.12:8080"}) proxy = urllib.request.ProxyHandler({"http": "111.123.76.12:8080"})
opener = urllib.request.build_opener(proxy) # 利用代理创建opener实例OpenerDirector实例 opener = urllib.request.build_opener(proxy) # 利用代理创建opener实例OpenerDirector实例
response = opener.open("https://www.baidu.com/") # 直接利用opener实例打开url response = opener.open("https://www.baidu.com/") # 直接利用opener实例打开url
urllib.request.install_opener(opener) # 安装、设置全局的opener然后利用urlopen打开url urllib.request.install_opener(opener) # 安装、设置全局的opener然后利用urlopen打开url
response = urllib.request.urlopen("https://www.baidu.com/") response = urllib.request.urlopen("https://www.baidu.com/")