1 #coding=utf-8
2 import requests
3 from lxml import etree
4
# Brute-force solver for a crawler exercise: POST candidate passwords to the
# lesson form until the page stops showing the "wrong password" message,
# then print the candidate that was accepted.
url = 'http://www.heibanke.com/lesson/crawler_ex01/'

# Largest candidate tried; candidates run from 0 up to this value inclusive.
MAX_PASSWORD = 30

# Seconds to wait for each HTTP response before giving up on the request.
REQUEST_TIMEOUT = 10

# Form data submitted with every attempt; 'password' is overwritten per try.
payload = {
    'password': 0,
    'username': 123,
}

for password in range(MAX_PASSWORD + 1):
    payload['password'] = password
    # A timeout keeps one stalled connection from hanging the whole run.
    r = requests.post(url, data=payload, timeout=REQUEST_TIMEOUT)
    # Take the raw response bytes and decode them as UTF-8.
    html = r.content.decode('utf-8')
    # Parse the page so the status message can be located with XPath.
    page = etree.HTML(html)
    # Guard against a parse that produced no root element.
    info = [] if page is None else page.xpath('/html/body/div/div/div/h3/text()')
    if not info:
        # Without the <h3> message there is no way to tell success from
        # failure, so stop with a clear error instead of an IndexError.
        raise RuntimeError(
            'no <h3> status message found in the response for password %d'
            % password
        )
    if u'您输入的密码错误, 请重新输入' not in info[0]:
        # The "wrong password" notice is absent: this candidate was accepted.
        break
else:
    # Every candidate was rejected; do not report a bogus value.
    raise SystemExit('no password in 0..%d was accepted' % MAX_PASSWORD)

# Single-argument print() emits the same output on Python 2 and Python 3.
print(password)