import requests
import re
def add_url(url, num):
    """Return *url* with *num* appended to it.

    Args:
        url: Base address, used as-is (no separator is inserted).
        num: Value to append; a string or anything ``%s`` can format,
            such as an int.

    Returns:
        The concatenation of ``url`` and the text form of ``num``.
    """
    # Formatting instead of ``+`` lets callers pass a number directly.
    return '%s%s' % (url, num)
def next(url):
    """Download *url* and extract the number the page announces next.

    NOTE: the name shadows the built-in ``next``; it is kept unchanged
    because callers refer to it by this name.

    Args:
        url: Address of the page to download.

    Returns:
        The non-empty list of captured number strings when the page
        contains the "next number" sentence (the first one is printed).
        ``None`` when the sentence is absent; the page text is printed
        instead so the final message can be read.

    Raises:
        requests.RequestException: If the download fails or times out.
    """
    # A timeout keeps an unresponsive server from hanging the crawl forever.
    response = requests.get(url, timeout=10)
    # Match on decoded text with a text pattern so the same code works on
    # Python 2 and Python 3 (the ``u`` prefix matters only on Python 2).
    page = response.text
    pattern = re.compile(u'下一个你需要输入的数字是(.*?)\\.')
    found = pattern.findall(page)
    if found:
        print(found[0])
        return found
    print(page)
    return None
def main():
    """Follow the chain of numbered pages of the crawler_ex00 lesson.

    Reads the first number from the start page, then repeatedly requests
    the start URL with the current number appended and takes the next
    number from each response. Stops when a page no longer yields a
    number or when a request fails, then prints a closing message.
    """
    url = 'http://www.heibanke.com/lesson/crawler_ex00/'
    # A timeout keeps an unresponsive server from hanging the script.
    page = requests.get(url, timeout=10).text
    # Text pattern against decoded text: works on Python 2 and Python 3.
    pattern = re.compile(u'你需要在网址后输入数字(.*?)</h3>')
    num = pattern.findall(page)
    if not num:
        # Nothing to follow; report it instead of failing with IndexError.
        print('[!]no starting number found on ' + url)
        return
    print(num[0])
    # next() returns None once a page has no further number, which ends
    # the loop without relying on an exception from indexing None.
    while num:
        try:
            num = next(add_url(url, num[0]))
        except requests.RequestException as e:
            print(e)
            break
    print('[!]works have already done yet')
if __name__ == '__main__':
    # Start the crawl only when run as a script, not when imported.
    main()
# ![这里写图片描述](https://i-blog.csdnimg.cn/blog_migrate/60b700a1a1deadc569c7927774703fad.png)
import requests
import re
# Brute-force the numeric password of the crawler_ex01 lesson form:
# read the CSRF token from the form page, then post candidate passwords
# 1..29 until the response no longer contains the "wrong password" text.
url = 'http://www.heibanke.com/lesson/crawler_ex01/'

# A session sends back the cookies set by the GET with every POST.
# NOTE(review): presumably the server pairs the form token with a CSRF
# cookie (the field name is Django's) -- confirm against the site.
session = requests.Session()
# Timeouts keep an unresponsive server from hanging the script.
content = session.get(url, timeout=10).text
# [^']+ stops at the closing quote, so other attributes on the same line
# cannot be swallowed the way a greedy (.*) could.
pattern = re.compile(r"name='csrfmiddlewaretoken' value='([^']+)' />")
result1 = pattern.findall(content)
if not result1:
    # Fail with a clear message instead of an IndexError further down.
    raise SystemExit('[!]csrfmiddlewaretoken not found on ' + url)

for i in range(1, 30):
    data = {
        'csrfmiddlewaretoken': result1[0],
        'username': 'aa',
        'password': i,
    }
    content = session.post(url, data=data, timeout=10).text
    # Compare decoded text with text literals so the check works on both
    # Python 2 and Python 3 (the ``u`` prefix matters only on Python 2).
    if u'您输入的密码错误' in content:
        print('[*]' + u'尝试' + str(i) + u'失败')
    else:
        print('[!]' + u'尝试' + str(i) + u'成功')
        print(content)
        # The password is found; further attempts are pointless.
        break
# ![这里写图片描述](https://i-blog.csdnimg.cn/blog_migrate/50da4a92e3aa4322561814195f2defe0.png)