Python 爬取牛客网面试题
使用 Python 的 requests 库爬取牛客网面试题
代码如下:
import pymysql
import requests
from lxml import html
import datetime
import time
import re
# import multiprocessing
class SpiderNKW(object):
def spider(self, sn):
'''nkw'''
url = 'https://www.nowcoder.com/ta/review-test/review?page={0}'.format(sn)
resp = requests.get(url)
# html文档
resp = requests.get(url, headers={
'user-agent': 'Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/63.0.3239.26 Safari/537.36 Core/1.63.6776.400 QQBrowser/10.3.2601.400',
})
resp.encoding = 'utf-8'
rest = resp.text
print('问题{0}:'.format(sn))
# 问题