使用爬虫收集彩票数据,并保存到 CSV 文件中,代码如下:
# -*- coding: utf-8 -*-
# author:Apples
from requests import get
from bs4 import BeautifulSoup
from user_agent import generate_user_agent
import time
def request_content(start, end):
    """Download one history page and return its result rows.

    ``start`` and ``end`` are substituted into the ``start``/``end`` query
    parameters of the history URL. The response body is parsed with
    BeautifulSoup's ``html.parser``, the first ``<tbody id="tdata">`` element
    is selected, and every ``<tr>`` with CSS class ``t_tr1`` inside it is
    returned.

    Raises:
        IndexError: if the page contains no ``<tbody id="tdata">`` element.
        Any exception raised by ``requests.get`` (the request uses a
        6-second timeout) propagates unchanged.
    """
    history_url = 'https://datachart.500.com/ssq/history/newinc/history.php?start={0}&end={1}'.format(start, end)
    # A freshly generated User-Agent string is sent with every request.
    user_agent = generate_user_agent(device_type='desktop', os=('mac', 'linux', 'win', 'android'))
    reply = get(history_url, headers={'User-Agent': user_agent}, timeout=6)
    soup = BeautifulSoup(reply.content, "html.parser")
    # Only the first matching <tbody> is used; indexing fails if none exists.
    data_bodies = soup.find_all('tbody', id='tdata')
    return data_bodies[0].find_all('tr', class_='t_tr1')
class ssqclazz:
def __init__(self):
self.period = '' # 期号
self.red_1 = '' # 红球