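"""
Crawler workflow:

1. Decide which website to crawl.
2. Analyze the structure of the website.
3. Send the network request - get the data returned by the server.
4. Parse the data - extract the required content.
5. Save the data.
"""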
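"""
1. Decide which website to crawl.
2. Analyze the structure of the website.
3. Send the network request - get the data returned by the server.
4. Parse the data - extract the required content.
5. Save the data.
"""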
from lxml.html import etree
from tkinter import *
import requests
header = {
"Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.9",
"Accept-Encoding": "gzip, deflate, br",
"Accept-Language": "zh-CN,zh;q=0.9,en;q=0.8,en-GB;q=0.7,en-US;q=0.6",
"Cache-Control": "max-age=0",
"Connection": "keep-alive",
"Cookie": "LOVEAPP_SESSID=15532afb00fc3226bccd541aecca9649ab8dc7c2; _ga=GA1.2.1048495854.1664884678; _gid=GA1.2.1511991182.1664884678; __root_domain_v=.ipip.net; _qddaz=QD.195864884678593; _qdd