爬虫
Weach
学生
展开
-
爬虫学习--BeautifulSoup库
from bs4 import BeautifulSoup html_doc = """ <!DOCTYPE html> <!--STATUS OK--> <html> <head> <meta content="text/html;charset=utf-8" http-equiv="content-type"/> <meta content="IE=Edge" http-equiv="X-UA-Compatible"/> ……
原创 · 2021-04-22 17:05:40 · 96 阅读 · 0 评论
-
爬虫学习--requests库
import json import requests from requests.exceptions import RequestException import faker from multiprocessing import Pool fake = faker.Factory.create() headers = { 'Connection': 'keep-alive', 'User-Agent': fake.user_agent() } # 获取网页代码通用框架 def ge……
原创 · 2021-04-22 17:02:35 · 87 阅读 · 2 评论