第四节:电商信息爬取项目实战
课程目标
- 学习如何通过 Playwright 完成某宝商品信息爬取
课程内容
编码实现
import json
from playwright.sync_api import sync_playwright
import time
from tqdm import tqdm
import pandas as pd
with sync_playwright() as p:
browser = p.chromium.launch(headless=False)
with open("cookies.json", 'r') as f:
storage_state = json.load(f)
page = browser.new_page()
page.goto("https://uland.taobao.com/sem/tbsearch?localImgKey=&page=1&q=%E5%B7%A5%E8%A3%85%E8%A3%A4&tab=all&#