Python 爬虫爬取古诗词内容,并存入 MySQL
爬取结果展示:
代码如下:
from urllib import request
import re,os
import pymysql
import time
# Root of the so.gushiwen.org site (the host that get_model_url's link
# pattern matches against).
base_url = "https://so.gushiwen.org"
# Listing page on www.gushiwen.org.
# NOTE(review): presumably the start page passed to get_model_url - confirm
# against the caller.
shiwen_url = "https://www.gushiwen.org/shiwen/"
def get_model_url(shiwen_url):
    """Collect the so.gushiwen.org ``.aspx`` links found on a page.

    Args:
        shiwen_url: URL of the page to scan; it is handed to ``get_html``.

    Returns:
        A list of ``(path, text)`` tuples, one per matching ``<a>`` tag.
        ``path`` is the part of the href between ``https://so.gushiwen.org/``
        and ``.aspx``; ``text`` is whatever sits between the opening tag
        and ``</a>``.
    """
    # NOTE(review): get_html is defined outside this block; it is assumed to
    # return the page as str (a bytes result would not work with a str
    # pattern) - confirm.
    html = get_html(shiwen_url)
    # Raw string: in a normal literal "\." is an invalid escape sequence and
    # triggers a SyntaxWarning on recent Python versions. The pattern text
    # itself is unchanged.
    link_pattern = r'<a href="https://so\.gushiwen\.org/(.*?)\.aspx">(.*?)</a>'
    # With two capture groups, findall yields one 2-tuple per match.
    return re.findall(link_pattern, html)
def conn_mysql():
url