"""Scrape the title, keywords and description of several music sites into a CSV.

For every URL in ``URLS`` the page is downloaded, the ``<title>`` text and the
``keywords`` / ``description`` meta tags are extracted with regular
expressions, and one row is appended to the CSV file at ``OUTPUT_PATH``.
"""
import codecs
import csv
import os
import re

import requests

# Pages to scrape, visited in this order.
URLS = (
    "https://y.qq.com/",
    "https://www.kugou.com/",
    "https://music.163.com/",
    "https://www.bilibili.com/",
    "https://music.91q.com/",
)

# Destination CSV; rows are appended so results of earlier runs are kept.
OUTPUT_PATH = "C://Users//86171//PythonProject//study//pachong//test.csv"

# Column titles of the CSV (site name, site keywords, site description).
HEADER = ["音乐库", "音乐库特色", "音乐库介绍"]

# Seconds to wait for a server before giving up instead of hanging forever.
REQUEST_TIMEOUT = 10

# Compiled once here rather than on every loop iteration.
TITLE_RE = re.compile(r'<title.*?>(?P<title>.*?)</title>', re.S)
KEYWORDS_RE = re.compile(
    r'<meta.*?name="keywords".*?content="(?P<keywords>.*?)".*?>', re.S
)
DESCRIPTION_RE = re.compile(
    r'<meta.*?name="description".*?content="(?P<description>.*?)".*?>', re.S
)


def _first_group(pattern, text, group):
    """Return the named *group* of the first match of *pattern*, or ""."""
    match = pattern.search(text)
    return match.group(group) if match else ""


# The BOM and the header row belong at the very start of the file only, so
# they are written just once: when the file does not exist yet or is empty.
is_new_file = not os.path.exists(OUTPUT_PATH) or os.path.getsize(OUTPUT_PATH) == 0

# newline="" lets the csv module control line endings (no blank rows on
# Windows); the with-block closes the file even if a request fails.
with open(OUTPUT_PATH, "a", encoding="utf-8", newline="") as f:
    csvwriter = csv.writer(f)
    if is_new_file:
        # A UTF-8 BOM at the start of the file marks the encoding for
        # programs that would otherwise guess it.
        f.write(codecs.BOM_UTF8.decode("utf-8"))
        csvwriter.writerow(HEADER)

    for url in URLS:
        with requests.get(url, timeout=REQUEST_TIMEOUT) as resp:
            # Show the encoding requests detected, then decode as UTF-8.
            print(resp.encoding)
            resp.encoding = 'utf-8'
            html = resp.text

        # Exactly one value per column (first match, or "" when the tag is
        # missing) so every row lines up with the three header columns.
        title = _first_group(TITLE_RE, html, "title")
        keywords = _first_group(KEYWORDS_RE, html, "keywords")
        description = _first_group(DESCRIPTION_RE, html, "description")

        print("音乐库:", title)
        print("音乐库特色:", keywords)
        print("音乐库介绍:", description)

        lis = [title, keywords, description]
        print(lis)
        print()
        csvwriter.writerow(lis)

    print('数据爬取完成!')