这个问题怎么解决啊!用的utf8
但是却有ASCII解码的错误,有没有大神帮忙看一下!
import urllib.parse import urllib.request import re import urllib.error def run_spider(url, page): html1 = urllib.request.urlopen(url).read() html1 = str(html1) pat1 = '<div id="plist".+? <div class="page clearfix">' result1 = re.compile(pat1).findall(html1) result1=result1[0] pat2 = '<img width="220" height="220" data-img="1" data-lazy-img="//(.+?\.jpg)' pictures = re.compile(pat2).findall(result1) i = 1 for picture in pictures: filename1 = "C:/Users/85095/myproj1/myproj1/woqu/" + str(page) + str(i) + ".jpg" try: urllib.request.urlretrieve(picture, filename=filename1) except urllib.error.URLError as e: if hasattr(e, "code"): i += 1 if hasattr(e, "reason"): i += 1 i += 1