1. content = response.content.decode('gb2312', 'ignore')
   html = etree.HTML(content)
2. html = etree.HTML(response.text)