1. content = response.content.decode('gb2312', 'ignore')
   html = etree.HTML(content)
2. html = etree.HTML(response.text)