"""Fetch one shihuo.cn deal page and extract the text of its article block."""

from lxml import etree
import requests

# Upper bound, in seconds, on how long the HTTP request may wait; without a
# timeout ``requests.get`` can block forever on an unresponsive server.
REQUEST_TIMEOUT_SECONDS = 10

url = 'http://www.shihuo.cn/youhui/474770.html#qk=youhui_list'

response = requests.get(url, timeout=REQUEST_TIMEOUT_SECONDS)
# Stop on 4xx/5xx responses instead of parsing an error page as the article.
response.raise_for_status()

# Parse the response body into an lxml HTML element tree.
text = etree.HTML(response.text)

# Every <div> whose class attribute is exactly "article".
tt = text.xpath("//div[@class='article']")

# XPath string(.) yields the concatenated text of the node and all of its
# descendants. Fall back to an empty string when the page has no matching
# <div>, rather than failing with a bare IndexError on tt[0].
info = tt[0].xpath("string(.)") if tt else ""