"""Interactive console reader for the NetEase (news.163.com) ranking page.

The script fetches the ranking page, lists the news categories found on it,
asks the user to pick one by index, and then prints the body text of that
category's articles one at a time for as long as the user answers ``y``.

NOTE(review): this file arrived collapsed onto a single line with every
``<...>`` span stripped out.  Both regular expressions, and the statements
between the category prompt and the article loop, were lost.  The patterns
and that part of the control flow below are a reconstruction -- confirm
them against the live page markup before relying on this script.
"""
import re
from urllib import request

testurl = "http://news.163.com/rank/"

# Used when the server does not announce a charset in its Content-Type.
DEFAULT_CHARSET = "utf-8"

# NOTE(review): reconstructed guess.  The only thing the surviving code
# establishes is that each match is indexable and that element 0 is printed
# as the category label.  Presumably yields (category name, category URL).
CATEGORY_RE = re.compile(
    r'<div class="titleBar" id=".*?"><h2>(.*?)</h2>'
    r'<div class="more"><a href="(.*?)">.*?</a></div></div>',
    re.S,
)

# NOTE(review): reconstructed guess; the original pattern ended in ``.*?``
# and was applied with ``re.S``.  Presumably yields (article URL, title).
ARTICLE_LINK_RE = re.compile(
    r'<td class=".*?">.*?<a href="(.*?)".*?>(.*?)</a></td>',
    re.S,
)

# Paragraph text nodes of the article body (kept verbatim from the original).
ARTICLE_TEXT_XPATH = "//div[@id='endText'and @class='post_text']/p/text()"


def charset_from_content_type(content_type, default=DEFAULT_CHARSET):
    """Return the lower-cased charset named in a Content-Type header value.

    The original code indexed ``split(';')[1].split('=')[1]`` directly, which
    raises when the header is missing or carries no ``charset`` parameter.

    Args:
        content_type: Raw header value such as ``"text/html; charset=GBK"``,
            or ``None`` when the header is absent.
        default: Value returned when no usable charset parameter is present.

    Returns:
        The charset name in lower case, or ``default``.
    """
    if not content_type:
        return default
    # Everything after the first ';' is a list of ``name=value`` parameters.
    for param in content_type.split(";")[1:]:
        name, _, value = param.partition("=")
        value = value.strip().strip("\"'")
        if name.strip().lower() == "charset" and value:
            return value.lower()
    return default


def parse_choice(raw, count):
    """Convert the user's menu input into a valid index.

    ``str.isdecimal`` is used instead of ``str.isdigit`` because the latter
    accepts characters such as ``"²"`` that ``int()`` then rejects.

    Args:
        raw: Text typed by the user.
        count: Number of menu entries; valid indexes are ``0 .. count - 1``.

    Returns:
        The selected index, or ``None`` when the input is not a decimal
        number inside the valid range.
    """
    text = raw.strip()
    if not text.isdecimal():
        return None
    index = int(text)
    return index if index < count else None


def fetch_text(url, charset):
    """Download ``url`` and decode the body using ``charset``.

    Undecodable bytes are replaced rather than aborting the session, because
    the charset is detected only once (on the ranking page) and reused here.
    """
    with request.urlopen(url) as response:
        return response.read().decode(charset, errors="replace")


def article_paragraphs(html):
    """Return the text nodes of the article body paragraphs found in ``html``."""
    # Imported here so the pure helpers above stay importable without lxml.
    from lxml import etree

    dom = etree.HTML(html)
    if dom is None:  # guard: nothing parseable, so there is nothing to print
        return []
    return dom.xpath(ARTICLE_TEXT_XPATH)


def main():
    """Run the interactive category / article reading session."""
    with request.urlopen(testurl) as f:
        print('Status:', f.status, f.reason)
        # The page encoding is read only once; every later page is assumed
        # to use this same encoding.
        charset = charset_from_content_type(f.headers.get('Content-Type'))
        data = f.read().decode(charset, errors='replace')

    infos = CATEGORY_RE.findall(data)
    for i, info in enumerate(infos):
        print('%s-%s' % (i, info[0]))

    print('选择新闻类型')
    choice = parse_choice(input(), len(infos))
    if choice is None:
        return

    # NOTE(review): reconstructed flow -- fetch the chosen category page,
    # then walk the article links found on it.
    category_page = fetch_text(infos[choice][1], charset)
    for article_url, _title in ARTICLE_LINK_RE.findall(category_page):
        new = fetch_text(article_url, charset)
        for n in article_paragraphs(new):
            print(n)
        print('=======================输入y继续')
        if input() != 'y':
            break


if __name__ == "__main__":
    main()