《xpath下载百度新闻链接》路径匹配

# coding=utf-8

from lxml import html
import requests
import csv

# Scrape the keyword links from the Baidu "top buzz" page and save them as
# (title, link) rows in data.csv.

# Browser-like User-Agent header sent along with the request.
header = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/69.0.3497.100 Safari/537.36'
}

# The timeout keeps the script from blocking forever on a stalled connection;
# requests applies no timeout unless one is given explicitly.
response = requests.get(
    'http://top.baidu.com/buzz?b=1&fr=20811',
    headers=header,
    timeout=10,
)
# Fail loudly on a 4xx/5xx answer rather than parsing an error page and
# writing a CSV that only contains the header row.
response.raise_for_status()

# Decode the body using the encoding guessed from its content
# (apparent_encoding) before handing the text to lxml.
response.encoding = response.apparent_encoding
tree = html.fromstring(response.text)

# Text and href of the first <a> inside every <td class="keyword"> cell.
name = tree.xpath('//td[@class="keyword"]/a[1]/text()')
url = tree.xpath('//td[@class="keyword"]/a[1]/@href')
print(name)
print(url)

# CSV header row followed by one (title, link) pair per keyword.
colum = ['名称', '地址']
# zip pairs the two lists by position and stops at the shorter one.
date = zip(name, url)

# newline='' lets the csv module control line endings itself.
with open('data.csv', mode='w', encoding='utf-8', newline='') as file:
    writer = csv.writer(file)
    writer.writerow(colum)
    writer.writerows(date)
原文地址:https://www.cnblogs.com/huazhou695/p/9876635.html