爬取新型冠状病毒数据

# Destination of the exported table (a CSV file, despite the "Excel" name).
ExcelName = 'D:/2.13.csv'

# Parse the page source into an element tree.
# NOTE(review): `html` is not defined in the visible part of this script;
# it presumably holds the downloaded page text -- confirm before running.
selector = lxml.etree.HTML(html)

# Each <li> of the second <ul> inside the first <div> under #app2 holds four
# <span> cells. span[1]..span[4] are collected into links1..links4; judging
# by the CSV header written later these are province, confirmed, deaths and
# cured -- verify against the live page.
_CELL_XPATH = '//*[@id="app2"]/div[1]/ul[2]/li/span[{}]/text()'
links1, links2, links3, links4 = (
    selector.xpath(_CELL_XPATH.format(column)) for column in range(1, 5)
)



# for i in range(len(links1)):
#    print(links1[i])
#    print(links2[i])
#    print(links3[i])
#    print(links4[i])


import csv  # no import is visible in this script; harmless if repeated

# Export the scraped columns to ExcelName as UTF-8 CSV.
# The header and every data row go through a single file handle instead of
# reopening the file in append mode once per row.
with open(ExcelName, 'w', encoding='utf-8', newline='') as csvfile:
    writer = csv.writer(csvfile)
    # Header: province, confirmed, deaths, cured. The trailing empty cell is
    # kept so the output stays identical to what the script produced before.
    writer.writerow(["省份","确诊","死亡","治愈",""])
    # zip() pairs the four columns row by row and stops at the shortest one,
    # so a short column no longer raises IndexError after a partial write.
    writer.writerows(zip(links1, links2, links3, links4))

  网址:http://health.people.com.cn/GB/26466/431463/431576/index.html

效果:

原文地址:https://www.cnblogs.com/NCLONG/p/12305336.html