个人冲刺(二)

对苏宁详情页的爬取
# -*- coding:utf-8 -*-
import requests
import re

# HTTP header mapping holding a single desktop-browser-style User-Agent value.
# The value is written as adjacent string literals, which Python joins into
# one string at compile time.
headers = {
    "User-Agent": (
        "Mozilla/5.0 (Windows NT 10.0; Win64; x64) "
        "AppleWebKit/537.36(KHTML, like Gecko) "
        "Chrome/83.0.4103.106 Safari/537.36"
    ),
}
# url = "http://www.imomoe.la/"
#
# res = requests.get(url).text.encode('iso-8859-1').decode('gbk')
# print(res)
# getK = re.compile(r'<span><a href=".*?">.*?</a></span><a href=".*?" title=".*?">(.*?)</a>')
# keyL = re.findall(getK, res)
# print(keyL)

# Fetch one Suning product detail page and print every value found in the
# table cell that follows the "货号" (item number) label.
url = "https://product.suning.com/0070088010/11009048498.html?"

# Pass the module-level `headers` so the browser-like User-Agent is actually
# sent (it was defined but never used), and bound the wait so a stalled
# connection cannot hang the script indefinitely.
response = requests.get(url, headers=headers, timeout=10)
# Fail loudly on HTTP 4xx/5xx instead of running the regex over an error page
# and printing a misleading empty list.
response.raise_for_status()
res = response.text

# The pattern matches the literal markup (single spaces between tags) and
# lazily captures the text of the following <td class="val"> cell.
getK = re.compile(r'<span>货号</span> </div> </td> <td class="val">(.*?)</td>')
# findall returns a list of captured strings; it is empty when nothing matches.
keyL = getK.findall(res)
print(keyL)
原文地址:https://www.cnblogs.com/mumulailai/p/14911865.html