pyquery

1.安装

使用国内镜像源

pip install pyquery -i http://pypi.douban.com/simple/ --trusted-host pypi.douban.com

2.Demo

from pyquery import PyQuery as pq
import requests

# Demo script: walks through the basic pyquery operations (initialisation,
# selection, traversal, attribute/text/html access and DOM manipulation)
# against a live page.

# Initialise from a URL
# NOTE(review): verify=False is presumably forwarded to the underlying HTTP
# client and turns off TLS certificate verification -- fine for a demo,
# confirm before reusing elsewhere.
doc = pq('https://www.58pic.com/c/0-104-0-1.html', verify=False)
# print(doc)
# print(type(doc))

# CSS selectors: three ways to reach the elements below a selection
ul = doc('ul')
# print(ul('li'))
# print(ul.find('li'))
# print(ul.children())

# Parent element (direct parent only)
ulparent = ul.parent()
# print(ulparent)

# Ancestor nodes: parents() collects all ancestors, unlike parent() above
# which stops at the direct parent.
ulroot = ul.parents()
# print(ulroot)

# Sibling nodes
rootsiblings = ulroot.siblings()
# print(rootsiblings)

# Iterate over the matched elements; items() yields each match individually
ulchild = ul.find('li')
# print(ulchild)
for item in ulchild.items():
    # print(item)
    # print(type(item))
    pass

# Read an attribute
# print(ul.attr('class'))

# Read the text content
# print(ul.text())

# Read the inner HTML
# print(ul.html())

# DOM manipulation

# remove_class() / add_class(): print before and after each change so the
# effect on the markup is visible
print(ul)
ul.remove_class('more-wrap')
print(ul)
ul.add_class('more-wrap')
print(ul)

# Set an attribute
ul.attr('name','cys')
print(ul)
# Set a CSS property
ul.css('font-size','14px')
print(ul)

# Remove nodes
ul.find('li').remove()
print(ul)


#######################################################################

# Alternative: initialise from a local file
# doc = pq(filename='a2.html')
# print(type(doc))
# print(type(doc('head')))

#######################################################################

# Alternative: initialise from a string (page fetched with requests)
# response = requests.get('https://www.58pic.com/c/0-104-0-2.html',verify=False)
# data = response.content.decode('gbk')
# doc = pq(data)
# print(type(doc))
# print(type(doc('head')))

参考:https://www.cnblogs.com/zhaof/p/6935473.html

原文地址:https://www.cnblogs.com/chenyishi/p/10615929.html