Pyquery


In [53]:
import pyquery

# Small fixture: three anchors. The first two wrap an <svg> carrying an
# aria-label; the third has no <svg> and carries the aria-label itself.
html = """<html>
<body>
<a href="foo">
<svg aria-label="star" />
123
</a>

<a href="second">
<svg aria-label="star" />
125
</a>

<a href="third" aria-label="Stargazers">
125
</a>

</body>
</html>
"""

d = pyquery.PyQuery(html)

LABEL = 'aria-label'

# Pass 1: label of the nested <svg> for every anchor, each followed by a
# blank line. An anchor without an <svg> child prints None.
for node in d('a').items():
    print(node.find('svg').attr[LABEL], end='\n\n')

# Compare the PyQuery selection with the raw element it wraps.
anchors = d('a')
first_anchor = anchors[0]
print(anchors.text())        # text of all matched anchors in one string
print(type(anchors))         # the selection is a PyQuery object
print(type(first_anchor))    # indexing yields the underlying lxml element
# NOTE: the element's own .text shows up as whitespace only in the output.
print('d a text', first_anchor.text)

# Pass 2: per anchor, one line each for the nested <svg> label, the
# anchor's own label, and the anchor's text.
for node in d('a').items():
    svg_label = node.find('svg').attr[LABEL]
    own_label = node.attr[LABEL]
    print(svg_label, own_label, node.text(), sep='\n')


star

star

None

123 125 125
<class 'pyquery.pyquery.PyQuery'>
<class 'lxml.etree._Element'>
d a text 

star
None
123
star
None
125
None
Stargazers
125