擅长:python、mysql、java
<p>可以尝试使用 lxml 模块和 XPath,我想这样应该就差不多了。</p>
<pre><code>import urllib.request
from lxml import etree
# Scrape the fifth-column <span> text of every table row on the page into
# ``user_list``. Rows without such a span contribute an empty string, so the
# list stays aligned with the table rows matched by ``xpathparent``.
url = "https://datarecovery.com/rd/default-passwords/"
htmlparser = etree.HTMLParser()

# Use the response as a context manager so the HTTP connection is closed
# once the document has been parsed.
with urllib.request.urlopen(url) as response:
    tree = etree.parse(response, htmlparser)

user_list = []
xpathparent = '/html/body/div[1]/div[2]/div[2]/div/div/div/div[1]/div/div/table/tbody/tr'
# Example of the absolute path to one target cell (row 2); kept for reference
# only -- the loop below queries each row relatively and does not use it.
xpathselector = '/html/body/div[1]/div[2]/div[2]/div/div/div/div[1]/div/div/table/tbody/tr[2]/td[5]/span'

table_user = tree.xpath(xpathparent)
for item in table_user:
    # Query relative to the row element instead of rebuilding an absolute
    # path with tree.getpath(); both select the same nodes.
    user = item.xpath('td[5]/span')
    if user:
        user_name = user[0].text
    else:
        user_name = ''
    user_list.append(user_name)
</code></pre>