代码第二次循环时bs4中出现错误

from bs4 import BeautifulSoup import requests murl = ['https://www.amazon.in/dp/B07XY541GH/','https://www.amazon.in/dp/B085J17VVP/'] def track(url): req = requests.get(url) soup = BeautifulSoup(req.content, 'html5lib') pr = soup.find('span', id='priceblock_ourprice').getText() con_pr = pr[1:] converted_price = con_pr.strip() newprice = '' for con in converted_price: if con != ',': newprice = newprice + con newprice = float(newprice) return newprice def main(): for url in murl: price = track(url) print(price) main()

2990.0 Traceback (most recent call last): File "test.py", line 28, in <module> main() File "test.py", line 25, in main price = track(url) File "test.py", line 13, in track pr = soup.find('span', id='priceblock_ourprice').getText() AttributeError: 'NoneType' object has no attribute 'getText'

1条回答

网友

1楼 · 发布于 2024-09-26 22:07:32

以下是解决方案，请尝试：

import requests
from bs4 import BeautifulSoup

murl = ['https://www.amazon.in/dp/B07XY541GH/', 'https://www.amazon.in/dp/B085J17VVP/']


def track(url):
    req = requests.get(url, headers={
        "user-agent": "Mozilla/5.0 (X11; Linux x86_64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/88.0.4324.87 Safari/537.36"})
    soup = BeautifulSoup(req.content, 'html5lib')

    pr = soup.find('span', id=lambda x: x and x.startswith('priceblock_')).text
    con_pr = pr[1:]
    converted_price = con_pr.strip()
    newprice = ''
    for con in converted_price:
        if con != ',':
            newprice = newprice + con
    newprice = float(newprice)
    return newprice


def main():
    for url in murl:
        price = track(url)
        print(price)


main()

使用错过的用户aget。大多数情况下，它应该用于解析
元素标记对象没有getText（）方法
两个站点的Id不相同

相关问题更多 >

编程相关推荐

热门问题

热门文章