擅长:Python、MySQL、Java
<pre class="lang-py prettyprint-override"><code>import requests
from bs4 import BeautifulSoup
import json
# Request headers passed to requests.get() in main(); the User-Agent value
# is a desktop Firefox 89 identifier string.
headers = {
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64; rv:89.0) Gecko/20100101 Firefox/89.0",
}
def main(url):
    """Fetch *url* and print the ``productIds`` list embedded in its first script tag.

    The text of the first ``<script>`` element is treated as a JavaScript
    assignment (``name = <json>``): everything after the first ``=`` is
    parsed as JSON and its ``productIds`` entry is printed.

    Args:
        url: Address of the page to download.

    Raises:
        requests.HTTPError: If the server answers with a 4xx/5xx status.
        ValueError: If the page has no usable first ``<script>`` text, the
            text contains no ``=``, or the payload is not valid JSON
            (``json.JSONDecodeError`` is a ``ValueError`` subclass).
        KeyError: If the parsed object has no ``productIds`` key.
    """
    # Without a timeout requests may wait forever on an unresponsive host.
    r = requests.get(url, headers=headers, timeout=30)
    # Fail loudly on an HTTP error instead of trying to parse an error page.
    r.raise_for_status()
    soup = BeautifulSoup(r.text, 'lxml')

    script = soup.select_one('script')
    # ``.string`` is None when the tag is empty or has more than one child.
    text = script.string if script is not None else None
    if text is None:
        raise ValueError(f'no inline <script> text found at {url}')

    # Keep only what follows the first "=", i.e. the assigned value.
    _, sep, goal = text.partition('=')
    if not sep:
        raise ValueError(f'first <script> at {url} contains no "=" assignment')

    # A JavaScript statement may end with ";", which json.loads would reject.
    goal = goal.strip().rstrip(';')
    print(json.loads(goal)['productIds'])
# Run the scraper against the Yeezy listing page.
target_url = 'https://www.adidas.com.sg/yeezy'
main(target_url)
</code></pre>
<p>输出:</p>
<pre><code>['GZ0953', 'GZ0954', 'GZ0955', 'GZ5551', 'GZ5554']
</code></pre>