创建一个Python网络爬虫来获取谷歌Play商店应用程序的元数据

# Function to crawl Google Play Store and obtain data
def web_crawl(app_id):
    """Request the Google Play page for ``app_id`` and write a report file.

    The app's details page is requested; when the request succeeds, a text
    file named ``web_crawl.txt`` is written into the directory of the
    running script (``sys.argv[0]``). The report holds a header plus the
    field labels only -- the values stay blank because the response body
    is not parsed.

    Args:
        app_id: Package identifier of the app, e.g. ``"com.cmplay.tiles2"``.

    Returns:
        None. ``HTTPError`` and ``URLError`` are caught and reported on
        stdout instead of being propagated; errors raised while writing
        the report file are not caught.
    """
    import os
    import sys

    # urllib2 exists only on Python 2; Python 3 split it into
    # urllib.request / urllib.error. Support both interpreters.
    try:
        from urllib2 import HTTPError, URLError, urlopen
    except ImportError:
        from urllib.error import HTTPError, URLError
        from urllib.request import urlopen

    # Obtain the URL for the app
    url = "https://play.google.com/store/apps/details?id=" + app_id

    try:
        response = urlopen(url)
    except HTTPError as e:
        # HTTPError is a subclass of URLError, so it must be handled first.
        print("HTTP Error: ")
        print(e.code)
    except URLError as e:
        print("URL Error: ")
        print(e.args)
    else:
        # The body is not read, so release the connection right away
        # instead of leaking it.
        response.close()

        # Store the report next to the script. os.path.join picks the
        # right separator for the platform (the old "\web_crawl.txt"
        # literal only worked on Windows).
        script_dir = os.path.dirname(os.path.realpath(sys.argv[0]))
        report_path = os.path.join(script_dir, "web_crawl.txt")

        # The with-statement closes the file; no explicit close() needed.
        with open(report_path, "w") as f:
            f.write("Google Play Store Web Crawler \n")
            f.write("Metadata for " + app_id + "\n")
            f.write("*************************************** \n")
            f.write("Icon: \n")
            f.write("Title: \n")
            f.write("Description: \n")
            f.write("Screenshots: \n")
            # Added subtitle
            f.write("Subtitle: \n")


# Call web_crawl function
web_crawl("com.cmplay.tiles2")

1条回答

网友

1楼 · 发布于 2024-06-25 23:19:00

我建议你使用 BeautifulSoup。首先，使用以下代码：

import requests
from bs4 import BeautifulSoup

# Fetch the page; replace "url" with the address of the page to scrape.
r = requests.get("url")
# optionally check status code here
# Name the parser explicitly: without it bs4 guesses one from whatever is
# installed and emits a warning, so results can differ between machines.
soup = BeautifulSoup(r.text, "html.parser")

然后就可以通过 soup 对象使用选择器从页面中提取元素。

相关问题更多 >

编程相关推荐

热门问题

热门文章