Scraping skips some page URLs and does not write all values to the CSV

Posted on 2024-10-01 00:20:30


I'm new to Python; I only started yesterday. I want to scrape a website and collect the data into a dictionary. All imports are added at the top of the Python script.

title_and_urls = {} #dictionary
totalNumberOfPages = 12
for x in range(1,int(totalNumberOfPages)+1):
    url_pages = 'https://abd.com/api?&page=' +str(x)+'&year=2017'
    resp = requests.get(url_pages, timeout=60)
    soup = BeautifulSoup(resp.text, 'lxml')
    for div in soup.find_all('div', {"class": "block2"}):
        a = div.find('a')
        h3 = a.find('h3')
        print(h3,url_pages) # prints correctly
        title_and_urls[h3.text] = base_enthu_url+a.attrs['href']

print(title_and_urls)


with open('dict.csv', 'wb') as csv_file:
    writer = csv.writer(csv_file)
    for key, value in title_and_urls.items():
       writer.writerow([key, value])

There are a couple of problems here:

1. I have 12 pages in total, but it skips pages 7 and 8.
2. The print line print(h3,url_pages) prints 60 items, while the CSV file ends up with only 36.
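For reference, the second symptom is exactly what happens when several pages yield the same h3.text: a dict keeps one value per key, so later entries overwrite earlier ones. A minimal sketch with made-up titles (hypothetical data, not from the real site):

title_and_urls = {}
scraped = [('Intro', '/p1/a'), ('Intro', '/p7/b'), ('Outro', '/p2/c')]  # 'Intro' repeats
for title, href in scraped:
    print(title, href)            # three lines are printed...
    title_and_urls[title] = href  # ...but 'Intro' is stored only once

print(len(scraped), len(title_and_urls))  # 3 2 -> fewer CSV rows than prints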

I'd appreciate any help and explanations. Please also suggest best practices.


Tags: and, csv, in, div, url, for, title, pages
1 Answer
User
#1 · Posted on 2024-10-01 00:20:30

Wrap each page request in a try/except block:

title_and_urls = {}  # dictionary of title -> full url
totalNumberOfPages = 12
for x in range(1, int(totalNumberOfPages) + 1):
    try:
        url_pages = 'https://abd.com/api?&page=' + str(x) + '&year=2017'
        resp = requests.get(url_pages, timeout=60)
        soup = BeautifulSoup(resp.text, 'lxml')
        for div in soup.find_all('div', {"class": "block2"}):
            a = div.find('a')
            h3 = a.find('h3')
            print(h3, url_pages)
            title_and_urls[h3.text] = base_enthu_url + a.attrs['href']
    except Exception as e:
        print('page', x, 'failed:', e)  # log instead of failing silently


with open('dict.csv', 'w', newline='') as csv_file:  # 'w' with newline='' for Python 3
    writer = csv.writer(csv_file)
    for key, value in title_and_urls.items():
        writer.writerow([key, value])
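
Two follow-up notes on the symptoms from the question. First, a bare except: pass hides exactly which pages failed, which is how pages 7 and 8 can vanish without a trace; logging the page number (or retrying) makes the skips visible. Second, the CSV has fewer rows than the print statements because title_and_urls is a dict keyed on h3.text, so repeated titles overwrite one another. A minimal sketch of both fixes, assuming Python 3, the same page markup, and the base_enthu_url prefix from the question (the retry count of 3 is an arbitrary choice):

import csv

import requests
from bs4 import BeautifulSoup

base_enthu_url = 'https://abd.com'  # assumption: the prefix defined earlier in the asker's script

rows = []  # a list of (title, url) tuples keeps duplicates instead of overwriting them
for x in range(1, 13):
    url_pages = 'https://abd.com/api?&page=' + str(x) + '&year=2017'
    for attempt in range(3):  # retry a flaky page a few times before giving up
        try:
            resp = requests.get(url_pages, timeout=60)
            resp.raise_for_status()  # treat HTTP errors (404, 500, ...) as failures too
            break
        except requests.RequestException as e:
            print('page', x, 'attempt', attempt + 1, 'failed:', e)
    else:
        continue  # every attempt failed; move on, but the log above says which page

    soup = BeautifulSoup(resp.text, 'lxml')
    for div in soup.find_all('div', {'class': 'block2'}):
        a = div.find('a')
        if a is None:
            continue  # skip blocks without the expected markup
        h3 = a.find('h3')
        if h3 is None:
            continue
        rows.append((h3.text.strip(), base_enthu_url + a.attrs['href']))

with open('dict.csv', 'w', newline='') as csv_file:  # Python 3 csv idiom
    writer = csv.writer(csv_file)
    writer.writerows(rows)

With a list of tuples the CSV row count matches the number of printed items; if unique titles are actually wanted, deduplicate deliberately (for example with a set of seen titles) rather than as a side effect of dict keys.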
