在Python中出现异常时继续

def get_readability_data(db, url, doc_id, rank, index):
    """Fetch ``url``, compute textstat readability scores, and save them.

    The page is downloaded, reduced to its main article markup via
    ``Document(...).summary()``, converted to plain text with BeautifulSoup,
    and scored with the ``textstat`` functions. The resulting dict is stored at
    ``doc['search_details']['search_details'][index]['readability']`` on the
    document returned by ``db.get(doc_id)``, which is then written back with
    ``db.save``.

    Args:
        db: Database handle; only ``db.get(doc_id)`` and ``db.save(doc)`` are
            used here.
        url: Address of the page to download and score.
        doc_id: Identifier of the document that receives the scores.
        rank: Stored as-is under the ``'rank'`` key of the saved scores.
        index: Position inside ``doc['search_details']['search_details']``
            whose ``'readability'`` entry is replaced.

    Returns:
        None. On an HTTP error the status code is printed and nothing is
        saved. Any other ``Exception`` raised while scoring or saving is
        reported through ``write_to_page`` and swallowed, so a caller looping
        over many URLs keeps going.
    """
    readability_data = {}
    readability_data['url'] = url
    readability_data['rank'] = rank

    user_agent = 'Mozilla/5.0 (Windows NT 6.1; Win64; x64)'
    headers = {'User-Agent': user_agent}

    try:
        # Hand the headers to the request so the browser-like User-Agent is
        # actually sent instead of urllib's default one.
        req = urllib.request.Request(url, headers=headers)
        # The context manager closes the connection once the body is read.
        with urllib.request.urlopen(req) as response:
            content = response.read()
    except urllib.error.HTTPError as err:
        print(err.code)
        return

    readable_article = Document(content).summary()
    soup = BeautifulSoup(readable_article, "lxml")
    text = soup.body.get_text()

    try:
        readability_data['flesch_reading_ease'] = textstat.flesch_reading_ease(text)
        readability_data['smog_index'] = textstat.smog_index(text)
        readability_data['flesch_kincaid_grade'] = textstat.flesch_kincaid_grade(text)
        readability_data['coleman_liau'] = textstat.coleman_liau_index(text)
        readability_data['automated_readability_index'] = textstat.automated_readability_index(text)
        readability_data['dale_chall_score'] = textstat.dale_chall_readability_score(text)
        # NOTE: the stored key is spelled 'linear_write_formula'; it is kept
        # unchanged so previously saved documents stay consistent.
        readability_data['linear_write_formula'] = textstat.linsear_write_formula(text)
        readability_data['gunning_fog'] = textstat.gunning_fog(text)
        readability_data['total_words'] = textstat.lexicon_count(text)
        readability_data['difficult_words'] = textstat.difficult_words(text)
        readability_data['syllables'] = textstat.syllable_count(text)
        readability_data['sentences'] = textstat.sentence_count(text)
        readability_data['readability_consensus'] = textstat.text_standard(text)
        readability_data['readability_scores_date'] = time.strftime("%a %b %d %H:%M:%S %Y")

        # Use the doc_id to make sure the scores land on the right document.
        doc = db.get(doc_id)
        doc['search_details']['search_details'][index]['readability'] = readability_data
        db.save(doc)
        time.sleep(.5)
    except Exception as exc:
        # Report the exception class and carry on. Unlike a bare ``except:``,
        # this lets KeyboardInterrupt and SystemExit propagate so a long run
        # can still be stopped.
        write_to_page("<p>---ERROR---: %s</p>" % type(exc))

if __name__ == '__main__':
    # Script entry point: connect to the database, then score every URL
    # attached to every document id it returns.
    db = connect_to_db(parse_args())
    print("~~~~~~~~~~" + " GETTING IDs " + "~~~~~~~~~~")
    for doc_key in get_ids(db):
        for entry in get_urls(db, doc_key):
            get_readability_data(
                db,
                entry['url'],
                entry['id'],
                entry['rank'],
                entry['index'],
            )

1条回答

网友

1楼 · 发布于 2024-09-28 22:30:31

通常，try: except: 块应当保持得越小越好。我会把你的每个 textstat 函数用一个装饰器包装起来，由它捕获预期的异常，并同时返回函数的输出和捕获到的异常。

例如：

def catchExceptions(exception):
    """Build a decorator that returns errors as values instead of raising.

    The decorated function returns a ``(result, error)`` pair:
    ``(retval, None)`` when the call succeeds, or ``(None, exc)`` when it
    raises an exception matching ``exception``. Exceptions of any other type
    propagate unchanged.

    Args:
        exception: An exception class, or a tuple of classes, to catch.

    Returns:
        A decorator to apply to the function being guarded.
    """
    import functools  # local import keeps this snippet self-contained

    def decorator(func):
        # Preserve the wrapped function's __name__, __doc__, etc.
        @functools.wraps(func)
        def wrapper(*args, **kwargs):
            try:
                retval = func(*args, **kwargs)
            except exception as e:
                return None, e
            else:
                return retval, None
        return wrapper
    return decorator

@catchExceptions(ZeroDivisionError)
def testfunc(x):
    """Divide 11 by ``x``.

    Because of the decorator, a ZeroDivisionError is handed back as the
    second element of the returned pair instead of being raised.
    """
    quotient = 11/x
    return quotient

# Single-argument print(...) calls run unchanged on Python 2 and Python 3.
print(testfunc(0))  # division by zero: the error comes back in the pair
print('  -')
print(testfunc(3))  # successful call: the error slot is None

输出：

(None, ZeroDivisionError('integer division or modulo by zero',))
  -
(3, None)

相关问题更多 >

编程相关推荐

热门问题

热门文章