NLTK WordNetLemmatizer 中的多线程？

import nltk
from nltk.corpus import sentiwordnet as swn

# Penn Treebank tag prefixes paired with the single-letter WordNet POS codes
# that are passed to both the lemmatizer and SentiWordNet below.
_PENN_PREFIX_TO_WORDNET = (
    ('NN', 'n'),
    ('JJ', 'a'),
    ('V', 'v'),
    ('R', 'r'),
)


def _wordnet_pos(penn_tag):
    """Return the WordNet POS code for a Penn Treebank tag, or '' if unmapped."""
    for prefix, wn_pos in _PENN_PREFIX_TO_WORDNET:
        if penn_tag.startswith(prefix):
            return wn_pos
    return ''


def SentimentA(doc, file_path):
    """Score each sentence of *doc* with SentiWordNet and pass the scores on.

    The text is split into sentences, each sentence is tokenized and
    POS-tagged, and every token whose tag maps to a WordNet POS (noun,
    adjective, verb, adverb) is lemmatized and looked up in SentiWordNet.
    A token's score is the mean of ``pos_score() - neg_score()`` over all of
    its sentiment synsets; tokens with no synsets contribute nothing.

    Args:
        doc: Raw text to analyse.
        file_path: Not used by this function; kept so existing callers
            keep working.

    Returns:
        Whatever ``SentiCal`` returns when given the list of per-sentence
        score lists (``SentiCal`` is defined elsewhere).
    """
    lemmatizer = nltk.WordNetLemmatizer()
    score_list = []
    for sentence in nltk.sent_tokenize(doc):
        sentence_scores = []
        for word, penn_tag in nltk.pos_tag(nltk.word_tokenize(sentence)):
            wn_pos = _wordnet_pos(penn_tag)
            if not wn_pos:
                # Tags outside noun/adjective/verb/adverb are not scored.
                continue
            # Lemmatize with the token's own POS. Without it the lemmatizer
            # treats every word as a noun, which mangles non-nouns (e.g. the
            # verb "was" becomes "wa") and makes the lookup below miss.
            lemma = lemmatizer.lemmatize(word, pos=wn_pos)
            synsets = list(swn.senti_synsets(lemma, wn_pos))
            if synsets:
                total = sum(
                    syn.pos_score() - syn.neg_score() for syn in synsets
                )
                sentence_scores.append(total / len(synsets))
        # One entry per sentence, even when no token in it was scored.
        score_list.append(sentence_scores)
    return SentiCal(score_list)

1条回答

网友

1楼 · 发布于 2024-06-18 03:42:38

快速破解：

import nltk
from nltk.corpus import sentiwordnet as swn
# Run this once, up front, before the rest of the program: pulling the first
# item from all_senti_synsets() forces the lazily-loaded `swn` corpus object
# (a LazyCorpusLoader) to actually load ("materialize") itself.
# NOTE(review): presumably this has to happen before any worker threads
# start using the corpus -- confirm against the threading setup.
next(swn.all_senti_synsets()) 

# Your other code here.

更多细节稍后补充……我还在打字。

相关问题更多 >

编程相关推荐

热门问题

热门文章