Mincemeat映射函数返回字典

import glob
import re
from collections import Counter

import mincemeat

# Every file matched under test/ becomes one input record for the map phase.
text_files = glob.glob('test/*')


def file_contents(file_name):
    """Return the entire contents of ``file_name`` as a string."""
    # ``with`` closes the handle even if the read raises.
    with open(file_name) as f:
        return f.read()


# Datasource handed to the server: file name -> full text of that file.
datasource = dict((file_name, file_contents(file_name))
                  for file_name in text_files)


def mapfn(key, value):
    """Yield an ``(author, word)`` pair for every author/word combination.

    Each line of ``value`` is split on ":::". Field 1 is split on "::" to
    obtain the authors; field 2 is the text whose words are emitted.
    Lines with fewer than three ":::"-separated fields are skipped.

    Args:
        key: Datasource key of the record (the file name); unused.
        value: Full text of the file, one record per line.

    Yields:
        Tuples ``(author, word)`` where ``word`` is lower-cased, stripped
        of punctuation, and has any "-" replaced by a space.
    """
    # Imported locally: mincemeat marshals only this function's code to the
    # workers, so module-level imports of this script are not visible there.
    import re

    for line in value.splitlines():
        fields = line.split(":::")
        if len(fields) < 3:
            # Blank or malformed line: nothing to emit (previously IndexError).
            continue
        authors = fields[1].split("::")
        # Drop every character that is not whitespace, a word char, or "-".
        text = re.sub(r'([^\s\w-])+', '', str(fields[2]))
        # Normalise each word once per line instead of once per author.
        words = [word.replace("-", " ").lower() for word in text.split(" ")]
        for author in authors:
            for word in words:
                yield author, word


def reducefn(key, value):
    """Return a ``Counter`` of how often each word occurs in ``value``.

    Args:
        key: The author emitted by ``mapfn``; unused.
        value: List of words emitted for that author.

    Returns:
        ``collections.Counter`` mapping word -> number of occurrences.
    """
    # Imported locally for the same reason as in mapfn.
    from collections import Counter

    return Counter(value)


s = mincemeat.Server()
s.datasource = datasource
s.mapfn = mapfn
s.reducefn = reducefn

results = s.run_server(password="changeme")

# Persist the textual form of the results; ``with`` guarantees the file is
# flushed and closed even if the write fails.
with open('outfile', 'w') as out:
    out.write(str(results))

2条回答

网友

1楼 · 编辑于 2024-06-02 20:07:38

我看到你的代码运行正常。输出类似于 {authorname: Counter({'word1': countofword1, 'word2': countofword2, 'word3': countofword3, …})}。

话虽如此，请删除此处的代码，因为它违反了 Coursera 荣誉准则。

网友

2楼 · 编辑于 2024-06-02 20:07:38

在调用 Counter 之前，先检查 reducefn 中 value 的数据结构。

def reducefn(key, value):
    """Debugging variant: print the raw values, then count them.

    Prints ``value`` exactly as received so its data structure can be
    inspected, then returns a ``Counter`` built from it.
    """
    # Show what the reducer was actually handed before aggregating.
    print(value)
    tally = Counter(value)
    return tally

相关问题更多 >

编程相关推荐

热门问题

热门文章