多词搜索无法正常工作（Python）

def start(): location = raw_input("What is the folder containing the data you like processed located? ") #location = "C:/Code/Samples/Dates/2015-06-07/Large-Scale Data Parsing/Data Files" if os.path.exists(location) == True: #Tests to see if user entered a valid path file_extension = raw_input("What is the file type (.txt for example)? ") search_for(location,file_extension) else: print "I'm sorry, but the file location you have entered does not exist. Please try again." start() def search_for(location,file_extension): querylist = [] n = 5 while n == 5: search_query = raw_input("What would you like to search for in each file? Use'Done' to indicate that you have finished your request. ") #list = ["CD90-N5722-15C", "CD90-NB810-4C", "CP90-N2475-8", "CD90-VN530-22B"] if search_query == "Done": print "Your queries are:",querylist print "" content = os.listdir(location) run(content,file_extension,location,querylist) n = 0 else: querylist.append(search_query) continue def run(content,file_extension,location,querylist): for item in content: if item.endswith(file_extension): search(location,item,querylist) quit() def search(location,item,querylist): with open(os.path.join(location,item), 'r') as f: countlist = [] for search in querylist: #any search value after the first one is incorrectly reporting "0" countsearch = 0 for line in f: if search in line: countsearch = countsearch + 1 countlist.append(search) countlist.append(countsearch) #mechanism to update countsearch is not working for any value after the first print item, countlist start()

def check_start(): #location = raw_input("What is the folder containing the data you like processed located? ") location = "C:/Code/Samples/Dates/2015-06-07/Large-Scale Data Parsing/Data Files" content = os.listdir(location) for item in content: if item.endswith("processed"): countcol1 = 0 countcol2 = 0 countcol3 = 0 countcol4 = 0 #print os.path.join(currentdir,item) with open(os.path.join(location,item), 'r') as f: for line in f: if "CD90-N5722-15C" in line: countcol1 = countcol1 + 1 if "CD90-NB810-4C" in line: countcol2 = countcol2 + 1 if "CP90-N2475-8" in line: countcol3 = countcol3 + 1 if "CD90-VN530-22B" in line: countcol4 = countcol4 + 1 print item, "CD90-N5722-15C", countcol1, "CD90-NB810-4C", countcol2, "CP90-N2475-8", countcol3, "CD90-VN530-22B", countcol4

2条回答

网友
1楼 · 编辑于 2024-09-30 22:19:02

我不确定我是否完全理解了你的问题，不过像下面这样写怎么样？
def check_start(): raw_search_terms = raw_input('Enter search terms seperated by a comma:') search_term_list = raw_search_terms.split(',') #location = raw_input("What is the folder containing the data you like processed located? ") location = "C:/Code/Samples/Dates/2015-06-07/Large-Scale Data Parsing/Data Files" content = os.listdir(location) for item in content: if item.endswith("processed"): # create a dictionary of search terms with their counts (initialized to 0) search_term_count_dict = dict(zip(search_term_list, [0 for s in search_term_list])) for line in f: for s in search_term_list: if s in line: search_term_count_dict[s] += 1 print item for key, value in search_term_count_dict.iteritems() : print key, value

网友
2楼 · 编辑于 2024-09-30 22:19:02

您正在尝试对同一个文件进行多次迭代。第一次迭代之后，文件指针已经位于文件末尾，因此后续的搜索都会失败，因为已经没有任何内容可供读取。
如果添加一行 f.seek(0)，就会在下一次读取之前把文件指针重置到文件开头：
# NOTE(review): the line breaks and indentation of this snippet were lost in
# the paste; the layout below is reconstructed, and f.seek(0) is assumed to
# sit inside the per-query loop -- confirm.
def search(location,item,querylist):
    """Print item followed by a flat list of [query, line count, query, line count, ...].

    location: folder containing the file.
    item: file name inside location.
    querylist: strings to look for; each line containing a query adds one to
        that query's count.
    """
    with open(os.path.join(location,item), 'r') as f:
        countlist = []
        for search in querylist: # one full pass over the file per search value
            countsearch = 0
            for line in f:
                if search in line:
                    countsearch = countsearch + 1
            countlist.append(search)
            countlist.append(countsearch) # the query and its count are stored as consecutive entries
            # Rewind to the start of the file so the next search value has lines to read.
            f.seek(0)
        print item, countlist
另外，代码的缩进是我猜的……你真的不应该使用制表符。

相关问题更多 >

编程相关推荐

热门问题

热门文章