比较字典中的值，并根据值对每个值进行处理

import csv


def readcsv(filename, column):
    """Return the values of one column of a CSV file, in file order.

    Args:
        filename: Path of the comma-delimited file to read.
        column: Zero-based index of the field to take from every row.

    Returns:
        A list of strings, one per row. Every row is included; no header
        detection is performed.

    Raises:
        IndexError: If a row has fewer than ``column + 1`` fields.
    """
    # newline="" is the mode the csv module asks for. The former "rU" mode
    # was removed in Python 3.11, where it makes open() raise ValueError.
    # The with-block also closes the file if reading fails part-way.
    with open(filename, newline="") as handle:
        return [row[column] for row in csv.reader(handle, delimiter=",")]


def makeDict(id, fileName, detDate):
    """Build ``{id: [fileName, detDate]}`` from three parallel sequences.

    The sequences are paired positionally with zip(), so the result is
    truncated to the shortest one. When an id occurs more than once, the
    last occurrence overwrites the earlier ones.

    Args:
        id: Sequence of keys.
        fileName: Sequence of file names, aligned with ``id``.
        detDate: Sequence of dates, aligned with ``id``.

    Returns:
        A dict mapping each id to a two-item list ``[fileName, detDate]``.
    """
    return {key: [name, date] for key, name, date in zip(id, fileName, detDate)}


# Guarded so that importing this module does not try to read jul.csv;
# running the file as a script behaves as before.
if __name__ == "__main__":
    id = readcsv("jul.csv", 2)
    fileName = readcsv("jul.csv", 1)
    detDate = readcsv("jul.csv", 0)
    mainDict = makeDict(id, fileName, detDate)

Date             fileURL                        ID
7/24/2018 16:04  https://localhost/file1.docx   2599302
7/24/2018 16:03  https://localhost/file3.docx   2349302
7/24/2018 16:01  https://localhost/file1.docx   2599302
7/24/2018 16:04  https://localhost/fil232.xml   2599303
7/24/2018 16:03  https://localhost/file1.docx   2349333
7/24/2018 16:01  https://localhost/file3.docx   2529374

import csv
from datetime import datetime

# Timestamp layout used by the sample data, e.g. "7/24/2018 16:04".
_DATE_FORMAT = "%m/%d/%Y %H:%M"

# Result lists filled in by getLatestID(). They were referenced but never
# defined before, so the first call raised NameError.
moveDupeList = []    # ids superseded by a newer entry for the same file
moveProperList = []  # the newest id found for each distinct file name


def readcsv(filename, column):
    """Return the values of one column of a CSV file, in file order.

    Args:
        filename: Path of the comma-delimited file to read.
        column: Zero-based index of the field to take from every row.

    Returns:
        A list of strings, one per row. Every row is included; no header
        detection is performed.

    Raises:
        IndexError: If a row has fewer than ``column + 1`` fields.
    """
    # newline="" is the mode the csv module asks for. The former "rU" mode
    # was removed in Python 3.11, where it makes open() raise ValueError.
    with open(filename, newline="") as handle:
        return [row[column] for row in csv.reader(handle, delimiter=",")]


def makeDict(id, fileName, detDate):
    """Build ``{id: [fileName, detDate]}`` from three parallel sequences.

    The sequences are paired positionally with zip(), so the result is
    truncated to the shortest one. When an id occurs more than once, the
    last occurrence overwrites the earlier ones.
    """
    return {key: [name, date] for key, name, date in zip(id, fileName, detDate)}


def groupKeys(mainDict):
    """Group the keys of ``mainDict`` by file name.

    Args:
        mainDict: Mapping of id to a two-item ``[fileName, detDate]`` value,
            as produced by makeDict().

    Returns:
        A dict mapping each file name to the list of ids that carry it, in
        the iteration order of ``mainDict``.

    Raises:
        ValueError: If a value does not hold exactly two items.
    """
    same_filename = {}
    for key, (name, _date) in mainDict.items():
        same_filename.setdefault(name, []).append(key)
    return same_filename


def _recency_key(key, mainDict):
    """Return a sortable ``(timestamp, numeric id, id text)`` triple for ``key``.

    Dates and ids are compared by value rather than as text, because
    "7/3/2018" sorts after "7/24/2018" and "999" after "1000" when compared
    as strings.
    """
    try:
        stamp = datetime.strptime(mainDict[key][1], _DATE_FORMAT)
    except (TypeError, ValueError):
        # A date that does not match _DATE_FORMAT (for instance a header
        # cell) ranks as the oldest possible entry instead of aborting.
        stamp = datetime.min
    try:
        numeric_id = int(key)
    except (TypeError, ValueError):
        numeric_id = -1  # non-numeric ids fall back to text order below
    return stamp, numeric_id, str(key)


def getLatestID(same_filename, mainDict):
    """Split the ids of each file into "latest" and "duplicate" entries.

    For every file name, the id with the most recent date is appended to the
    module-level ``moveProperList``; when dates tie, the highest id wins.
    All other ids for that file are appended to ``moveDupeList``.

    Args:
        same_filename: Mapping of file name to list of ids, as returned by
            groupKeys().
        mainDict: Mapping of id to ``[fileName, detDate]``.

    Returns:
        None. Results accumulate in ``moveProperList`` and ``moveDupeList``.
    """
    for ids in same_filename.values():
        if not ids:
            continue  # nothing to rank for this file name
        latest = max(ids, key=lambda key: _recency_key(key, mainDict))
        moveProperList.append(latest)
        moveDupeList.extend(key for key in ids if key != latest)


# Guarded so that importing this module does not try to read jul.csv;
# running the file as a script behaves as before.
if __name__ == "__main__":
    id = readcsv("jul.csv", 2)
    fileName = readcsv("jul.csv", 1)
    detDate = readcsv("jul.csv", 0)
    mainDict = makeDict(id, fileName, detDate)
    same_filename = groupKeys(mainDict)
    getLatestID(same_filename, mainDict)

1条回答

网友

1楼 · 发布于 2024-10-01 09:18:00

一个起点可以是构建另一个字典，为每个文件名提供所有对应键（id）的列表：

# Sample input: id -> [date, file URL].
data = {
    2349302: ['7/24/2018 16:03', 'https://localhost/file3.docx'],
    2349333: ['7/24/2018 16:03', 'https://localhost/file1.docx'],
    2529374: ['7/24/2018 16:01', 'https://localhost/file3.docx'],
    2599302: ['7/24/2018 16:01', 'https://localhost/file1.docx'],
    2599303: ['7/24/2018 16:04', 'https://localhost/fil232.xml'],
}

# Collect, for every file URL, the ids that refer to it.
similar_filename = {}
for key, (date, name) in data.items():
    # setdefault creates the list on the first sighting of a URL.
    similar_filename.setdefault(name, []).append(key)


similar_filename
>>> {'https://localhost/fil232.xml': [2599303],
 'https://localhost/file1.docx': [2599302, 2349333],
 'https://localhost/file3.docx': [2529374, 2349302]}

以上解决了你的第一个问题。

相关问题更多 >

编程相关推荐

热门问题

热门文章