修补文本文件

# filename = name of the diff file # date = extra information to be added as a prefix to each added line def process_diff(filename, date): # that's the file all the patches will be applied to merge_file = open("thesis_merged.txt", "r") # map its content to a list to manipulate it in memory merge_file_lines = [] for line in merge_file: line = line.rstrip() merge_file_lines.append(line) merge_file.close() # open for writing: merge_file = open("thesis_merged.txt", "w") # that's the diff file, containing all the changes diff_file = open(filename, "r") print "-", filename, "-" * 20 # also map it to a list diff_file_lines = [] for line in diff_file: line = line.rstrip() if not line.startswith("\\ No newline at end of file"): # useless information ... or not? diff_file_lines.append(line) # ignore header: #--- thesis_words_0.txt 2010-12-04 18:16:26.020000000 +0100 #+++ thesis_words_1.txt 2010-12-04 18:16:26.197000000 +0100 diff_file_lines = diff_file_lines[2:] hunks = [] for i, line in enumerate(diff_file_lines): if line.startswith("@@"): hunks.append( get_hunk(diff_file_lines, i) ) for hunk in hunks: head = hunk[0] # @@ -252,10 +251,9 @@ tmp = head[3:-3].split(" ") # [-252,10] [+251,9] line_nr_minus = tmp[0].split(",")[0] line_nr_minus = int(line_nr_minus[1:]) # 252 line_nr_plus = tmp[1].split(",")[0] line_nr_plus = int(line_nr_plus[1:]) # 251 for j, line in enumerate(hunk[1:]): if line.startswith("-"): # delete line from the file in memory del merge_file_lines[line_nr_minus-1] plus_counter = 0 # counts the number of added lines for k, line in enumerate(hunk[1:]): if line.startswith("+"): # insert line, one after another merge_file_lines.insert((line_nr_plus-1)+plus_counter, line[1:]) plus_counter += 1 for line in merge_file_lines: # write the updated file back to the disk merge_file.write(line.rstrip() + "\n") merge_file.close() diff_file.close() print "\n\n" def get_hunk(lines, i): hunk = [] hunk.append(lines[i]) # @@ -252,10 +251,9 @@ lines = lines[i+1:] for line in lines: if line.startswith("@@"): # next hunk begins, so stop here break else: hunk.append(line) return hunk

2条回答

网友

1楼 · 编辑于 2024-06-17 23:35:54

尝试使用来自python-patch的解析器-至少您可以手动逐个应用hunks来查看哪个失败了。API不稳定，但解析器是稳定的，所以您可以复制补丁.py从主干/到你的项目。不过，如果能得到一些关于所需API的建议，那就太好了。在

网友

2楼 · 编辑于 2024-06-17 23:35:54

代码中确实有一个错误，我没有正确地解释diff文件（当一个diff文件中有多个hunk时，没有意识到需要进行换行）

def process_diff(filename, date, step_nr):
    merge_file = open("thesis_merged.txt", "r")
    merge_file_lines = [line.rstrip() for line in merge_file]
    merge_file.close()

    diff_file = open(filename, "r")
    print "-", filename, "-"*2, step_nr, "-"*2, date

    diff_file_lines = [line.rstrip() for line in diff_file]
    hunks = []
    for i, line in enumerate(diff_file_lines):
        if line.startswith("@@"):
            hunks.append( get_hunk(diff_file_lines, i) )
    diff_file.close()

    line_shift = 0
    for hunk in hunks:
        head = hunk[0]
        # @@ -252,10 +251,9 @@
        tmp = head[3:-3].split(" ") # [-252,10] [+251,9]

        line_nr_minus = tmp[0].split(",")[0]
        minusses = 1
        if len( tmp[0].split(",") ) > 1:
            minusses = int( tmp[0].split(",")[1] )
        line_nr_minus = int(line_nr_minus[1:]) # 252

        line_nr_plus = tmp[1].split(",")[0]
        plusses = 1
        if len( tmp[1].split(",") ) > 1:
            plusses = int( tmp[1].split(",")[1] )
        line_nr_plus = int(line_nr_plus[1:]) # 251

        line_nr_minus += line_shift

        #@@ -248,3 +249 @@
        #-already
        #-proposes,
        #-"generative"
        #+generative

        if hunk[1]: # -
            for line in hunk[1]:
                del merge_file_lines[line_nr_minus-1]

        plus_counter = 0
        if hunk[2]: # +
            for line in hunk[2]:
                prefix = ""
                if len(line) > 1:
                    prefix = "{" + date + "}"
                merge_file_lines.insert((line_nr_plus-1)+plus_counter, prefix + line[1:])
                plus_counter += 1

        line_shift += plusses - minusses

相关问题更多 >

编程相关推荐

热门问题

热门文章