将多个文件连接到python

#support functions def tail(file_path): last_line = None with open(file_path) as file: line=file.readline() while line: last_line=str(line) line=file.readline() return last_line def wait_for_flush(output_file,tail_in): c = 0 while not file_exists(output_file): sleep(5) c += 1 if c > 100: raise BrokenConcatenation(output_file) tail_out = tail(output_file) while tail_out != tail_in: while not tail_out: sleep(2) tail_out = tail(output_file) c += 1 if c > 100: raise BrokenConcatenation(output_file) tail_out = tail(output_file) c += 1 sleep(2) if c > 100: raise BrokenConcatenation(output_file) def merge_two_files(file1,file2): with open(file1, 'a+') as f1: with open(file2) as f2: line=f2.readline() while line: f1.write(line) line=f2.readline() #forcing disk write f1.flush() os.fsync(f1) #main functions def concat_files(output_file,list_file_paths,stdout_file=None,add_tag=False): print('Concatenating files into ',output_file,flush=True,file=stdout_file) print(output_file) list_files=list(list_file_paths) while len(list_files)>1: file1=list_files.pop(0) file2=list_files.pop(0) merge_two_files(file1,file2) sleep(1) os.remove(file2) list_files.append(file1) final_file=list_files.pop() move_file(final_file,output_file) def concat_files(output_file,list_file_paths,stdout_file=None,add_tag=False): print('Concatenating files into ',output_file,flush=True,file=stdout_file) with open(output_file, 'wb',buffering=0) as wfd: for f in list_file_paths: with open(f,'rb') as fd: shutil.copyfileobj(fd, wfd) #forcing disk write wfd.flush() os.fsync(wfd) sleep(2) def concat_files(output_file,list_file_paths,stdout_file=None,add_tag=False): print('Concatenating files into ',output_file,flush=True,file=stdout_file) with open(output_file, 'w+') as wfd: for f in list_file_paths: with open(f) as fd: line = fd.readline() while line: wfd.write(line) line = fd.readline() if add_tag: tail_in='#'+f+'\n' wfd.write(tail_in) else: tail_in=tail(f) # forcing disk write wfd.flush() os.fsync(wfd) wait_for_flush(output_file,tail_in) #resets file whenever we open file, doesnt work def concat_files(output_file,list_file_paths,stdout_file=None): print('Concatenating files into ',output_file,flush=True,file=stdout_file) for f in list_file_paths: with open(output_file, 'wb') as wfd: with open(f,'rb') as fd: shutil.copyfileobj(fd, wfd) #forcing disk write wfd.flush() os.fsync(wfd) def concat_files(output_file,list_file_paths,stdout_file=None): print('Concatenating files into ',output_file,flush=True,file=stdout_file) with open(output_file, 'w+') as outfile: for f in list_file_paths: with open(f) as infile: line=infile.readline() while line: outfile.write(line) line=infile.readline() #forcing disk write outfile.flush() os.fsync(outfile) def concat_files(output_file,list_file_paths,stdout_file=None): print('Concatenating files into ',output_file,flush=True,file=stdout_file) with open(output_file, 'wb') as wfd: for f in list_file_paths: with open(f,'rb') as fd: shutil.copyfileobj(fd, wfd) #forcing disk write wfd.flush() os.fsync(wfd)

1条回答

网友

1楼 · 发布于 2024-06-30 15:43:23

如果您不想将大文件读入内存，我认为这应该可以：

def concat_files(output_file, list_file_paths):
    print('Concatenating files into', output_file)
    with open(output_file, 'w') as wfd:
        for f in list_file_paths:
            print(f, '...')
            with open(f) as fd:
                for line in fd:
                    wfd.write(line)
                wfd.write(f'eof - {f}\n')  # mod to indicate end of this file
    print('Done.')

这应该将output_file创建为一个新文件，并从list_file_paths读取每个文件，每次一行，写入新文件

更新：请参见mod以指示此文件的结尾

相关问题更多 >

编程相关推荐

热门问题

热门文章