如何在CSV文件中只选择一行？

# Extract selected columns of one CSV row into separate files.
#
# Usage: <script> <csv filename> <uuid> <target row>
# The target row is counted from 1. Written for Python 3 (text-mode csv).
import csv
import itertools
import sys

f = sys.argv[1]
uuid = sys.argv[2]
target_row = sys.argv[3]
tmpdir = "/tmp/pagekicker/"
folder = tmpdir + uuid
destination1 = folder + '/csv/row.editedby'
destination3 = folder + '/csv/row.booktitle'
destination4 = folder + '/csv/row.seeds'
destination5 = folder + '/csv/row.imprint'

target_row = int(target_row)

try:
    # newline='' lets the csv module handle line endings itself.
    with open(f, newline='') as csv_file:
        reader = csv.reader(csv_file)
        # islice(reader, n - 1, n) yields exactly the nth row; the original
        # islice(reader, 1, 1) was an empty slice and never yielded a row.
        row = next(itertools.islice(reader, target_row - 1, target_row), None)

    if row is None:
        sys.exit('row %d not found in %s' % (target_row, f))

    editedby = row[0]  # column 2 (row[1]) is deliberately discarded
    booktitle = row[2]
    print(row[2])
    seeds = row[3]
    imprint = row[4]

    # The with statement closes every output file even if a write fails.
    with open(destination1, 'w') as f1, \
            open(destination3, 'w') as f3, \
            open(destination4, 'w') as f4, \
            open(destination5, 'w') as f5:
        f1.write(editedby)
        f3.write(booktitle)
        f4.write(seeds)
        f5.write(imprint)
finally:
    print('done')

2条回答

网友

1楼 · 编辑于 2024-10-04 09:31:30

假设您从1（而不是0）开始计算行数，下面是一个独立的函数来执行此操作：

import csv
import itertools
import os
import sys
from contextlib import contextmanager

@contextmanager
def multi_file_manager(files, mode='r'):
    """Open several files at once and close all of them on exit.

    Args:
        files: Iterable of paths to open.
        mode: Mode string passed to ``open`` for every path.

    Yields:
        A list of open file objects, in the same order as ``files``.

    Every file that was successfully opened is closed when the ``with``
    block ends, even if the block raises or opening a later path fails.
    """
    opened = []
    try:
        for path in files:
            opened.append(open(path, mode))
        yield opened
    finally:
        # Runs on normal exit, on an exception inside the with body, and
        # when one of the open() calls above fails part-way through.
        for handle in opened:
            handle.close()

# This is the standalone function
def csv_read_row(filename, n):
    """Read and return the nth row of a csv file, counting from 1.

    Args:
        filename: Path of the csv file to read.
        n: 1-based index of the row to return.

    Returns:
        The row as a list of strings, as produced by ``csv.reader``.

    Raises:
        ValueError: If ``n`` is less than 1 (rejected by ``islice``).
        StopIteration: If the file has fewer than ``n`` rows.
    """
    # Text mode with newline='' is what the csv module expects on Python 3;
    # a file opened in binary mode makes csv.reader raise an error.
    with open(filename, newline='') as f:
        reader = csv.reader(f)
        return next(itertools.islice(reader, n - 1, n))

# Command-line driver: copy four columns of one csv row into separate files
# under /tmp/pagekicker/<uuid>/csv/.
if len(sys.argv) != 4:
    print('usage: utility <csv filename> <uuid> <target row>')
    sys.exit(1)

tmpdir = "/tmp/pagekicker"
f = sys.argv[1]
uuid = sys.argv[2]
target_row = int(sys.argv[3])
folder = os.path.join(tmpdir, uuid)

destinations = [os.path.join(folder, 'csv', name)
                for name in ('row.editedby',
                             'row.booktitle',
                             'row.seeds',
                             'row.imprint')]

# Source column for each destination, in the same order (editedby,
# booktitle, seeds, imprint); column 1 is not written anywhere.
columns = (0, 2, 3, 4)

# Read the row before opening the outputs: opening with mode 'w' truncates
# the files, so a missing row must not leave them emptied.
row = csv_read_row(f, target_row)

with multi_file_manager(destinations, mode='w') as files:
    for out_file, column in zip(files, columns):
        out_file.write(row[column] + '\n')

网友

2楼 · 编辑于 2024-10-04 09:31:30

csv 库的 DictReader 对象可以通过 line_num 属性给出当前已读取到的行号：

# csv_file is assumed to be an already-open file object for the CSV file.
reader = csv.DictReader(csv_file)
# line_num reports how many lines have been read from the source so far;
# per the csv docs this can differ from the number of records returned,
# because a single record may span several lines.
reader.line_num

您可以迭代，直到找到所需的正确行号，如下所示：

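for row in reader:
    if reader.line_num == target_row:
        # row is the record that ends on the requested line
        break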

DictReader 类还会把 CSV 文件的第一行当作列标题，之后就可以按列名访问每一行中的字段，如下所示：

# A DictReader is not subscriptable; each row it yields is a dict keyed
# by the column titles taken from the first line of the file.
for row in reader:
    value = row["title_of_column1"]

这也许还能为您省去一些工作。另外，在处理文件时，您应该使用 Python 的 with 语句块，如下所示：

# Assumes target_row counts rows starting from 1.
target_row = int(target_row)

# The with statement closes every file when the block ends, even on error.
# newline='' lets the csv module handle line endings itself (Python 3).
with open(f, newline='') as csv_file, \
        open(destination1, 'w') as f1, \
        open(destination3, 'w') as f3, \
        open(destination4, 'w') as f4, \
        open(destination5, 'w') as f5:
    reader = csv.reader(csv_file)  # creates the reader object
    # islice(reader, n - 1, n) yields only the nth row; the original
    # islice(reader, 1, 1) was an empty slice and yielded nothing.
    for row in itertools.islice(reader, target_row - 1, target_row):
        editedby = row[0]  # column 2 (row[1]) is deliberately discarded
        booktitle = row[2]
        print(row[2])
        seeds = row[3]
        imprint = row[4]
        f1.write(editedby)
        f3.write(booktitle)
        f4.write(seeds)
        f5.write(imprint)

这样你就不用担心把它们都关上了

相关问题更多 >

编程相关推荐

热门问题

热门文章