使用iPython中的for循环和范围函数打开多个文件、创建列表和字典

#!/usr/bin/env ipython import re import itertools import numpy sample = raw_input('sample: ') for i in range(10): filename = sample+'_rand{0}.genes.tajD'.format(i) 'gene{0}key'.format(i) = [] 'taj{0}value'.format(i) = [] with open(filename, 'r') as data: for line in data: line = line.strip().split('\t') gene, taj = line[0], line[3] 'gene{0}key'.format(i).append(gene) 'taj{0}value'.format(i).append(taj) 'dic{0}'.format(i) = dict(itertools.izip('gene{0}key'.format(i),'taj{0}value'.format(i))) outfilename = sample+'_tajD.genes.all' with open(sample+'_rand0.genes.tajD', 'r') as genes, open(outfilename, 'w') as outfile : for line in genes : line = line.strip().split('\t') mastergene = line[0] for i in range(10): 'value{0}'.format(i) = 'dic{0}'.format(i)[mastergene] allrand = [value0, value1, value2, value3, value4, value5, value6, value7, value8, value9] avg = numpy.mean(allrand) outfile.write(mastergene + '\t' + value0 + '\t' + value1 + '\t' + value2 +'\t' + value3 + '\t' + value4 + '\t' + value5 + '\t' + value6 + '\t' + value7 + '\t' + value8 + '\t' + value9 + '\t' + avg + '\n')

1条回答

网友

1楼 · 发布于 2024-09-30 14:36:27

'gene{0}key'.format(i) = []

这是新程序员尝试使用的典型反模式。您需要创建十个名为gene1key、gene2key、gene3key等的变量。正确的方法是使用一个列表或字典，然后使用i作为键索引。重写代码以使其语法正确的最简单方法是：

^{pr2}$

代码可以进一步简化。例如，由于genekeys和tajvalues只用于创建dictionaries，所以您可以直接填充dict而不需要存储中间值。您可以使values成为一个列表，因此您不必在numpy.mean和outfile.write期间显式地处理每个列表。在

dictionaries = {}
for i in range(10):
    filename = sample+'_rand{0}.genes.tajD'.format(i)
    dictionaries[i] = {}
    with open(filename, 'r') as data:
        for line in data:
            line = line.strip().split('\t')
            gene, taj = line[0], line[3]
            dictionaries[i][gene] = taj

with open(sample+'_rand0.genes.tajD', 'r') as genes, open(outfilename, 'w') as outfile :
    for line in genes :
        line = line.strip().split('\t')
        mastergene = line[0]
        values = []
        for i in range(10):
            values.append(dictionaries[i][mastergene])
        #alternative to the above for loop: values = [dictionaries[i][mastergene] for i in range 10]
        avg = numpy.mean(values)
        outfile.write(mastergene + '\t' + '\t'.join(values) + '\t' + avg + '\n')

相关问题更多 >

编程相关推荐

热门问题

热门文章