如何一次读多行？（练习稿）

def get_fasta_seqs(BIGFILE):
    """Index the records of a FASTA file by 0-based line number.

    The file is streamed once, line by line, so only the index (three lists
    of integers) is held in memory.

    Args:
        BIGFILE: Path of the FASTA file to scan.

    Returns:
        A ``fileseq`` object built from four values: the line numbers of the
        ``>`` header lines, the first sequence line of each record
        (header + 1), the last line of each record, and the record count.
    """
    seq_name = []
    seq_start = []
    seq_end = []
    last_line = -1
    with open(BIGFILE) as f:
        for cnt, line in enumerate(f):
            last_line = cnt
            if line.startswith('>'):
                # A new header closes the previous record, if there was one.
                if seq_name:
                    seq_end.append(cnt - 1)
                seq_name.append(cnt)
                seq_start.append(cnt + 1)
    # Close the final record; skipped when no header was found so the three
    # lists always stay the same length.
    if seq_name:
        seq_end.append(last_line)
    return fileseq(seq_name, seq_start, seq_end, len(seq_name))


def fasta_rev_compliment(fasta_read, fasta_write="default", NTtype="DNA"):
    """Write the reverse complement of every record in a FASTA file.

    Each header line is copied unchanged. The sequence lines of a record are
    emitted in reverse order, each one reverse-complemented, which together
    gives the reverse complement of the whole record.

    Args:
        fasta_read: Path of the input FASTA file.
        fasta_write: Path of the output file. With the value ``"default"``
            the name is derived from ``fasta_read`` by replacing a trailing
            ``.fasta`` with ``_RC.fasta``.
        NTtype: Passed through to ``reverse_compliment`` as ``NTtype``.
    """
    if fasta_write == 'default':
        # Only strip the extension when it is really there; blindly cutting
        # six characters mangles any other file name.
        base = fasta_read[:-6] if fasta_read.endswith('.fasta') else fasta_read
        fasta_write = base + "_RC.fasta"

    # Build the index once; it does not change while the output is written.
    seq_map = get_fasta_seqs(fasta_read)
    print(seq_map.seq_name)

    # Mode 'a' is kept from the original: output is appended to an existing file.
    with open(fasta_write, 'a') as f:
        records = zip(seq_map.seq_name, seq_map.seq_start, seq_map.seq_end)
        for name_line, start, end in records:
            # The index is 0-based; getline is called with +1.
            # NOTE(review): presumably linecache.getline (1-based, and it
            # caches the whole file in memory) -- confirm against the imports.
            f.write(getline(fasta_read, name_line + 1))
            for seqline in reversed(range(start, end + 1)):
                seq = getline(fasta_read, seqline + 1).replace('\n', '')
                f.write(reverse_compliment(seq, NTtype=NTtype) + '\n')


fasta_rev_compliment('BIGFILE.fasta')

# Excerpt of the per-record loop from fasta_rev_compliment above.
for i in range(seq_map.seqcount):  # THIS IS WHAT I WANT TO CHANGE
    # seq_name holds 0-based line numbers; getline is called with +1.
    line = getline(fasta_read, seq_map.seq_name[i] + 1)  # getline is reading it as 1 indexed?
    f.write(line)
    # NOTE(review): this re-scans the whole file for every record and the
    # result is never used in this excerpt.
    my_fasta_seqs = get_fasta_seqs(fasta_read)
    # Walk the record's sequence lines from last to first.
    for seqline in reversed(range(seq_map.seq_start[i], seq_map.seq_end[i] + 1)):
        seq = getline(fasta_read, seqline + 1)

def fasta_rev_compliment(fasta_read, fasta_write="default", NTtype="DNA",
                         lines_to_record_before_flushing=5):
    """Sketch of the desired variant that processes several lines per batch.

    ``lines_to_record_before_flushing`` is the number of lines the author
    wants to handle before releasing them from memory; the code below does
    not use it yet.
    """
    ###MORE CODE###
    # I want something like this:
    for i in range(seq_map.seqcount):  # THIS IS WHAT I WANT TO CHANGE
        # Is there a way to load several lines at once here?
        line = getline(fasta_read, seq_map.seq_name[i] + 1)  # getline is reading it as 1 indexed?
        f.write(line)
        # NOTE(review): this re-scans the whole file for every record and the
        # result is never used in this sketch.
        my_fasta_seqs = get_fasta_seqs(fasta_read)
        for seqline in reversed(range(seq_map.seq_start[i], seq_map.seq_end[i] + 1)):
            seq = getline(fasta_read, seqline + 1)
            # Repeat n = 5 (or other specified number) times until flushing RAM.

1条回答

网友

1楼 · 发布于 2024-10-04 01:32:31

下面是一个获取 FASTA 文件反向互补序列（reverse complement）的示例，也许你可以从中得到一些思路。

import re

file = """\
>Sequence_1  
ATG
TATA
>Sequence_2 
TATA
GACT
ATG""".splitlines()

# Built once and reused for every record. Both upper- and lower-case bases
# are complemented; any other character (e.g. N) passes through unchanged.
COMPLEMENT = str.maketrans('ACGTacgt', 'TGCAtgca')


def reverse_complement(seq):
    """Return the reverse complement of the nucleotide string *seq*."""
    return seq.translate(COMPLEMENT)[::-1]


def wrap_sequence(seq, width=50):
    """Split *seq* into newline-terminated rows of at most *width* characters.

    An empty *seq* gives an empty string.
    """
    return ''.join(seq[i:i + width] + '\n' for i in range(0, len(seq), width))


def reverse_complement_fasta(lines, width=50):
    """Yield the reverse-complemented FASTA text for *lines*, piece by piece.

    *lines* may be any iterable of strings (a list or an open file), so the
    input is consumed one line at a time and only the current record is held
    in memory. Header lines (starting with ``>``) are yielded with trailing
    whitespace removed; each record's sequence lines are joined,
    reverse-complemented and re-wrapped to *width* characters per row.
    """
    parts = []
    for line in lines:
        line = line.rstrip()
        if line.startswith('>'):
            # A new header ends the previous record: emit it first.
            if parts:
                yield wrap_sequence(reverse_complement(''.join(parts)), width)
                parts = []
            yield line + '\n'
        elif line:
            # Collect pieces and join once; repeated += is quadratic.
            parts.append(line)
    # The last record has no following header to trigger its output.
    if parts:
        yield wrap_sequence(reverse_complement(''.join(parts)), width)


for chunk in reverse_complement_fasta(file):
    print(chunk, end='')

输出：

>Sequence_1  
TATACAT
>Sequence_2 
CATAGTCTATA

相关问题更多 >

编程相关推荐

热门问题

热门文章