概要
from Bio import SeqIO fasta_file = 'test/test.fna' fasta = SeqIO.parse(fasta_file, 'fasta') # SeqRecord object r1 = next(fasta) print(r1.id) print(r1.description) print(len(r1)) r1_seq = r1.seq r1_seq[1806:2169].reverse_complement().translate()
from Bio import SeqIO fasta_file = 'test/test.fna' fasta = SeqIO.parse(fasta_file, 'fasta') # 1> file全体の処理 for r in fasta:
from Bio import SeqIO fasta_file = 'test/test.fna' # 2> file全体の処理2 fasta = list(SeqIO.parse(fasta_file, 'fasta'))
from Bio import SeqIO protein_fasta_file = 'test/test.faa' output = 'tmp.faa' fasta = SeqIO.parse(protein_fasta_file, 'fasta') threshold = 1000 fasta = [ r for r in fasta if len(r) >= threshold] fasta = sorted(fasta, key=len, reverse=True) with open(output, 'w') as f: SeqIO.write(fasta, f, 'fasta')
from Bio import SeqIO fasta_file = 'test/test.fna' fasta = SeqIO.parse(fasta_file, 'fasta') f = {r.id: r for r in fasta} print(f.keys()) print(f['NC_001140.6'])
from Bio import SeqIO from pyfaidx import Fasta fasta_file = 'test/test.fna' fasta = Fasta(fasta_file) # *.fai index fileが自動生成 # dict同様に使用可能 fasta.get_seq('NC_001140.6', 101, 200, rc=True)