承接上一篇，本篇采用类对代码进行封装。
from Bio import SeqIO
import pandas as pd
from Bio.Seq import Seq
class GeneSeqExtractor:
def __init__(self, gtf_file, fasta_file):
self.gtf_file = gtf_file
self.fasta_file = fasta_file
self.gene_info = None
self.chrom_seqs = None
self.gene_seqs = None
def parse_gtf(self):
self.gene_info = pd.read_csv(self.gtf_file, sep='\t', comment='#', header=None,
usecols=[0,