# Collect the accession field from every FASTA header line in SwissProt.fasta.
#
# Header lines start with '>' and are split on '|'; the element at index 1
# is taken as the accession (index 0 is the '>sp' prefix, index 2 is the
# entry name plus description). Sequence lines are ignored.
#
# A header line that contains no '|' raises IndexError, as in the original
# loop; every header in the expected input carries at least two '|' fields.
#
# The `with` block guarantees the file handle is closed, even if parsing
# fails part-way through. The encoding is given explicitly so the result
# does not depend on the platform's default code page.
with open('SwissProt.fasta', 'r', encoding='utf-8') as fasta_file:
    ac_list = [
        line.split('|')[1]
        for line in fasta_file
        if line.startswith('>')
    ]

print(ac_list)
结果:
['Q664P8', 'Q66K14', 'Q8K9I1', 'Q664P8', 'Q66K14', 'Q8E4B4', 'B3CQ06', 'Q9ATB4', 'Q83JA5', 'P14213', 'Q7SZM9', 'Q9FGE9']
ac_list.append(fields[0])时,结果:
['>sp', '>sp', '>sp', '>sp', '>sp', '>sp', '>sp', '>sp', '>sp', '>sp', '>sp', '>sp']
ac_list.append(fields[2])时,结果:
D:\Users\LeiLe\AppData\Local\Programs\Python\Python37\python.exe "D:/Program Files/pywork/Swissprot.py"
['TAUB_YERPS Taurine import ATP-binding protein TauB OS=Yersinia pseudotuberculosis serotype I (strain IP32953) OX=273123 GN=tauB PE=3 SV=1\n', 'TBC9B_HUMAN TBC1 domain family member 9B OS=Homo sapiens OX=9606 GN=TBC1D9B PE=1 SV=3\n', 'SYV_BUCAP Valine--tRNA ligase OS=Buchnera aphidicola subsp. Schizaphis graminum (strain Sg) OX=198804 GN=valS PE=3 SV=1\n', 'TAUB_YERPS Taurine import ATP-binding protein TauB OS=Yersinia pseudotuberculosis serotype I (strain IP32953) OX=273123 GN=tauB PE=3 SV=1\n', 'TBC9B_HUMAN TBC1 domain family member 9B OS=Homo sapiens OX=9606 GN=TBC1D9B PE=1 SV=3\n', 'TARI_STRA3 Ribitol-5-phosphate cytidylyltransferase OS=Streptococcus agalactiae serotype III (strain NEM316) OX=211110 GN=tarI PE=3 SV=1\n', 'SYS_WOLPP Serine--tRNA ligase OS=Wolbachia pipientis subsp. Culex pipiens (strain wPip) OX=570417 GN=serS PE=3 SV=1\n', 'TAD2B_ARATH Transcriptional adapter ADA2b OS=Arabidopsis thaliana OX=3702 GN=ADA2B PE=1 SV=1\n', 'SYW_SHIFL Tryptophan--tRNA ligase OS=Shigella flexneri OX=623 GN=trpS PE=3 SV=1\n', 'TAC1_TACTR Tachyplesin-1 OS=Tachypleus tridentatus OX=6853 PE=1 SV=2\n', 'TB1RA_XENLA F-box-like/WD repeat-containing protein TBL1XR1-A OS=Xenopus laevis OX=8355 GN=tbl1xr1-a PE=1 SV=1\n', 'TBL12_ARATH Protein trichome birefringence-like 12 OS=Arabidopsis thaliana OX=3702 GN=TBL12 PE=2 SV=1\n']
Process finished with exit code 0