#!/usr/bin/python
# -*- coding: utf-8 -*-
"""Process a FASTA file so that each record's ID and sequence share one line.

Usage: python <this script> input.fasta

The whole input file is read, every line break is removed, and a line break
is re-inserted in front of every '>' character.  The result is written to
``out.fasta`` in the current working directory.

Example input:

    >chr1|hos107.1#gene1
    ACACTCCCGGGCCCCCCCCCCCCACCTTTCAAAAAAAAAAAAAAAAATTTTCCCCCCAAAGGGG>chr1|hos107.2#gene2
    ACACTCCCGGGCCCCCCCCCCCCACCTTTCAAAAAAAAAAAAAAAAATTTTC
    >chr1|hos107.4#gene3
    ACACTCCCGGGCCCCCCCCCCCCACCTTTCAAAAAAAAAAAAAAAAATTTTC
    >chr1|hos107.5#gene4
    ACACTCCCGGGCCCCCCCCCCCCACCTTTCAAAAAAAAAAAAAAAAATTTTC

Resulting out.fasta (preceded by one empty line, because the first '>' also
gets a line break put in front of it; there is no trailing line break):

    >chr1|hos107.1#gene1ACACTCCCGGGCCCCCCCCCCCCACCTTTCAAAAAAAAAAAAAAAAATTTTCCCCCCAAAGGGG
    >chr1|hos107.2#gene2ACACTCCCGGGCCCCCCCCCCCCACCTTTCAAAAAAAAAAAAAAAAATTTTC
    >chr1|hos107.4#gene3ACACTCCCGGGCCCCCCCCCCCCACCTTTCAAAAAAAAAAAAAAAAATTTTC
    >chr1|hos107.5#gene4ACACTCCCGGGCCCCCCCCCCCCACCTTTCAAAAAAAAAAAAAAAAATTTTC
"""
import sys


def flatten_fasta(text):
    """Return *text* with every FASTA record collapsed onto a single line.

    All newline characters are removed, then a newline is inserted before
    each '>'.  The ID and the sequence are joined without any separator.
    If *text* contains a '>', the result therefore starts with a newline
    and never ends with one.
    """
    # Order matters: strip the line breaks first, then start a fresh line
    # at every record marker.
    return text.replace('\n', '').replace('>', '\n>')


def run_flatten(in_path, out_path='out.fasta'):
    """Read the FASTA file *in_path* and write its flattened form to *out_path*.

    The input is read completely before the output file is opened, so a
    failed read does not leave a truncated output file behind.
    """
    with open(in_path) as src:
        flattened = flatten_fasta(src.read())
    # A single write replaces the per-character write loop.
    with open(out_path, 'w') as dst:
        dst.write(flattened)


if __name__ == '__main__':
    if len(sys.argv) < 2:
        sys.exit('usage: %s input.fasta' % sys.argv[0])
    run_flatten(sys.argv[1])
# Extract the target sequence.
#
# Records whose line starts with the target ID are copied from out.fasta
# (the one-record-per-line file) into target.fasta.

# Line prefix identifying the record(s) to extract.
TARGET_ID_PREFIX = '>chr1|hos107.1'


def select_records(lines, prefix=TARGET_ID_PREFIX):
    """Yield each item of *lines* that starts with *prefix*.

    *lines* may be any iterable of strings, e.g. an open text file.
    NOTE: this is a plain prefix test, so an ID that merely begins with the
    target (for example '>chr1|hos107.10') is selected as well.
    """
    return (line for line in lines if line.startswith(prefix))


def run_extract(prefix=TARGET_ID_PREFIX, in_path='./out.fasta',
                out_path='target.fasta'):
    """Copy the lines of *in_path* that start with *prefix* to *out_path*."""
    # Both handles are closed even if reading or writing raises.
    with open(in_path, 'r') as src, open(out_path, 'w') as dst:
        # Iterate the file lazily instead of loading it with readlines().
        dst.writelines(select_records(src, prefix))


if __name__ == '__main__':
    run_extract()
#整体思路:
#先统一fasta文件格式:从test.fasta----out.fasta
#取出目标ID序列:out.fasta----target.fasta
# 因篇幅问题不能全部显示,请点此查看更多更全内容
# Copyright © 2019- jqkq.cn 版权所有 赣ICP备2024042794号-4
# 违法及侵权请联系:TEL:199 1889 7713 E-MAIL:2724546146@qq.com
# 本站由北京市万商天勤律师事务所王兴未律师提供法律服务