去除序列中的*号

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
import os
import re
import argparse
import subprocess


parser = argparse.ArgumentParser(description="You should add those parameters")
parser.add_argument("-i","--input", type = str, help = "The input fasta file")
parser.add_argument("-o","--output", type = str, help = "The output fasta file")
#args = parser.parse_args()
args =parser.parse_known_args()[0]

# 输入的fasta文件转换成字典
file_open = open(args.input,"r")
file_read = file_open.readlines()
file_new = open(args.output,"w")
for line in file_read:
if "*" in line:
line = line.replace("*","") + "\n"
else:
line = line
line = line.replace(">","\n>")
file_new.write(line)

# 保存文件
file_new.close()

# 去除空行
comm = "sed -i '/^$/d' " + args.output
subprocess.call(comm,shell=True)

💌lixiang117423@foxmail.com
💌lixiang117423@gmail.com


去除序列中的*号
https://lixiang117423.github.io/article/removestarfromfa/
作者
小蓝哥
发布于
2022年4月7日
许可协议