# parse_phobius.py
import re
import sys
from collections import defaultdict
from Bio import SeqIO
import pandas as pd
import click
@click.command(context_settings={'help_option_names': ('-h', '--help'), "max_content_width": 800})
@click.option('--phobius_file', '-t', default=None,
              type=click.Path(exists=True, file_okay=True, dir_okay=False, readable=True, resolve_path=True),
              required=True, show_default=True, help='Path to output of phobius file')
@click.option('--spphobius_output', '-o', default=None,
              type=click.Path(exists=False, file_okay=True, dir_okay=False, readable=True, resolve_path=True),
              required=True, show_default=True, help='Path to create output of secreted ID of sorted protein')
def main(phobius_file, spphobius_output):
    """Retrieve the IDs of secreted proteins from a Phobius output file.

    A record is kept when its second whitespace-separated field (TM) is
    "0" or "1" and its third field is "Y". The first field of every kept
    record is written to the output file, one ID per line, in input order.
    """
    # Fields after splitting on whitespace:
    #   fields[0] = sequence ID, fields[1] = TM value, fields[2] = "Y" flag
    #   (presumably the signal-peptide column of the Phobius short format).
    accepted_tm_values = ("0", "1")
    secreted_ids = []

    with open(phobius_file) as phobius_handle:
        for line in phobius_handle:
            fields = line.split()

            # Blank or truncated lines carry no usable record; skipping them
            # avoids an IndexError on the column look-ups below.
            if len(fields) < 3:
                continue

            # No header test on the first character is needed: a header row
            # can only pass if its 2nd and 3rd fields are literally "0"/"1"
            # and "Y". The previous pattern "^[^SEQUENCE]" was a negated
            # character class, so it also discarded every record whose ID
            # began with S, E, Q, U, N or C.
            if fields[1] in accepted_tm_values and fields[2] == "Y":
                secreted_ids.append(fields[0])

    # The context manager guarantees the output is flushed and closed even
    # if a write fails part-way through.
    with open(spphobius_output, "w") as output_handle:
        output_handle.writelines(seq_id + "\n" for seq_id in secreted_ids)
# Run the click command only when the file is executed as a script,
# not when it is imported as a module.
if __name__ == '__main__':
    main()