From 299f5b7466bb8a5bbf6e61b22595e4769362cf3d Mon Sep 17 00:00:00 2001 From: SimonBache <simon.bache@etu.unistra.fr> Date: Thu, 9 Jun 2022 11:11:54 +0200 Subject: [PATCH] changes count_effectors.py and gff_sort.py --- scripts/count_effectors.py | 6 +++--- scripts/gff_sort.py | 8 ++++---- 2 files changed, 7 insertions(+), 7 deletions(-) diff --git a/scripts/count_effectors.py b/scripts/count_effectors.py index 1afcf32..97def27 100644 --- a/scripts/count_effectors.py +++ b/scripts/count_effectors.py @@ -36,9 +36,9 @@ def main(gff, output, fasta_file): for lignes in f1: ligne = lignes.rstrip("\n") col = ligne.split("\t") - id_1 = re.sub("ID=", "", col[8]) - id_2 = re.sub(";Name=\w+", "", id_1) - if col[2] =="gene": + if col[2] == "gene": + id_1 = re.sub("ID=", "", col[8]) + id_2 = re.sub(";Name=\w+", "", id_1) gff_parse.append(col[0]+" "+col[1]+" "+col[2]+" "+id_2) dico_gff[col[0]].append(id_2) diff --git a/scripts/gff_sort.py b/scripts/gff_sort.py index 6c465f3..e90487d 100644 --- a/scripts/gff_sort.py +++ b/scripts/gff_sort.py @@ -22,10 +22,10 @@ def main(gff, output, strain_name): with open(gff, "r") as f1: for lignes in f1: col = lignes.split("\t") - if re.search("gene",col[2]): - id_strain = re.sub("ID=","ID="+strain_name+"_",col[8]) - prot_gff = re.sub(";","T0;",id_strain) - gene_gff.append(col[0]+"\t"+col[1]+"\t"+col[2]+"\t"+col[3]+"\t"+col[4]+"\t"+col[5]+"\t"+col[6]+"\t"+col[7]+"\t"+prot_gff) + id_strain = re.sub("ID=","ID="+strain_name+"_",col[8]) + prot_gff = re.sub(";","T0;",id_strain) + prot_gff = re.sub("T0T0", "T0", prot_gff) + gene_gff.append(col[0]+"\t"+col[1]+"\t"+col[2]+"\t"+col[3]+"\t"+col[4]+"\t"+col[5]+"\t"+col[6]+"\t"+col[7]+"\t"+prot_gff) output_file = open(output,"w") for elem in gene_gff: -- GitLab