From 299f5b7466bb8a5bbf6e61b22595e4769362cf3d Mon Sep 17 00:00:00 2001
From: SimonBache <simon.bache@etu.unistra.fr>
Date: Thu, 9 Jun 2022 11:11:54 +0200
Subject: [PATCH] changes count_effectors.py and gff_sort.py

---
 scripts/count_effectors.py | 6 +++---
 scripts/gff_sort.py        | 8 ++++----
 2 files changed, 7 insertions(+), 7 deletions(-)

diff --git a/scripts/count_effectors.py b/scripts/count_effectors.py
index 1afcf32..97def27 100644
--- a/scripts/count_effectors.py
+++ b/scripts/count_effectors.py
@@ -36,9 +36,9 @@ def main(gff, output, fasta_file):
         for lignes in f1:
                 ligne = lignes.rstrip("\n")
                 col = ligne.split("\t")
-                id_1 = re.sub("ID=", "", col[8])
-                id_2 = re.sub(";Name=\w+", "", id_1)
-                if col[2] =="gene":
+                if col[2] == "gene":
+                    id_1 = re.sub("ID=", "", col[8])
+                    id_2 = re.sub(";Name=\w+", "", id_1)
                     gff_parse.append(col[0]+" "+col[1]+" "+col[2]+" "+id_2)
                     dico_gff[col[0]].append(id_2)
 
diff --git a/scripts/gff_sort.py b/scripts/gff_sort.py
index 6c465f3..e90487d 100644
--- a/scripts/gff_sort.py
+++ b/scripts/gff_sort.py
@@ -22,10 +22,10 @@ def main(gff, output, strain_name):
     with open(gff, "r") as f1:
         for lignes in f1:
             col = lignes.split("\t")
-            if re.search("gene",col[2]):
-                id_strain = re.sub("ID=","ID="+strain_name+"_",col[8])
-                prot_gff = re.sub(";","T0;",id_strain)
-                gene_gff.append(col[0]+"\t"+col[1]+"\t"+col[2]+"\t"+col[3]+"\t"+col[4]+"\t"+col[5]+"\t"+col[6]+"\t"+col[7]+"\t"+prot_gff)
+            id_strain = re.sub("ID=","ID="+strain_name+"_",col[8])
+            prot_gff = re.sub(";","T0;",id_strain)
+            prot_gff = re.sub("T0T0", "T0", prot_gff)
+            gene_gff.append(col[0]+"\t"+col[1]+"\t"+col[2]+"\t"+col[3]+"\t"+col[4]+"\t"+col[5]+"\t"+col[6]+"\t"+col[7]+"\t"+prot_gff)
 
     output_file = open(output,"w")
     for elem in gene_gff:
-- 
GitLab