TRANSVIHMI
nfernandez
Reads_Quality_Control

Repository

# Install Miniconda3 on macOS (x86_64) into ~/miniconda3/.
# Steps, chained with && so that any failure stops the sequence:
#   1. download the installer script into the home directory
#      (--fail: an HTTP error aborts the chain instead of saving an error
#       page that would then be handed to bash; --location: follow redirects)
#   2. run the installer (-b and -p are installer options: unattended mode
#      and install prefix)
#   3. delete the installer script
#   4. update conda itself without prompting (--yes)
#   5. run `conda init`
#   6. exit the current shell -- presumably so that a freshly opened shell
#      picks up what `conda init` set up
curl --fail --location \
  https://repo.anaconda.com/miniconda/Miniconda3-latest-MacOSX-x86_64.sh \
  -o ~/Miniconda3-latest-MacOSX-x86_64.sh && \
bash ~/Miniconda3-latest-MacOSX-x86_64.sh -b -p ~/miniconda3/ && \
rm -f ~/Miniconda3-latest-MacOSX-x86_64.sh && \
~/miniconda3/condabin/conda update conda --yes && \
~/miniconda3/condabin/conda init && \
exit
# Install Miniconda3 on Linux (x86_64) into ~/miniconda3/.
# Steps, chained with && so that any failure stops the sequence:
#   1. download the installer script into the home directory
#      (--fail: an HTTP error aborts the chain instead of saving an error
#       page that would then be handed to bash; --location: follow redirects)
#   2. run the installer (-b and -p are installer options: unattended mode
#      and install prefix)
#   3. delete the installer script
#   4. update conda itself without prompting (--yes)
#   5. run `conda init`
#   6. exit the current shell -- presumably so that a freshly opened shell
#      picks up what `conda init` set up
curl --fail --location \
  https://repo.anaconda.com/miniconda/Miniconda3-latest-Linux-x86_64.sh \
  -o ~/Miniconda3-latest-Linux-x86_64.sh && \
bash ~/Miniconda3-latest-Linux-x86_64.sh -b -p ~/miniconda3/ && \
rm -f ~/Miniconda3-latest-Linux-x86_64.sh && \
~/miniconda3/condabin/conda update conda --yes && \
~/miniconda3/condabin/conda init && \
exit
# Update conda itself in the "base" environment from the "defaults" channel.
# No --yes is passed here, so confirmation is left to conda.
conda update --name base --channel defaults conda

# First-time setup: shallow clone (most recent commit only) into ~/GeVarLi/.
git clone --depth=1 \
  https://forge.ird.fr/transvihmi/nfernandez/GeVarLi.git \
  ~/GeVarLi/

# Update an existing clone.
# WARNING: `git reset --hard HEAD` discards uncommitted changes to tracked
# files before the pull.
cd ~/GeVarLi/ \
  && git reset --hard HEAD \
  && git pull -v
# Alternative to `git clone`: fetch the main-branch archive and unpack it
# as ~/GeVarLi/.
#   - curl --fail/--location: stop the chain on an HTTP error rather than
#     saving an error page as the tarball, and follow redirects.
#   - tar -C ~/: extract into the home directory regardless of the current
#     working directory, because the following `mv` expects ~/GeVarLi-main/.
#   - the downloaded archive is removed once it has been unpacked and renamed.
curl --fail --location \
  https://forge.ird.fr/transvihmi/nfernandez/GeVarLi/-/archive/main/GeVarLi-main.tar.gz \
  -o ~/GeVarLi-main.tar.gz && \
tar -xzvf ~/GeVarLi-main.tar.gz -C ~/ && \
mv ~/GeVarLi-main/ ~/GeVarLi/ && \
rm -f ~/GeVarLi-main.tar.gz
# Launch GeVarLi. The script is referenced by a relative path, so run this
# from the directory that contains Start_GeVarLi.sh (the top of GeVarLi/).
bash Start_GeVarLi.sh
 🧩 GeVarLi/
  ├── 📂 archives/
  │    └── 📦 Results_{YYYY-MM-DD_HHhMM}_{REFERENCE}_{ALIGNER}_{MINCOV}_{SAMPLES}_archive.tar.gz
  └── 📂 results/
       ├── 🧬 All_{REFERENCE}_consensus_sequences.fasta
       ├── 📊 All_{REFERENCE}_genome_coverages.tsv
       ├── 📊 All_{REFERENCE}_nextclade_lineages.tsv
       ├── 📊 All_{REFERENCE}_pangolin_lineages.tsv
       ├── 🌐 All_readsQC_reports.html
       ├── 📂 00_Quality_Control/
       │    ├── 📂 fastq-screen/
       │    │    ├── 🌐 {SAMPLE}_R{1/2}_screen.html
       │    │    ├── 📈 {SAMPLE}_R{1/2}_screen.png
       │    │    └── 📄 {SAMPLE}_R{1/2}_screen.txt
       │    ├── 📂 fastqc/
       │    │    ├── 🌐 {SAMPLE}_R{1/2}_fastqc.html
       │    │    └── 📦 {SAMPLE}_R{1/2}_fastqc.zip
       │    └── 📂 multiqc/
       │         ├── 🌐 multiqc_report.html
       │         └── 📂 multiqc_data/
       │              ├── 📝 multiqc.log
       │              ├── 📄 multiqc_citations.txt
       │              ├── 🌀 multiqc_data.json
       │              ├── 📄 multiqc_fastq_screen.txt
       │              ├── 📄 multiqc_fastqc.txt
       │              ├── 📄 multiqc_general_stats.txt
       │              └── 📄 multiqc_sources.txt
       ├── 📂 01_Trimmidapt/
       │    ├── 📂 cutadapt/
       │    │    └── 📦 {SAMPLE}_cutadapt-removed_R{1/2}.fastq.gz       # [temp]
       │    └── 📂 sickle/
       │         ├── 📦 {SAMPLE}_sickle-trimmed_R{1/2}.fastq.gz         # [temp]
       │         └── 📦 {SAMPLE}_sickle-trimmed_SE.fastq.gz             # [temp]
       ├── 📂 02_Mapping/
       │    ├── 🧭 {SAMPLE}_{REFERENCE}_{ALIGNER}_mark-dup.bam
       │    ├── 🗂️  {SAMPLE}_{REFERENCE}_{ALIGNER}_mark-dup.bam.bai
       │    ├── 🧭 {SAMPLE}_{REFERENCE}_{ALIGNER}_mark-dup.primerclipped.bam
       │    ├── 🗂️  {SAMPLE}_{REFERENCE}_{ALIGNER}_mark-dup.primerclipped.bam.bai
       │    ├── 🧭 {SAMPLE}_{ALIGNER}-mapped.sam                        # [temp]
       │    ├── 🧭 {SAMPLE}_{REFERENCE}_{ALIGNER}_sorted-by-names.bam               # [temp]
       │    ├── 🧭 {SAMPLE}_{REFERENCE}_{ALIGNER}_fixed-mate.bam                    # [temp]
       │    └── 🧭 {SAMPLE}_{REFERENCE}_{ALIGNER}_sorted.bam                        # [temp]
       ├── 📂 03_Coverage/
       │    ├── 📊 {SAMPLE}_{REFERENCE}_{ALIGNER}_{MINCOV}_coverage-stats.tsv
       │    ├── 🛏️  {SAMPLE}_{REFERENCE}_{ALIGNER}_genome-cov.bed                    # [temp]
       │    ├── 🛏️  {SAMPLE}_{REFERENCE}_{ALIGNER}_{MINCOV}_min-cov-filt.bed         # [temp]
       │    └── 🛏️  {SAMPLE}_{REFERENCE}_{ALIGNER}_{MINCOV}_low-cov-mask.bed         # [temp]
       ├── 📂 04_Variants/
       │    ├── 🧬 {SAMPLE}_{REFERENCE}_{ALIGNER}_{MINCOV}_masked-ref.fasta
       │    ├── 🗂️  {SAMPLE}_{REFERENCE}_{ALIGNER}_{MINCOV}_masked-ref.fasta.fai
       │    ├── 🧭 {SAMPLE}_{REFERENCE}_{ALIGNER}_{MINCOV}_indel-qual.bam
       │    ├── 🗂️  {SAMPLE}_{REFERENCE}_{ALIGNER}_{MINCOV}_indel-qual.bai
       │    ├── 🧮️  {SAMPLE}_{REFERENCE}_{ALIGNER}_{MINCOV}_variant-call.vcf
       │    ├── 🧮️  {SAMPLE}_{REFERENCE}_{ALIGNER}_{MINCOV}_variant-filt.vcf
       │    ├── 📦 {SAMPLE}_{REFERENCE}_{ALIGNER}_{MINCOV}_variant-filt.vcf.bgz     # [temp]
       │    └── 🗂️  {SAMPLE}_{REFERENCE}_{ALIGNER}_{MINCOV}_variant-filt.vcf.bgz.tbi # [temp]
       ├── 📂 05_Consensus/
       │    └── 🧬 {SAMPLE}_{REFERENCE}_{ALIGNER}_{MINCOV}_consensus.fasta
       ├── 📂 06_Lineages/
       │    ├── 📊 {SAMPLE}_{REFERENCE}_{ALIGNER}_{MINCOV}_nextclade-report.tsv
       │    ├── 📊 {SAMPLE}_{REFERENCE}_{ALIGNER}_{MINCOV}_pangolin-report.csv
       │    └── 📂 {SAMPLE}_{REFERENCE}_{ALIGNER}_{MINCOV}_nextclade-all/
       │         ├── 🧬 nextclade.aligned.fasta
       │         ├── 📊 nextclade.csv
       │         ├── 📊 nextclade.errors.csv
       │         ├── 📊 nextclade.insertions.csv
       │         ├── 🌀 nextclade.json
       │         ├── 🌀 nextclade.ndjson
       │         ├── 🌀 nextclade.auspice.json
       │         └── 🧬 nextclade_{GENE}.translation.fasta
       └── 📂 10_Reports/
            ├── ⚙️  config.log
            ├── 📝 settings.log
            ├── 🍜 gevarli-base_v.{VERSION}.yaml
            ├── 🍜 gevarli-tools_v.{VERSION}.yaml
            ├── 📂 files-summaries/
            │    └── 📄 {PIPELINE}_files-summary.txt
            ├── 📂 graphs/
            │    ├── 📈 {PIPELINE}_dag.{PNG/PDF}
            │    ├── 📈 {PIPELINE}_filegraph.{PNG/PDF}
            │    └── 📈 {PIPELINE}_rulegraph.{PNG/PDF}
            └── 📂 tools-log/
                 ├── 📂 awk/
                 ├── 📂 bcftools/
                 ├── 📂 bedtools/
                 ├── 📂 bgzip/
                 ├── 📂 bowtie2/
                 ├── 📂 bwa/
                 ├── 📂 cutadapt/
                 ├── 📂 lofreq/
                 ├── 📂 nextclade/
                 ├── 📂 pangolin/
                 ├── 📂 samtools/
                 ├── 📂 sed/
                 ├── 📂 sickle-trim/
                 ├── 📂 tabix/
                 ├── 📝 fastq-screen.log
                 ├── 📝 fastqc.log
                 └── 📝 multiqc.log
 🧩 GeVarLi/
 ├── 🖥️️  Start_GeVarLi.sh
 ├── 📚 README.md
 ├── 🪪 LICENSE
 ├── 🛑 .gitignore
 ├── 📂 .git/
 ├── 📂 .snakemake/
 ├── 📂 configuration/
 │    ├── ⚙️  config.yaml
 │    ├── ⚙️  fastq-screen.conf
 │    └── ⚙️  multiqc.yaml
 ├── 📂 resources/
 │    ├── 📂 genomes/
 │    │    ├── 🧬 SARS-CoV-2_Wuhan_MN-908947-3.fasta
 │    │    ├── 🧬 Monkeypox-virus_Zaire_AF-380138-1.fasta
 │    │    ├── 🧬 Monkeypox-virus_UK_MT-903345-1.fasta
 │    │    ├── 🧬 Swinepox-virus_India_MW-036632-1.fasta
 │    │    ├── 🧬 Ebola-virus_Zaire_AF-272001-1.fasta
 │    │    ├── 🧬 Ebola-virus_Sudan_MH-121162-1.fasta
 │    │    ├── 🧬 Nipah-virus_Malaysia_AJ-564622-1.fasta
 │    │    ├── 🧬 HIV-1_HXB2_K-03455-1.fasta
 │    │    ├── 🧬 {your_favorite_genome_reference}.fasta
 │    │    ├── 🧬 Echerichia-coli_CP-060121-1.fasta
 │    │    ├── 🧬 Kanamycin-Resistance-Gene.fasta
 │    │    ├── 🧬 NGS-adapters.fasta
 │    │    ├── 🧬 Phi-X174_Coliphage_NC-001422-1.fasta
 │    │    ├── 🧬 UniVec_wo_phiX-kanamycin-NGSseq.fasta
 │    │    └── 🧬 {your_favorite_control_reference}.fasta
 │    ├── 📂 indexes/
 │    │    ├── 📂 bwa/
 │    │    │    ├── 🗂️  {GENOME}.amb
 │    │    │    ├── 🗂️  {GENOME}.ann
 │    │    │    ├── 🗂️  {GENOME}.bwt
 │    │    │    ├── 🗂️  {GENOME}.pac
 │    │    │    └── 🗂️  {GENOME}.sa
 │    │    └── 📂 bowtie2/
 │    │         ├── 🗂️  {GENOME}.1.bt2
 │    │         ├── 🗂️  {GENOME}.2.bt2
 │    │         ├── 🗂️  {GENOME}.3.bt2
 │    │         ├── 🗂️  {GENOME}.4.bt2
 │    │         ├── 🗂️  {GENOME}.rev.1.bt2
 │    │         └── 🗂️  {GENOME}.rev.2.bt2
 │    ├── 📂 nextclade/
 │    │    ├── 📂 sars-cov-2/
 │    │    │    ├── 🌍 genemap.gff
 │    │    │    ├── 🧪 primers.csv
 │    │    │    ├── ✅ qc.json
 │    │    │    ├── 🦠 reference.fasta
 │    │    │    ├── 🧬 sequences.fasta
 │    │    │    ├── 🏷️  tag.json
 │    │    │    └── 🌳 tree.json
 │    │    ├── 📂 MPXV/
 │    │    │    ├── 🌍 genemap.gff
 │    │    │    ├── 🧪 primers.csv
 │    │    │    ├── ✅ qc.json
 │    │    │    ├── 🦠 reference.fasta
 │    │    │    ├── 🧬 sequences.fasta
 │    │    │    ├── 🏷️  tag.json
 │    │    │    └── 🌳 tree.json
 │    │    ├── 📂 hMPXV/
 │    │    │    ├── 🌍 genemap.gff
 │    │    │    ├── 🧪 primers.csv
 │    │    │    ├── ✅ qc.json
 │    │    │    ├── 🦠 reference.fasta
 │    │    │    ├── 🧬 sequences.fasta
 │    │    │    ├── 🏷️  tag.json
 │    │    │    └── 🌳 tree.json
 │    │    └── 📂 hMPXV_B1/
 │    │         ├── 🌍 genemap.gff
 │    │         ├── 🧪 primers.csv
 │    │         ├── ✅ qc.json
 │    │         ├── 🦠 reference.fasta
 │    │         ├── 🧬 sequences.fasta
 │    │         ├── 🏷️  tag.json
 │    │         └── 🌳 tree.json
 │    ├── 📂 reads/
 │    │    ├── 🛡️  .gitkeep
 │    │    ├── 📦 {SAMPLE}_R1.fastq.gz
 │    │    └── 📦 {SAMPLE}_R2.fastq.gz
 │    ├── 📂 test_data/
 │    │    ├── 🛡️  .gitkeep
 │    │    ├── 📦 SARS-CoV-2_Omicron-BA.1.1_Covid-Seq-Lib-on-MiSeq_250000-reads_R1.fastq.gz
 │    │    └── 📦 SARS-CoV-2_Omicron-BA.1.1_Covid-Seq-Lib-on-MiSeq_250000-reads_R2.fastq.gz
 │    └── 📂 visuals/
 │         ├── 📈 gevarli_filegraph.png
 │         ├── 📈 gevarli_rulegraph.png
 │         ├── 📈 indexing_genomes_rulegraph.png
 │         └── 📈 quality_control_rulegraph.png
 └── 📂 workflow/
      ├── 📂 environments/
      │    ├── 📂 linux/
      │    │    ├── 🍜 bamclipper_v.1.0.0.yaml
      │    │    ├── 🍜 bcftools_v.1.17.yaml
      │    │    ├── 🍜 bedtools_v.2.31.0.yaml
      │    │    ├── 🍜 bowtie2_v.2.5.1.yaml
      │    │    ├── 🍜 bwa_v.0.7.17.yaml
      │    │    ├── 🍜 cutadapt_v.4.4.yaml
      │    │    ├── 🍜 fastq-screen_v.0.15.3.yaml
      │    │    ├── 🍜 fastqc_v.0.12.1.yaml
      │    │    ├── 🍜 gawk_v.5.1.0.yaml
      │    │    ├── 🍜 lofreq_v.2.1.5.yaml
      │    │    ├── 🍜 multiqc_v.1.14.yaml
      │    │    ├── 🍜 nextclade_v.2.14.0.yaml
      │    │    ├── 🍜 pangolin_v.4.3.yaml
      │    │    ├── 🍜 samtools_v.1.17.yaml
      │    │    ├── 🍜 sickle-trim_v.1.33.yaml
      │    │    └── 🍜 workflow-base_v.2023.06.yaml
      │    └── 📂 osx/
      │         ├── 🍜 bamclipper_v.1.0.0.yaml
      │         ├── 🍜 bcftools_v.1.17.yaml
      │         ├── 🍜 bedtools_v.2.31.0.yaml
      │         ├── 🍜 bowtie2_v.2.5.1.yaml
      │         ├── 🍜 bwa_v.0.7.17.yaml
      │         ├── 🍜 cutadapt_v.4.4.yaml
      │         ├── 🍜 fastq-screen_v.0.15.3.yaml
      │         ├── 🍜 fastqc_v.0.12.1.yaml
      │         ├── 🍜 gawk_v.5.1.0.yaml
      │         ├── 🍜 lofreq_v.2.1.5.yaml
      │         ├── 🍜 multiqc_v.1.14.yaml
      │         ├── 🍜 nextclade_v.2.14.0.yaml
      │         ├── 🍜 pangolin_v.4.3.yaml
      │         ├── 🍜 samtools_v.1.17.yaml
      │         ├── 🍜 sickle-trim_v.1.33.yaml
      │         └── 🍜 workflow-base_v.2023.06.yaml
      └── 📂 snakefiles/
           ├── 📜 gevarli.smk
           ├── 📜 indexing_genomes.smk
           └── 📜 quality_control.smk